{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "global_step": 37211, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 1.7905102954341989e-06, "loss": 6.1826, "step": 1 }, { "epoch": 0.0, "learning_rate": 3.5810205908683977e-06, "loss": 6.8213, "step": 2 }, { "epoch": 0.0, "learning_rate": 5.371530886302596e-06, "loss": 5.572, "step": 3 }, { "epoch": 0.0, "learning_rate": 7.162041181736795e-06, "loss": 5.3955, "step": 4 }, { "epoch": 0.0, "learning_rate": 8.952551477170994e-06, "loss": 5.7434, "step": 5 }, { "epoch": 0.0, "learning_rate": 1.0743061772605193e-05, "loss": 5.4297, "step": 6 }, { "epoch": 0.0, "learning_rate": 1.2533572068039392e-05, "loss": 5.7735, "step": 7 }, { "epoch": 0.0, "learning_rate": 1.432408236347359e-05, "loss": 5.8672, "step": 8 }, { "epoch": 0.0, "learning_rate": 1.611459265890779e-05, "loss": 7.4761, "step": 9 }, { "epoch": 0.0, "learning_rate": 1.7905102954341987e-05, "loss": 6.0311, "step": 10 }, { "epoch": 0.0, "learning_rate": 1.9695613249776186e-05, "loss": 6.3132, "step": 11 }, { "epoch": 0.0, "learning_rate": 2.1486123545210385e-05, "loss": 5.9963, "step": 12 }, { "epoch": 0.0, "learning_rate": 2.3276633840644584e-05, "loss": 6.2576, "step": 13 }, { "epoch": 0.0, "learning_rate": 2.5067144136078783e-05, "loss": 5.9447, "step": 14 }, { "epoch": 0.0, "learning_rate": 2.685765443151298e-05, "loss": 5.7409, "step": 15 }, { "epoch": 0.0, "learning_rate": 2.864816472694718e-05, "loss": 5.8309, "step": 16 }, { "epoch": 0.0, "learning_rate": 3.043867502238138e-05, "loss": 6.3418, "step": 17 }, { "epoch": 0.0, "learning_rate": 3.222918531781558e-05, "loss": 5.9853, "step": 18 }, { "epoch": 0.0, "learning_rate": 3.4019695613249775e-05, "loss": 5.9629, "step": 19 }, { "epoch": 0.0, "learning_rate": 3.5810205908683974e-05, "loss": 5.7306, "step": 20 }, { "epoch": 0.0, "learning_rate": 3.7600716204118174e-05, "loss": 5.2967, "step": 21 }, { "epoch": 0.0, "learning_rate": 3.939122649955237e-05, "loss": 5.6911, "step": 22 }, { "epoch": 0.0, "learning_rate": 4.118173679498657e-05, "loss": 5.5883, "step": 23 }, { "epoch": 0.0, "learning_rate": 4.297224709042077e-05, "loss": 6.063, "step": 24 }, { "epoch": 0.0, "learning_rate": 4.476275738585497e-05, "loss": 5.8071, "step": 25 }, { "epoch": 0.0, "learning_rate": 4.655326768128917e-05, "loss": 5.5738, "step": 26 }, { "epoch": 0.0, "learning_rate": 4.834377797672337e-05, "loss": 6.062, "step": 27 }, { "epoch": 0.0, "learning_rate": 5.013428827215757e-05, "loss": 5.8632, "step": 28 }, { "epoch": 0.0, "learning_rate": 5.1924798567591766e-05, "loss": 5.3881, "step": 29 }, { "epoch": 0.0, "learning_rate": 5.371530886302596e-05, "loss": 5.9246, "step": 30 }, { "epoch": 0.0, "learning_rate": 5.550581915846016e-05, "loss": 5.3834, "step": 31 }, { "epoch": 0.0, "learning_rate": 5.729632945389436e-05, "loss": 5.8481, "step": 32 }, { "epoch": 0.0, "learning_rate": 5.908683974932856e-05, "loss": 5.2308, "step": 33 }, { "epoch": 0.0, "learning_rate": 6.087735004476276e-05, "loss": 5.1837, "step": 34 }, { "epoch": 0.0, "learning_rate": 6.266786034019697e-05, "loss": 5.0742, "step": 35 }, { "epoch": 0.0, "learning_rate": 6.445837063563117e-05, "loss": 5.4956, "step": 36 }, { "epoch": 0.0, "learning_rate": 6.624888093106537e-05, "loss": 5.9875, "step": 37 }, { "epoch": 0.0, "learning_rate": 6.803939122649955e-05, "loss": 5.3769, "step": 38 }, { "epoch": 0.0, "learning_rate": 6.982990152193375e-05, "loss": 5.7253, "step": 39 }, { "epoch": 0.0, "learning_rate": 7.162041181736795e-05, "loss": 5.7492, "step": 40 }, { "epoch": 0.0, "learning_rate": 7.341092211280215e-05, "loss": 6.1361, "step": 41 }, { "epoch": 0.0, "learning_rate": 7.520143240823635e-05, "loss": 5.5321, "step": 42 }, { "epoch": 0.0, "learning_rate": 7.699194270367055e-05, "loss": 5.0738, "step": 43 }, { "epoch": 0.0, "learning_rate": 7.878245299910475e-05, "loss": 5.0518, "step": 44 }, { "epoch": 0.0, "learning_rate": 8.057296329453894e-05, "loss": 5.3827, "step": 45 }, { "epoch": 0.0, "learning_rate": 8.236347358997314e-05, "loss": 5.5468, "step": 46 }, { "epoch": 0.0, "learning_rate": 8.415398388540734e-05, "loss": 5.578, "step": 47 }, { "epoch": 0.0, "learning_rate": 8.594449418084154e-05, "loss": 5.6742, "step": 48 }, { "epoch": 0.0, "learning_rate": 8.773500447627574e-05, "loss": 5.521, "step": 49 }, { "epoch": 0.0, "learning_rate": 8.952551477170994e-05, "loss": 5.2121, "step": 50 }, { "epoch": 0.0, "learning_rate": 9.131602506714414e-05, "loss": 5.5945, "step": 51 }, { "epoch": 0.0, "learning_rate": 9.310653536257834e-05, "loss": 6.3142, "step": 52 }, { "epoch": 0.0, "learning_rate": 9.489704565801254e-05, "loss": 5.7057, "step": 53 }, { "epoch": 0.0, "learning_rate": 9.668755595344674e-05, "loss": 5.4487, "step": 54 }, { "epoch": 0.0, "learning_rate": 9.847806624888093e-05, "loss": 5.4613, "step": 55 }, { "epoch": 0.0, "learning_rate": 0.00010026857654431513, "loss": 5.2324, "step": 56 }, { "epoch": 0.0, "learning_rate": 0.00010205908683974933, "loss": 6.0, "step": 57 }, { "epoch": 0.0, "learning_rate": 0.00010384959713518353, "loss": 5.9019, "step": 58 }, { "epoch": 0.0, "learning_rate": 0.00010564010743061773, "loss": 5.7448, "step": 59 }, { "epoch": 0.0, "learning_rate": 0.00010743061772605192, "loss": 4.7486, "step": 60 }, { "epoch": 0.0, "learning_rate": 0.00010922112802148612, "loss": 5.6497, "step": 61 }, { "epoch": 0.0, "learning_rate": 0.00011101163831692031, "loss": 5.5156, "step": 62 }, { "epoch": 0.0, "learning_rate": 0.00011280214861235453, "loss": 5.6869, "step": 63 }, { "epoch": 0.0, "learning_rate": 0.00011459265890778873, "loss": 5.4785, "step": 64 }, { "epoch": 0.0, "learning_rate": 0.00011638316920322293, "loss": 6.2784, "step": 65 }, { "epoch": 0.0, "learning_rate": 0.00011817367949865712, "loss": 5.8701, "step": 66 }, { "epoch": 0.0, "learning_rate": 0.00011996418979409132, "loss": 5.4097, "step": 67 }, { "epoch": 0.0, "learning_rate": 0.00012175470008952552, "loss": 5.751, "step": 68 }, { "epoch": 0.0, "learning_rate": 0.00012354521038495972, "loss": 5.3207, "step": 69 }, { "epoch": 0.0, "learning_rate": 0.00012533572068039393, "loss": 5.4571, "step": 70 }, { "epoch": 0.0, "learning_rate": 0.00012712623097582812, "loss": 5.4739, "step": 71 }, { "epoch": 0.0, "learning_rate": 0.00012891674127126233, "loss": 5.5135, "step": 72 }, { "epoch": 0.0, "learning_rate": 0.00013070725156669652, "loss": 5.5011, "step": 73 }, { "epoch": 0.0, "learning_rate": 0.00013249776186213073, "loss": 4.9623, "step": 74 }, { "epoch": 0.0, "learning_rate": 0.00013428827215756492, "loss": 5.4076, "step": 75 }, { "epoch": 0.0, "learning_rate": 0.0001360787824529991, "loss": 4.9327, "step": 76 }, { "epoch": 0.0, "learning_rate": 0.0001378692927484333, "loss": 5.6639, "step": 77 }, { "epoch": 0.0, "learning_rate": 0.0001396598030438675, "loss": 5.3374, "step": 78 }, { "epoch": 0.0, "learning_rate": 0.00014145031333930169, "loss": 5.4614, "step": 79 }, { "epoch": 0.0, "learning_rate": 0.0001432408236347359, "loss": 5.6015, "step": 80 }, { "epoch": 0.0, "learning_rate": 0.00014503133393017008, "loss": 5.6592, "step": 81 }, { "epoch": 0.0, "learning_rate": 0.0001468218442256043, "loss": 5.8598, "step": 82 }, { "epoch": 0.0, "learning_rate": 0.0001486123545210385, "loss": 5.0475, "step": 83 }, { "epoch": 0.0, "learning_rate": 0.0001504028648164727, "loss": 5.4381, "step": 84 }, { "epoch": 0.0, "learning_rate": 0.0001521933751119069, "loss": 5.7197, "step": 85 }, { "epoch": 0.0, "learning_rate": 0.0001539838854073411, "loss": 5.0679, "step": 86 }, { "epoch": 0.0, "learning_rate": 0.0001557743957027753, "loss": 5.2652, "step": 87 }, { "epoch": 0.0, "learning_rate": 0.0001575649059982095, "loss": 5.3016, "step": 88 }, { "epoch": 0.0, "learning_rate": 0.0001593554162936437, "loss": 5.7023, "step": 89 }, { "epoch": 0.0, "learning_rate": 0.0001611459265890779, "loss": 5.1533, "step": 90 }, { "epoch": 0.0, "learning_rate": 0.0001629364368845121, "loss": 5.4728, "step": 91 }, { "epoch": 0.0, "learning_rate": 0.0001647269471799463, "loss": 5.1333, "step": 92 }, { "epoch": 0.0, "learning_rate": 0.0001665174574753805, "loss": 5.5092, "step": 93 }, { "epoch": 0.0, "learning_rate": 0.00016830796777081468, "loss": 5.1976, "step": 94 }, { "epoch": 0.0, "learning_rate": 0.0001700984780662489, "loss": 5.2945, "step": 95 }, { "epoch": 0.0, "learning_rate": 0.00017188898836168308, "loss": 5.4452, "step": 96 }, { "epoch": 0.0, "learning_rate": 0.00017367949865711727, "loss": 5.2503, "step": 97 }, { "epoch": 0.0, "learning_rate": 0.00017547000895255148, "loss": 5.2474, "step": 98 }, { "epoch": 0.0, "learning_rate": 0.00017726051924798567, "loss": 5.0333, "step": 99 }, { "epoch": 0.0, "learning_rate": 0.00017905102954341988, "loss": 5.0758, "step": 100 }, { "epoch": 0.0, "learning_rate": 0.00018084153983885406, "loss": 5.1012, "step": 101 }, { "epoch": 0.0, "learning_rate": 0.00018263205013428828, "loss": 5.8717, "step": 102 }, { "epoch": 0.0, "learning_rate": 0.00018442256042972246, "loss": 5.1825, "step": 103 }, { "epoch": 0.0, "learning_rate": 0.00018621307072515668, "loss": 5.1728, "step": 104 }, { "epoch": 0.0, "learning_rate": 0.00018800358102059086, "loss": 5.4939, "step": 105 }, { "epoch": 0.0, "learning_rate": 0.00018979409131602507, "loss": 5.1274, "step": 106 }, { "epoch": 0.0, "learning_rate": 0.00019158460161145926, "loss": 4.8049, "step": 107 }, { "epoch": 0.0, "learning_rate": 0.00019337511190689347, "loss": 5.441, "step": 108 }, { "epoch": 0.0, "learning_rate": 0.00019516562220232766, "loss": 5.3848, "step": 109 }, { "epoch": 0.0, "learning_rate": 0.00019695613249776187, "loss": 6.0025, "step": 110 }, { "epoch": 0.0, "learning_rate": 0.00019874664279319608, "loss": 5.5571, "step": 111 }, { "epoch": 0.0, "learning_rate": 0.00020053715308863027, "loss": 5.6561, "step": 112 }, { "epoch": 0.0, "learning_rate": 0.00020232766338406448, "loss": 5.2902, "step": 113 }, { "epoch": 0.0, "learning_rate": 0.00020411817367949867, "loss": 4.9122, "step": 114 }, { "epoch": 0.0, "learning_rate": 0.00020590868397493288, "loss": 5.1986, "step": 115 }, { "epoch": 0.0, "learning_rate": 0.00020769919427036706, "loss": 5.1434, "step": 116 }, { "epoch": 0.0, "learning_rate": 0.00020948970456580128, "loss": 5.4702, "step": 117 }, { "epoch": 0.0, "learning_rate": 0.00021128021486123546, "loss": 4.8427, "step": 118 }, { "epoch": 0.0, "learning_rate": 0.00021307072515666965, "loss": 4.7161, "step": 119 }, { "epoch": 0.0, "learning_rate": 0.00021486123545210383, "loss": 5.4529, "step": 120 }, { "epoch": 0.0, "learning_rate": 0.00021665174574753805, "loss": 5.3212, "step": 121 }, { "epoch": 0.0, "learning_rate": 0.00021844225604297223, "loss": 5.4355, "step": 122 }, { "epoch": 0.0, "learning_rate": 0.00022023276633840644, "loss": 5.1143, "step": 123 }, { "epoch": 0.0, "learning_rate": 0.00022202327663384063, "loss": 4.8161, "step": 124 }, { "epoch": 0.0, "learning_rate": 0.00022381378692927484, "loss": 4.9862, "step": 125 }, { "epoch": 0.0, "learning_rate": 0.00022560429722470905, "loss": 4.9511, "step": 126 }, { "epoch": 0.0, "learning_rate": 0.00022739480752014324, "loss": 5.5627, "step": 127 }, { "epoch": 0.0, "learning_rate": 0.00022918531781557745, "loss": 5.1222, "step": 128 }, { "epoch": 0.0, "learning_rate": 0.00023097582811101164, "loss": 5.1012, "step": 129 }, { "epoch": 0.0, "learning_rate": 0.00023276633840644585, "loss": 5.4852, "step": 130 }, { "epoch": 0.0, "learning_rate": 0.00023455684870188004, "loss": 4.5526, "step": 131 }, { "epoch": 0.0, "learning_rate": 0.00023634735899731425, "loss": 5.1244, "step": 132 }, { "epoch": 0.0, "learning_rate": 0.00023813786929274843, "loss": 4.9629, "step": 133 }, { "epoch": 0.0, "learning_rate": 0.00023992837958818265, "loss": 5.3469, "step": 134 }, { "epoch": 0.0, "learning_rate": 0.00024171888988361683, "loss": 5.7059, "step": 135 }, { "epoch": 0.0, "learning_rate": 0.00024350940017905105, "loss": 4.5826, "step": 136 }, { "epoch": 0.0, "learning_rate": 0.00024529991047448523, "loss": 5.4452, "step": 137 }, { "epoch": 0.0, "learning_rate": 0.00024709042076991944, "loss": 4.9594, "step": 138 }, { "epoch": 0.0, "learning_rate": 0.00024888093106535366, "loss": 5.1658, "step": 139 }, { "epoch": 0.0, "learning_rate": 0.00025067144136078787, "loss": 5.3831, "step": 140 }, { "epoch": 0.0, "learning_rate": 0.00025246195165622203, "loss": 5.522, "step": 141 }, { "epoch": 0.0, "learning_rate": 0.00025425246195165624, "loss": 4.7598, "step": 142 }, { "epoch": 0.0, "learning_rate": 0.00025604297224709045, "loss": 4.8058, "step": 143 }, { "epoch": 0.0, "learning_rate": 0.00025783348254252467, "loss": 5.1982, "step": 144 }, { "epoch": 0.0, "learning_rate": 0.0002596239928379588, "loss": 5.0529, "step": 145 }, { "epoch": 0.0, "learning_rate": 0.00026141450313339304, "loss": 4.7906, "step": 146 }, { "epoch": 0.0, "learning_rate": 0.00026320501342882725, "loss": 4.7997, "step": 147 }, { "epoch": 0.0, "learning_rate": 0.00026499552372426146, "loss": 4.748, "step": 148 }, { "epoch": 0.0, "learning_rate": 0.0002667860340196956, "loss": 4.9114, "step": 149 }, { "epoch": 0.0, "learning_rate": 0.00026857654431512983, "loss": 4.8683, "step": 150 }, { "epoch": 0.0, "learning_rate": 0.000270367054610564, "loss": 5.2543, "step": 151 }, { "epoch": 0.0, "learning_rate": 0.0002721575649059982, "loss": 5.2464, "step": 152 }, { "epoch": 0.0, "learning_rate": 0.0002739480752014324, "loss": 4.5451, "step": 153 }, { "epoch": 0.0, "learning_rate": 0.0002757385854968666, "loss": 4.581, "step": 154 }, { "epoch": 0.0, "learning_rate": 0.0002775290957923008, "loss": 4.4974, "step": 155 }, { "epoch": 0.0, "learning_rate": 0.000279319606087735, "loss": 4.811, "step": 156 }, { "epoch": 0.0, "learning_rate": 0.0002811101163831692, "loss": 4.8212, "step": 157 }, { "epoch": 0.0, "learning_rate": 0.00028290062667860337, "loss": 4.9435, "step": 158 }, { "epoch": 0.0, "learning_rate": 0.0002846911369740376, "loss": 4.586, "step": 159 }, { "epoch": 0.0, "learning_rate": 0.0002864816472694718, "loss": 4.4881, "step": 160 }, { "epoch": 0.0, "learning_rate": 0.000288272157564906, "loss": 4.9852, "step": 161 }, { "epoch": 0.0, "learning_rate": 0.00029006266786034017, "loss": 4.4589, "step": 162 }, { "epoch": 0.0, "learning_rate": 0.0002918531781557744, "loss": 4.6184, "step": 163 }, { "epoch": 0.0, "learning_rate": 0.0002936436884512086, "loss": 4.1212, "step": 164 }, { "epoch": 0.0, "learning_rate": 0.0002954341987466428, "loss": 3.8551, "step": 165 }, { "epoch": 0.0, "learning_rate": 0.000297224709042077, "loss": 4.4829, "step": 166 }, { "epoch": 0.0, "learning_rate": 0.0002990152193375112, "loss": 4.2405, "step": 167 }, { "epoch": 0.0, "learning_rate": 0.0003008057296329454, "loss": 4.3964, "step": 168 }, { "epoch": 0.0, "learning_rate": 0.0003025962399283796, "loss": 4.4555, "step": 169 }, { "epoch": 0.0, "learning_rate": 0.0003043867502238138, "loss": 4.018, "step": 170 }, { "epoch": 0.0, "learning_rate": 0.00030617726051924797, "loss": 4.4453, "step": 171 }, { "epoch": 0.0, "learning_rate": 0.0003079677708146822, "loss": 4.3352, "step": 172 }, { "epoch": 0.0, "learning_rate": 0.0003097582811101164, "loss": 4.4495, "step": 173 }, { "epoch": 0.0, "learning_rate": 0.0003115487914055506, "loss": 4.1979, "step": 174 }, { "epoch": 0.0, "learning_rate": 0.00031333930170098477, "loss": 3.74, "step": 175 }, { "epoch": 0.0, "learning_rate": 0.000315129811996419, "loss": 4.4224, "step": 176 }, { "epoch": 0.0, "learning_rate": 0.0003169203222918532, "loss": 4.5516, "step": 177 }, { "epoch": 0.0, "learning_rate": 0.0003187108325872874, "loss": 4.2591, "step": 178 }, { "epoch": 0.0, "learning_rate": 0.00032050134288272156, "loss": 3.827, "step": 179 }, { "epoch": 0.0, "learning_rate": 0.0003222918531781558, "loss": 3.9175, "step": 180 }, { "epoch": 0.0, "learning_rate": 0.00032408236347359, "loss": 4.1426, "step": 181 }, { "epoch": 0.0, "learning_rate": 0.0003258728737690242, "loss": 3.7717, "step": 182 }, { "epoch": 0.0, "learning_rate": 0.0003276633840644584, "loss": 3.6061, "step": 183 }, { "epoch": 0.0, "learning_rate": 0.0003294538943598926, "loss": 3.9013, "step": 184 }, { "epoch": 0.0, "learning_rate": 0.0003312444046553268, "loss": 3.9956, "step": 185 }, { "epoch": 0.0, "learning_rate": 0.000333034914950761, "loss": 4.1133, "step": 186 }, { "epoch": 0.01, "learning_rate": 0.0003348254252461952, "loss": 4.1065, "step": 187 }, { "epoch": 0.01, "learning_rate": 0.00033661593554162937, "loss": 3.9546, "step": 188 }, { "epoch": 0.01, "learning_rate": 0.0003384064458370636, "loss": 3.8297, "step": 189 }, { "epoch": 0.01, "learning_rate": 0.0003401969561324978, "loss": 4.0219, "step": 190 }, { "epoch": 0.01, "learning_rate": 0.000341987466427932, "loss": 4.3016, "step": 191 }, { "epoch": 0.01, "learning_rate": 0.00034377797672336617, "loss": 3.6119, "step": 192 }, { "epoch": 0.01, "learning_rate": 0.0003455684870188004, "loss": 3.7551, "step": 193 }, { "epoch": 0.01, "learning_rate": 0.00034735899731423454, "loss": 3.8241, "step": 194 }, { "epoch": 0.01, "learning_rate": 0.00034914950760966875, "loss": 3.8894, "step": 195 }, { "epoch": 0.01, "learning_rate": 0.00035094001790510296, "loss": 4.205, "step": 196 }, { "epoch": 0.01, "learning_rate": 0.0003527305282005371, "loss": 3.7176, "step": 197 }, { "epoch": 0.01, "learning_rate": 0.00035452103849597133, "loss": 4.0282, "step": 198 }, { "epoch": 0.01, "learning_rate": 0.00035631154879140555, "loss": 4.248, "step": 199 }, { "epoch": 0.01, "learning_rate": 0.00035810205908683976, "loss": 4.0002, "step": 200 }, { "epoch": 0.01, "learning_rate": 0.0003598925693822739, "loss": 4.0733, "step": 201 }, { "epoch": 0.01, "learning_rate": 0.00036168307967770813, "loss": 4.0621, "step": 202 }, { "epoch": 0.01, "learning_rate": 0.00036347358997314234, "loss": 4.214, "step": 203 }, { "epoch": 0.01, "learning_rate": 0.00036526410026857655, "loss": 3.8581, "step": 204 }, { "epoch": 0.01, "learning_rate": 0.0003670546105640107, "loss": 4.1524, "step": 205 }, { "epoch": 0.01, "learning_rate": 0.0003688451208594449, "loss": 3.7195, "step": 206 }, { "epoch": 0.01, "learning_rate": 0.00037063563115487914, "loss": 3.9658, "step": 207 }, { "epoch": 0.01, "learning_rate": 0.00037242614145031335, "loss": 4.185, "step": 208 }, { "epoch": 0.01, "learning_rate": 0.00037421665174574756, "loss": 3.9456, "step": 209 }, { "epoch": 0.01, "learning_rate": 0.0003760071620411817, "loss": 3.8828, "step": 210 }, { "epoch": 0.01, "learning_rate": 0.00037779767233661593, "loss": 4.1765, "step": 211 }, { "epoch": 0.01, "learning_rate": 0.00037958818263205015, "loss": 4.1349, "step": 212 }, { "epoch": 0.01, "learning_rate": 0.00038137869292748436, "loss": 4.0311, "step": 213 }, { "epoch": 0.01, "learning_rate": 0.0003831692032229185, "loss": 3.8383, "step": 214 }, { "epoch": 0.01, "learning_rate": 0.00038495971351835273, "loss": 3.9558, "step": 215 }, { "epoch": 0.01, "learning_rate": 0.00038675022381378694, "loss": 4.0246, "step": 216 }, { "epoch": 0.01, "learning_rate": 0.00038854073410922116, "loss": 3.89, "step": 217 }, { "epoch": 0.01, "learning_rate": 0.0003903312444046553, "loss": 3.8704, "step": 218 }, { "epoch": 0.01, "learning_rate": 0.0003921217547000895, "loss": 3.8425, "step": 219 }, { "epoch": 0.01, "learning_rate": 0.00039391226499552374, "loss": 4.1319, "step": 220 }, { "epoch": 0.01, "learning_rate": 0.00039570277529095795, "loss": 3.3613, "step": 221 }, { "epoch": 0.01, "learning_rate": 0.00039749328558639216, "loss": 3.5188, "step": 222 }, { "epoch": 0.01, "learning_rate": 0.0003992837958818263, "loss": 3.3119, "step": 223 }, { "epoch": 0.01, "learning_rate": 0.00040107430617726054, "loss": 3.7839, "step": 224 }, { "epoch": 0.01, "learning_rate": 0.00040286481647269475, "loss": 4.104, "step": 225 }, { "epoch": 0.01, "learning_rate": 0.00040465532676812896, "loss": 3.8107, "step": 226 }, { "epoch": 0.01, "learning_rate": 0.0004064458370635631, "loss": 3.9727, "step": 227 }, { "epoch": 0.01, "learning_rate": 0.00040823634735899733, "loss": 3.9511, "step": 228 }, { "epoch": 0.01, "learning_rate": 0.00041002685765443154, "loss": 3.775, "step": 229 }, { "epoch": 0.01, "learning_rate": 0.00041181736794986576, "loss": 3.6117, "step": 230 }, { "epoch": 0.01, "learning_rate": 0.0004136078782452999, "loss": 3.9469, "step": 231 }, { "epoch": 0.01, "learning_rate": 0.00041539838854073413, "loss": 4.0704, "step": 232 }, { "epoch": 0.01, "learning_rate": 0.00041718889883616834, "loss": 3.673, "step": 233 }, { "epoch": 0.01, "learning_rate": 0.00041897940913160255, "loss": 3.5402, "step": 234 }, { "epoch": 0.01, "learning_rate": 0.00042076991942703677, "loss": 3.9595, "step": 235 }, { "epoch": 0.01, "learning_rate": 0.0004225604297224709, "loss": 3.7778, "step": 236 }, { "epoch": 0.01, "learning_rate": 0.0004243509400179051, "loss": 3.9856, "step": 237 }, { "epoch": 0.01, "learning_rate": 0.0004261414503133393, "loss": 3.518, "step": 238 }, { "epoch": 0.01, "learning_rate": 0.0004279319606087735, "loss": 4.0735, "step": 239 }, { "epoch": 0.01, "learning_rate": 0.00042972247090420767, "loss": 3.7076, "step": 240 }, { "epoch": 0.01, "learning_rate": 0.0004315129811996419, "loss": 4.5105, "step": 241 }, { "epoch": 0.01, "learning_rate": 0.0004333034914950761, "loss": 5.0486, "step": 242 }, { "epoch": 0.01, "learning_rate": 0.0004350940017905103, "loss": 4.4837, "step": 243 }, { "epoch": 0.01, "learning_rate": 0.00043688451208594446, "loss": 5.4953, "step": 244 }, { "epoch": 0.01, "learning_rate": 0.0004386750223813787, "loss": 5.8736, "step": 245 }, { "epoch": 0.01, "learning_rate": 0.0004404655326768129, "loss": 4.2137, "step": 246 }, { "epoch": 0.01, "learning_rate": 0.0004422560429722471, "loss": 5.6172, "step": 247 }, { "epoch": 0.01, "learning_rate": 0.00044404655326768126, "loss": 5.093, "step": 248 }, { "epoch": 0.01, "learning_rate": 0.00044583706356311547, "loss": 5.4453, "step": 249 }, { "epoch": 0.01, "learning_rate": 0.0004476275738585497, "loss": 5.4778, "step": 250 }, { "epoch": 0.01, "learning_rate": 0.0004494180841539839, "loss": 3.9836, "step": 251 }, { "epoch": 0.01, "learning_rate": 0.0004512085944494181, "loss": 5.5934, "step": 252 }, { "epoch": 0.01, "learning_rate": 0.00045299910474485227, "loss": 5.7119, "step": 253 }, { "epoch": 0.01, "learning_rate": 0.0004547896150402865, "loss": 5.1526, "step": 254 }, { "epoch": 0.01, "learning_rate": 0.0004565801253357207, "loss": 5.5668, "step": 255 }, { "epoch": 0.01, "learning_rate": 0.0004583706356311549, "loss": 3.8288, "step": 256 }, { "epoch": 0.01, "learning_rate": 0.00046016114592658906, "loss": 5.0193, "step": 257 }, { "epoch": 0.01, "learning_rate": 0.0004619516562220233, "loss": 5.6345, "step": 258 }, { "epoch": 0.01, "learning_rate": 0.0004637421665174575, "loss": 3.9663, "step": 259 }, { "epoch": 0.01, "learning_rate": 0.0004655326768128917, "loss": 4.6789, "step": 260 }, { "epoch": 0.01, "learning_rate": 0.00046732318710832586, "loss": 5.1286, "step": 261 }, { "epoch": 0.01, "learning_rate": 0.0004691136974037601, "loss": 4.4272, "step": 262 }, { "epoch": 0.01, "learning_rate": 0.0004709042076991943, "loss": 3.6719, "step": 263 }, { "epoch": 0.01, "learning_rate": 0.0004726947179946285, "loss": 4.0172, "step": 264 }, { "epoch": 0.01, "learning_rate": 0.0004744852282900627, "loss": 4.3998, "step": 265 }, { "epoch": 0.01, "learning_rate": 0.00047627573858549687, "loss": 4.0789, "step": 266 }, { "epoch": 0.01, "learning_rate": 0.0004780662488809311, "loss": 3.4893, "step": 267 }, { "epoch": 0.01, "learning_rate": 0.0004798567591763653, "loss": 3.683, "step": 268 }, { "epoch": 0.01, "learning_rate": 0.0004816472694717995, "loss": 3.6118, "step": 269 }, { "epoch": 0.01, "learning_rate": 0.00048343777976723367, "loss": 3.5021, "step": 270 }, { "epoch": 0.01, "learning_rate": 0.0004852282900626679, "loss": 3.9293, "step": 271 }, { "epoch": 0.01, "learning_rate": 0.0004870188003581021, "loss": 3.5696, "step": 272 }, { "epoch": 0.01, "learning_rate": 0.0004888093106535363, "loss": 3.2711, "step": 273 }, { "epoch": 0.01, "learning_rate": 0.0004905998209489705, "loss": 3.521, "step": 274 }, { "epoch": 0.01, "learning_rate": 0.0004923903312444047, "loss": 3.9253, "step": 275 }, { "epoch": 0.01, "learning_rate": 0.0004941808415398389, "loss": 4.0937, "step": 276 }, { "epoch": 0.01, "learning_rate": 0.000495971351835273, "loss": 3.5425, "step": 277 }, { "epoch": 0.01, "learning_rate": 0.0004977618621307073, "loss": 3.239, "step": 278 }, { "epoch": 0.01, "learning_rate": 0.0004995523724261415, "loss": 3.7604, "step": 279 }, { "epoch": 0.01, "learning_rate": 0.0005013428827215757, "loss": 3.3447, "step": 280 }, { "epoch": 0.01, "learning_rate": 0.0005031333930170099, "loss": 3.5071, "step": 281 }, { "epoch": 0.01, "learning_rate": 0.0005049239033124441, "loss": 3.5459, "step": 282 }, { "epoch": 0.01, "learning_rate": 0.0005067144136078783, "loss": 3.5922, "step": 283 }, { "epoch": 0.01, "learning_rate": 0.0005085049239033125, "loss": 3.9944, "step": 284 }, { "epoch": 0.01, "learning_rate": 0.0005102954341987466, "loss": 3.6343, "step": 285 }, { "epoch": 0.01, "learning_rate": 0.0005120859444941809, "loss": 3.8104, "step": 286 }, { "epoch": 0.01, "learning_rate": 0.0005138764547896151, "loss": 3.552, "step": 287 }, { "epoch": 0.01, "learning_rate": 0.0005156669650850493, "loss": 3.4447, "step": 288 }, { "epoch": 0.01, "learning_rate": 0.0005174574753804835, "loss": 3.4319, "step": 289 }, { "epoch": 0.01, "learning_rate": 0.0005192479856759176, "loss": 3.534, "step": 290 }, { "epoch": 0.01, "learning_rate": 0.0005210384959713519, "loss": 4.1717, "step": 291 }, { "epoch": 0.01, "learning_rate": 0.0005228290062667861, "loss": 3.6194, "step": 292 }, { "epoch": 0.01, "learning_rate": 0.0005246195165622203, "loss": 3.2478, "step": 293 }, { "epoch": 0.01, "learning_rate": 0.0005264100268576545, "loss": 3.7416, "step": 294 }, { "epoch": 0.01, "learning_rate": 0.0005282005371530887, "loss": 3.2613, "step": 295 }, { "epoch": 0.01, "learning_rate": 0.0005299910474485229, "loss": 3.7742, "step": 296 }, { "epoch": 0.01, "learning_rate": 0.0005317815577439571, "loss": 3.7118, "step": 297 }, { "epoch": 0.01, "learning_rate": 0.0005335720680393912, "loss": 3.2314, "step": 298 }, { "epoch": 0.01, "learning_rate": 0.0005353625783348255, "loss": 3.6318, "step": 299 }, { "epoch": 0.01, "learning_rate": 0.0005371530886302597, "loss": 3.3492, "step": 300 }, { "epoch": 0.01, "learning_rate": 0.0005389435989256938, "loss": 3.4706, "step": 301 }, { "epoch": 0.01, "learning_rate": 0.000540734109221128, "loss": 3.5113, "step": 302 }, { "epoch": 0.01, "learning_rate": 0.0005425246195165621, "loss": 3.7259, "step": 303 }, { "epoch": 0.01, "learning_rate": 0.0005443151298119964, "loss": 3.6912, "step": 304 }, { "epoch": 0.01, "learning_rate": 0.0005461056401074306, "loss": 3.3586, "step": 305 }, { "epoch": 0.01, "learning_rate": 0.0005478961504028648, "loss": 3.2479, "step": 306 }, { "epoch": 0.01, "learning_rate": 0.000549686660698299, "loss": 3.4546, "step": 307 }, { "epoch": 0.01, "learning_rate": 0.0005514771709937331, "loss": 4.1328, "step": 308 }, { "epoch": 0.01, "learning_rate": 0.0005532676812891674, "loss": 3.2299, "step": 309 }, { "epoch": 0.01, "learning_rate": 0.0005550581915846016, "loss": 3.5139, "step": 310 }, { "epoch": 0.01, "learning_rate": 0.0005568487018800357, "loss": 3.3561, "step": 311 }, { "epoch": 0.01, "learning_rate": 0.00055863921217547, "loss": 3.3174, "step": 312 }, { "epoch": 0.01, "learning_rate": 0.0005604297224709042, "loss": 3.2827, "step": 313 }, { "epoch": 0.01, "learning_rate": 0.0005622202327663384, "loss": 3.5024, "step": 314 }, { "epoch": 0.01, "learning_rate": 0.0005640107430617726, "loss": 3.3989, "step": 315 }, { "epoch": 0.01, "learning_rate": 0.0005658012533572067, "loss": 3.5208, "step": 316 }, { "epoch": 0.01, "learning_rate": 0.000567591763652641, "loss": 3.502, "step": 317 }, { "epoch": 0.01, "learning_rate": 0.0005693822739480752, "loss": 3.439, "step": 318 }, { "epoch": 0.01, "learning_rate": 0.0005711727842435094, "loss": 3.3613, "step": 319 }, { "epoch": 0.01, "learning_rate": 0.0005729632945389436, "loss": 3.3534, "step": 320 }, { "epoch": 0.01, "learning_rate": 0.0005747538048343778, "loss": 3.3617, "step": 321 }, { "epoch": 0.01, "learning_rate": 0.000576544315129812, "loss": 3.5724, "step": 322 }, { "epoch": 0.01, "learning_rate": 0.0005783348254252462, "loss": 3.574, "step": 323 }, { "epoch": 0.01, "learning_rate": 0.0005801253357206803, "loss": 3.3338, "step": 324 }, { "epoch": 0.01, "learning_rate": 0.0005819158460161146, "loss": 3.5673, "step": 325 }, { "epoch": 0.01, "learning_rate": 0.0005837063563115488, "loss": 3.392, "step": 326 }, { "epoch": 0.01, "learning_rate": 0.000585496866606983, "loss": 3.4044, "step": 327 }, { "epoch": 0.01, "learning_rate": 0.0005872873769024172, "loss": 3.0586, "step": 328 }, { "epoch": 0.01, "learning_rate": 0.0005890778871978513, "loss": 3.638, "step": 329 }, { "epoch": 0.01, "learning_rate": 0.0005908683974932856, "loss": 3.7448, "step": 330 }, { "epoch": 0.01, "learning_rate": 0.0005926589077887198, "loss": 3.5442, "step": 331 }, { "epoch": 0.01, "learning_rate": 0.000594449418084154, "loss": 3.9698, "step": 332 }, { "epoch": 0.01, "learning_rate": 0.0005962399283795882, "loss": 3.7641, "step": 333 }, { "epoch": 0.01, "learning_rate": 0.0005980304386750224, "loss": 3.7359, "step": 334 }, { "epoch": 0.01, "learning_rate": 0.0005998209489704566, "loss": 3.7512, "step": 335 }, { "epoch": 0.01, "learning_rate": 0.0006016114592658908, "loss": 3.5493, "step": 336 }, { "epoch": 0.01, "learning_rate": 0.0006034019695613249, "loss": 3.2754, "step": 337 }, { "epoch": 0.01, "learning_rate": 0.0006051924798567592, "loss": 3.6352, "step": 338 }, { "epoch": 0.01, "learning_rate": 0.0006069829901521934, "loss": 3.1621, "step": 339 }, { "epoch": 0.01, "learning_rate": 0.0006087735004476276, "loss": 3.6362, "step": 340 }, { "epoch": 0.01, "learning_rate": 0.0006105640107430618, "loss": 3.3867, "step": 341 }, { "epoch": 0.01, "learning_rate": 0.0006123545210384959, "loss": 3.7399, "step": 342 }, { "epoch": 0.01, "learning_rate": 0.0006141450313339302, "loss": 3.4761, "step": 343 }, { "epoch": 0.01, "learning_rate": 0.0006159355416293644, "loss": 3.4959, "step": 344 }, { "epoch": 0.01, "learning_rate": 0.0006177260519247986, "loss": 3.4228, "step": 345 }, { "epoch": 0.01, "learning_rate": 0.0006195165622202328, "loss": 3.5332, "step": 346 }, { "epoch": 0.01, "learning_rate": 0.000621307072515667, "loss": 3.41, "step": 347 }, { "epoch": 0.01, "learning_rate": 0.0006230975828111012, "loss": 3.8024, "step": 348 }, { "epoch": 0.01, "learning_rate": 0.0006248880931065354, "loss": 3.5774, "step": 349 }, { "epoch": 0.01, "learning_rate": 0.0006266786034019695, "loss": 3.8261, "step": 350 }, { "epoch": 0.01, "learning_rate": 0.0006284691136974038, "loss": 3.5932, "step": 351 }, { "epoch": 0.01, "learning_rate": 0.000630259623992838, "loss": 3.6554, "step": 352 }, { "epoch": 0.01, "learning_rate": 0.0006320501342882722, "loss": 3.2644, "step": 353 }, { "epoch": 0.01, "learning_rate": 0.0006338406445837064, "loss": 3.4426, "step": 354 }, { "epoch": 0.01, "learning_rate": 0.0006356311548791405, "loss": 3.3817, "step": 355 }, { "epoch": 0.01, "learning_rate": 0.0006374216651745748, "loss": 3.4123, "step": 356 }, { "epoch": 0.01, "learning_rate": 0.000639212175470009, "loss": 3.5975, "step": 357 }, { "epoch": 0.01, "learning_rate": 0.0006410026857654431, "loss": 3.1913, "step": 358 }, { "epoch": 0.01, "learning_rate": 0.0006427931960608774, "loss": 3.2236, "step": 359 }, { "epoch": 0.01, "learning_rate": 0.0006445837063563116, "loss": 3.546, "step": 360 }, { "epoch": 0.01, "learning_rate": 0.0006463742166517458, "loss": 3.1708, "step": 361 }, { "epoch": 0.01, "learning_rate": 0.00064816472694718, "loss": 3.4521, "step": 362 }, { "epoch": 0.01, "learning_rate": 0.0006499552372426141, "loss": 3.0231, "step": 363 }, { "epoch": 0.01, "learning_rate": 0.0006517457475380484, "loss": 3.2148, "step": 364 }, { "epoch": 0.01, "learning_rate": 0.0006535362578334826, "loss": 3.3602, "step": 365 }, { "epoch": 0.01, "learning_rate": 0.0006553267681289168, "loss": 3.5744, "step": 366 }, { "epoch": 0.01, "learning_rate": 0.000657117278424351, "loss": 3.5998, "step": 367 }, { "epoch": 0.01, "learning_rate": 0.0006589077887197851, "loss": 3.6652, "step": 368 }, { "epoch": 0.01, "learning_rate": 0.0006606982990152194, "loss": 3.463, "step": 369 }, { "epoch": 0.01, "learning_rate": 0.0006624888093106536, "loss": 2.9099, "step": 370 }, { "epoch": 0.01, "learning_rate": 0.0006642793196060877, "loss": 3.143, "step": 371 }, { "epoch": 0.01, "learning_rate": 0.000666069829901522, "loss": 3.4898, "step": 372 }, { "epoch": 0.01, "learning_rate": 0.0006678603401969562, "loss": 3.3458, "step": 373 }, { "epoch": 0.01, "learning_rate": 0.0006696508504923904, "loss": 3.6675, "step": 374 }, { "epoch": 0.01, "learning_rate": 0.0006714413607878246, "loss": 3.417, "step": 375 }, { "epoch": 0.01, "learning_rate": 0.0006732318710832587, "loss": 3.7407, "step": 376 }, { "epoch": 0.01, "learning_rate": 0.000675022381378693, "loss": 3.0268, "step": 377 }, { "epoch": 0.01, "learning_rate": 0.0006768128916741272, "loss": 3.399, "step": 378 }, { "epoch": 0.01, "learning_rate": 0.0006786034019695614, "loss": 3.4602, "step": 379 }, { "epoch": 0.01, "learning_rate": 0.0006803939122649956, "loss": 3.0577, "step": 380 }, { "epoch": 0.01, "learning_rate": 0.0006821844225604297, "loss": 3.1608, "step": 381 }, { "epoch": 0.01, "learning_rate": 0.000683974932855864, "loss": 3.3228, "step": 382 }, { "epoch": 0.01, "learning_rate": 0.0006857654431512982, "loss": 3.4515, "step": 383 }, { "epoch": 0.01, "learning_rate": 0.0006875559534467323, "loss": 3.5448, "step": 384 }, { "epoch": 0.01, "learning_rate": 0.0006893464637421666, "loss": 3.5919, "step": 385 }, { "epoch": 0.01, "learning_rate": 0.0006911369740376008, "loss": 3.6327, "step": 386 }, { "epoch": 0.01, "learning_rate": 0.0006929274843330349, "loss": 3.287, "step": 387 }, { "epoch": 0.01, "learning_rate": 0.0006947179946284691, "loss": 3.4324, "step": 388 }, { "epoch": 0.01, "learning_rate": 0.0006965085049239032, "loss": 3.0475, "step": 389 }, { "epoch": 0.01, "learning_rate": 0.0006982990152193375, "loss": 3.614, "step": 390 }, { "epoch": 0.01, "learning_rate": 0.0007000895255147717, "loss": 3.6682, "step": 391 }, { "epoch": 0.01, "learning_rate": 0.0007018800358102059, "loss": 3.1188, "step": 392 }, { "epoch": 0.01, "learning_rate": 0.0007036705461056401, "loss": 3.1511, "step": 393 }, { "epoch": 0.01, "learning_rate": 0.0007054610564010742, "loss": 3.6047, "step": 394 }, { "epoch": 0.01, "learning_rate": 0.0007072515666965085, "loss": 3.1462, "step": 395 }, { "epoch": 0.01, "learning_rate": 0.0007090420769919427, "loss": 3.2402, "step": 396 }, { "epoch": 0.01, "learning_rate": 0.0007108325872873768, "loss": 3.6904, "step": 397 }, { "epoch": 0.01, "learning_rate": 0.0007126230975828111, "loss": 3.2493, "step": 398 }, { "epoch": 0.01, "learning_rate": 0.0007144136078782452, "loss": 3.4675, "step": 399 }, { "epoch": 0.01, "learning_rate": 0.0007162041181736795, "loss": 3.2085, "step": 400 }, { "epoch": 0.01, "learning_rate": 0.0007179946284691137, "loss": 3.3776, "step": 401 }, { "epoch": 0.01, "learning_rate": 0.0007197851387645478, "loss": 3.2554, "step": 402 }, { "epoch": 0.01, "learning_rate": 0.0007215756490599821, "loss": 3.2872, "step": 403 }, { "epoch": 0.01, "learning_rate": 0.0007233661593554163, "loss": 3.2138, "step": 404 }, { "epoch": 0.01, "learning_rate": 0.0007251566696508505, "loss": 3.4977, "step": 405 }, { "epoch": 0.01, "learning_rate": 0.0007269471799462847, "loss": 3.2995, "step": 406 }, { "epoch": 0.01, "learning_rate": 0.0007287376902417188, "loss": 3.2328, "step": 407 }, { "epoch": 0.01, "learning_rate": 0.0007305282005371531, "loss": 3.0464, "step": 408 }, { "epoch": 0.01, "learning_rate": 0.0007323187108325873, "loss": 3.0698, "step": 409 }, { "epoch": 0.01, "learning_rate": 0.0007341092211280214, "loss": 3.1015, "step": 410 }, { "epoch": 0.01, "learning_rate": 0.0007358997314234557, "loss": 3.3449, "step": 411 }, { "epoch": 0.01, "learning_rate": 0.0007376902417188899, "loss": 3.0336, "step": 412 }, { "epoch": 0.01, "learning_rate": 0.0007394807520143241, "loss": 3.5707, "step": 413 }, { "epoch": 0.01, "learning_rate": 0.0007412712623097583, "loss": 3.3676, "step": 414 }, { "epoch": 0.01, "learning_rate": 0.0007430617726051924, "loss": 3.3709, "step": 415 }, { "epoch": 0.01, "learning_rate": 0.0007448522829006267, "loss": 3.0944, "step": 416 }, { "epoch": 0.01, "learning_rate": 0.0007466427931960609, "loss": 3.1165, "step": 417 }, { "epoch": 0.01, "learning_rate": 0.0007484333034914951, "loss": 3.4108, "step": 418 }, { "epoch": 0.01, "learning_rate": 0.0007502238137869293, "loss": 3.3192, "step": 419 }, { "epoch": 0.01, "learning_rate": 0.0007520143240823634, "loss": 3.1601, "step": 420 }, { "epoch": 0.01, "learning_rate": 0.0007538048343777977, "loss": 3.2573, "step": 421 }, { "epoch": 0.01, "learning_rate": 0.0007555953446732319, "loss": 3.3103, "step": 422 }, { "epoch": 0.01, "learning_rate": 0.000757385854968666, "loss": 3.4379, "step": 423 }, { "epoch": 0.01, "learning_rate": 0.0007591763652641003, "loss": 3.4999, "step": 424 }, { "epoch": 0.01, "learning_rate": 0.0007609668755595345, "loss": 3.51, "step": 425 }, { "epoch": 0.01, "learning_rate": 0.0007627573858549687, "loss": 3.0963, "step": 426 }, { "epoch": 0.01, "learning_rate": 0.0007645478961504029, "loss": 3.4669, "step": 427 }, { "epoch": 0.01, "learning_rate": 0.000766338406445837, "loss": 3.4328, "step": 428 }, { "epoch": 0.01, "learning_rate": 0.0007681289167412713, "loss": 3.0618, "step": 429 }, { "epoch": 0.01, "learning_rate": 0.0007699194270367055, "loss": 3.512, "step": 430 }, { "epoch": 0.01, "learning_rate": 0.0007717099373321397, "loss": 3.2691, "step": 431 }, { "epoch": 0.01, "learning_rate": 0.0007735004476275739, "loss": 2.9747, "step": 432 }, { "epoch": 0.01, "learning_rate": 0.000775290957923008, "loss": 3.4736, "step": 433 }, { "epoch": 0.01, "learning_rate": 0.0007770814682184423, "loss": 3.337, "step": 434 }, { "epoch": 0.01, "learning_rate": 0.0007788719785138765, "loss": 3.0916, "step": 435 }, { "epoch": 0.01, "learning_rate": 0.0007806624888093106, "loss": 3.0492, "step": 436 }, { "epoch": 0.01, "learning_rate": 0.0007824529991047449, "loss": 3.1553, "step": 437 }, { "epoch": 0.01, "learning_rate": 0.000784243509400179, "loss": 3.0561, "step": 438 }, { "epoch": 0.01, "learning_rate": 0.0007860340196956133, "loss": 3.2285, "step": 439 }, { "epoch": 0.01, "learning_rate": 0.0007878245299910475, "loss": 3.0457, "step": 440 }, { "epoch": 0.01, "learning_rate": 0.0007896150402864816, "loss": 3.1644, "step": 441 }, { "epoch": 0.01, "learning_rate": 0.0007914055505819159, "loss": 3.0102, "step": 442 }, { "epoch": 0.01, "learning_rate": 0.0007931960608773501, "loss": 3.2131, "step": 443 }, { "epoch": 0.01, "learning_rate": 0.0007949865711727843, "loss": 3.342, "step": 444 }, { "epoch": 0.01, "learning_rate": 0.0007967770814682185, "loss": 3.0169, "step": 445 }, { "epoch": 0.01, "learning_rate": 0.0007985675917636526, "loss": 3.1876, "step": 446 }, { "epoch": 0.01, "learning_rate": 0.0008003581020590869, "loss": 3.5914, "step": 447 }, { "epoch": 0.01, "learning_rate": 0.0008021486123545211, "loss": 3.0662, "step": 448 }, { "epoch": 0.01, "learning_rate": 0.0008039391226499552, "loss": 3.6263, "step": 449 }, { "epoch": 0.01, "learning_rate": 0.0008057296329453895, "loss": 3.1521, "step": 450 }, { "epoch": 0.01, "learning_rate": 0.0008075201432408237, "loss": 2.9175, "step": 451 }, { "epoch": 0.01, "learning_rate": 0.0008093106535362579, "loss": 3.0264, "step": 452 }, { "epoch": 0.01, "learning_rate": 0.0008111011638316921, "loss": 3.4028, "step": 453 }, { "epoch": 0.01, "learning_rate": 0.0008128916741271262, "loss": 3.2034, "step": 454 }, { "epoch": 0.01, "learning_rate": 0.0008146821844225605, "loss": 3.14, "step": 455 }, { "epoch": 0.01, "learning_rate": 0.0008164726947179947, "loss": 3.1843, "step": 456 }, { "epoch": 0.01, "learning_rate": 0.0008182632050134289, "loss": 3.5349, "step": 457 }, { "epoch": 0.01, "learning_rate": 0.0008200537153088631, "loss": 3.1724, "step": 458 }, { "epoch": 0.01, "learning_rate": 0.0008218442256042972, "loss": 3.3373, "step": 459 }, { "epoch": 0.01, "learning_rate": 0.0008236347358997315, "loss": 2.8137, "step": 460 }, { "epoch": 0.01, "learning_rate": 0.0008254252461951657, "loss": 3.1698, "step": 461 }, { "epoch": 0.01, "learning_rate": 0.0008272157564905998, "loss": 3.1764, "step": 462 }, { "epoch": 0.01, "learning_rate": 0.0008290062667860341, "loss": 3.5221, "step": 463 }, { "epoch": 0.01, "learning_rate": 0.0008307967770814683, "loss": 3.5673, "step": 464 }, { "epoch": 0.01, "learning_rate": 0.0008325872873769025, "loss": 3.3826, "step": 465 }, { "epoch": 0.01, "learning_rate": 0.0008343777976723367, "loss": 3.4042, "step": 466 }, { "epoch": 0.01, "learning_rate": 0.0008361683079677708, "loss": 3.1004, "step": 467 }, { "epoch": 0.01, "learning_rate": 0.0008379588182632051, "loss": 3.0786, "step": 468 }, { "epoch": 0.01, "learning_rate": 0.0008397493285586393, "loss": 3.477, "step": 469 }, { "epoch": 0.01, "learning_rate": 0.0008415398388540735, "loss": 3.1772, "step": 470 }, { "epoch": 0.01, "learning_rate": 0.0008433303491495077, "loss": 3.2516, "step": 471 }, { "epoch": 0.01, "learning_rate": 0.0008451208594449418, "loss": 3.1066, "step": 472 }, { "epoch": 0.01, "learning_rate": 0.000846911369740376, "loss": 3.2839, "step": 473 }, { "epoch": 0.01, "learning_rate": 0.0008487018800358102, "loss": 3.0541, "step": 474 }, { "epoch": 0.01, "learning_rate": 0.0008504923903312443, "loss": 3.1582, "step": 475 }, { "epoch": 0.01, "learning_rate": 0.0008522829006266786, "loss": 3.0824, "step": 476 }, { "epoch": 0.01, "learning_rate": 0.0008540734109221127, "loss": 3.2805, "step": 477 }, { "epoch": 0.01, "learning_rate": 0.000855863921217547, "loss": 2.7879, "step": 478 }, { "epoch": 0.01, "learning_rate": 0.0008576544315129812, "loss": 3.0792, "step": 479 }, { "epoch": 0.01, "learning_rate": 0.0008594449418084153, "loss": 3.424, "step": 480 }, { "epoch": 0.01, "learning_rate": 0.0008612354521038496, "loss": 3.3996, "step": 481 }, { "epoch": 0.01, "learning_rate": 0.0008630259623992838, "loss": 3.3897, "step": 482 }, { "epoch": 0.01, "learning_rate": 0.0008648164726947179, "loss": 3.1662, "step": 483 }, { "epoch": 0.01, "learning_rate": 0.0008666069829901522, "loss": 3.128, "step": 484 }, { "epoch": 0.01, "learning_rate": 0.0008683974932855863, "loss": 3.1417, "step": 485 }, { "epoch": 0.01, "learning_rate": 0.0008701880035810206, "loss": 3.2643, "step": 486 }, { "epoch": 0.01, "learning_rate": 0.0008719785138764548, "loss": 3.0019, "step": 487 }, { "epoch": 0.01, "learning_rate": 0.0008737690241718889, "loss": 3.0688, "step": 488 }, { "epoch": 0.01, "learning_rate": 0.0008755595344673232, "loss": 3.0983, "step": 489 }, { "epoch": 0.01, "learning_rate": 0.0008773500447627574, "loss": 3.1612, "step": 490 }, { "epoch": 0.01, "learning_rate": 0.0008791405550581916, "loss": 3.2111, "step": 491 }, { "epoch": 0.01, "learning_rate": 0.0008809310653536258, "loss": 3.4782, "step": 492 }, { "epoch": 0.01, "learning_rate": 0.0008827215756490599, "loss": 3.166, "step": 493 }, { "epoch": 0.01, "learning_rate": 0.0008845120859444942, "loss": 3.6083, "step": 494 }, { "epoch": 0.01, "learning_rate": 0.0008863025962399284, "loss": 3.2796, "step": 495 }, { "epoch": 0.01, "learning_rate": 0.0008880931065353625, "loss": 3.3072, "step": 496 }, { "epoch": 0.01, "learning_rate": 0.0008898836168307968, "loss": 3.0319, "step": 497 }, { "epoch": 0.01, "learning_rate": 0.0008916741271262309, "loss": 2.9963, "step": 498 }, { "epoch": 0.01, "learning_rate": 0.0008934646374216652, "loss": 3.5126, "step": 499 }, { "epoch": 0.01, "learning_rate": 0.0008952551477170994, "loss": 3.4318, "step": 500 }, { "epoch": 0.01, "learning_rate": 0.0008970456580125335, "loss": 3.4824, "step": 501 }, { "epoch": 0.01, "learning_rate": 0.0008988361683079678, "loss": 3.1286, "step": 502 }, { "epoch": 0.01, "learning_rate": 0.000900626678603402, "loss": 2.8894, "step": 503 }, { "epoch": 0.01, "learning_rate": 0.0009024171888988362, "loss": 2.9164, "step": 504 }, { "epoch": 0.01, "learning_rate": 0.0009042076991942704, "loss": 3.1285, "step": 505 }, { "epoch": 0.01, "learning_rate": 0.0009059982094897045, "loss": 3.1487, "step": 506 }, { "epoch": 0.01, "learning_rate": 0.0009077887197851388, "loss": 3.1334, "step": 507 }, { "epoch": 0.01, "learning_rate": 0.000909579230080573, "loss": 3.1966, "step": 508 }, { "epoch": 0.01, "learning_rate": 0.0009113697403760071, "loss": 2.9846, "step": 509 }, { "epoch": 0.01, "learning_rate": 0.0009131602506714414, "loss": 2.87, "step": 510 }, { "epoch": 0.01, "learning_rate": 0.0009149507609668755, "loss": 3.0338, "step": 511 }, { "epoch": 0.01, "learning_rate": 0.0009167412712623098, "loss": 3.0743, "step": 512 }, { "epoch": 0.01, "learning_rate": 0.000918531781557744, "loss": 2.9198, "step": 513 }, { "epoch": 0.01, "learning_rate": 0.0009203222918531781, "loss": 2.9597, "step": 514 }, { "epoch": 0.01, "learning_rate": 0.0009221128021486124, "loss": 3.2017, "step": 515 }, { "epoch": 0.01, "learning_rate": 0.0009239033124440466, "loss": 3.1606, "step": 516 }, { "epoch": 0.01, "learning_rate": 0.0009256938227394808, "loss": 2.8733, "step": 517 }, { "epoch": 0.01, "learning_rate": 0.000927484333034915, "loss": 3.0833, "step": 518 }, { "epoch": 0.01, "learning_rate": 0.0009292748433303491, "loss": 3.2412, "step": 519 }, { "epoch": 0.01, "learning_rate": 0.0009310653536257834, "loss": 2.7794, "step": 520 }, { "epoch": 0.01, "learning_rate": 0.0009328558639212176, "loss": 2.876, "step": 521 }, { "epoch": 0.01, "learning_rate": 0.0009346463742166517, "loss": 2.9848, "step": 522 }, { "epoch": 0.01, "learning_rate": 0.000936436884512086, "loss": 3.3686, "step": 523 }, { "epoch": 0.01, "learning_rate": 0.0009382273948075201, "loss": 2.7405, "step": 524 }, { "epoch": 0.01, "learning_rate": 0.0009400179051029544, "loss": 2.9974, "step": 525 }, { "epoch": 0.01, "learning_rate": 0.0009418084153983886, "loss": 3.0855, "step": 526 }, { "epoch": 0.01, "learning_rate": 0.0009435989256938227, "loss": 3.4936, "step": 527 }, { "epoch": 0.01, "learning_rate": 0.000945389435989257, "loss": 3.0144, "step": 528 }, { "epoch": 0.01, "learning_rate": 0.0009471799462846912, "loss": 3.4589, "step": 529 }, { "epoch": 0.01, "learning_rate": 0.0009489704565801254, "loss": 2.8507, "step": 530 }, { "epoch": 0.01, "learning_rate": 0.0009507609668755596, "loss": 3.0169, "step": 531 }, { "epoch": 0.01, "learning_rate": 0.0009525514771709937, "loss": 2.9429, "step": 532 }, { "epoch": 0.01, "learning_rate": 0.000954341987466428, "loss": 2.855, "step": 533 }, { "epoch": 0.01, "learning_rate": 0.0009561324977618622, "loss": 3.2347, "step": 534 }, { "epoch": 0.01, "learning_rate": 0.0009579230080572963, "loss": 3.0188, "step": 535 }, { "epoch": 0.01, "learning_rate": 0.0009597135183527306, "loss": 2.8774, "step": 536 }, { "epoch": 0.01, "learning_rate": 0.0009615040286481647, "loss": 2.8611, "step": 537 }, { "epoch": 0.01, "learning_rate": 0.000963294538943599, "loss": 3.0985, "step": 538 }, { "epoch": 0.01, "learning_rate": 0.0009650850492390332, "loss": 3.1152, "step": 539 }, { "epoch": 0.01, "learning_rate": 0.0009668755595344673, "loss": 3.1147, "step": 540 }, { "epoch": 0.01, "learning_rate": 0.0009686660698299016, "loss": 3.288, "step": 541 }, { "epoch": 0.01, "learning_rate": 0.0009704565801253358, "loss": 3.0032, "step": 542 }, { "epoch": 0.01, "learning_rate": 0.00097224709042077, "loss": 3.4751, "step": 543 }, { "epoch": 0.01, "learning_rate": 0.0009740376007162042, "loss": 3.1331, "step": 544 }, { "epoch": 0.01, "learning_rate": 0.0009758281110116383, "loss": 2.9328, "step": 545 }, { "epoch": 0.01, "learning_rate": 0.0009776186213070726, "loss": 3.3086, "step": 546 }, { "epoch": 0.01, "learning_rate": 0.0009794091316025068, "loss": 3.1845, "step": 547 }, { "epoch": 0.01, "learning_rate": 0.000981199641897941, "loss": 3.4527, "step": 548 }, { "epoch": 0.01, "learning_rate": 0.000982990152193375, "loss": 3.287, "step": 549 }, { "epoch": 0.01, "learning_rate": 0.0009847806624888095, "loss": 3.2336, "step": 550 }, { "epoch": 0.01, "learning_rate": 0.0009865711727842436, "loss": 2.7652, "step": 551 }, { "epoch": 0.01, "learning_rate": 0.0009883616830796778, "loss": 3.1686, "step": 552 }, { "epoch": 0.01, "learning_rate": 0.000990152193375112, "loss": 3.0342, "step": 553 }, { "epoch": 0.01, "learning_rate": 0.000991942703670546, "loss": 3.1282, "step": 554 }, { "epoch": 0.01, "learning_rate": 0.0009937332139659805, "loss": 2.9819, "step": 555 }, { "epoch": 0.01, "learning_rate": 0.0009955237242614146, "loss": 3.1044, "step": 556 }, { "epoch": 0.01, "learning_rate": 0.0009973142345568488, "loss": 3.1355, "step": 557 }, { "epoch": 0.01, "learning_rate": 0.000999104744852283, "loss": 3.2472, "step": 558 }, { "epoch": 0.02, "learning_rate": 0.001000895255147717, "loss": 2.9824, "step": 559 }, { "epoch": 0.02, "learning_rate": 0.0010026857654431515, "loss": 2.5624, "step": 560 }, { "epoch": 0.02, "learning_rate": 0.0010044762757385854, "loss": 3.0125, "step": 561 }, { "epoch": 0.02, "learning_rate": 0.0010062667860340198, "loss": 2.9381, "step": 562 }, { "epoch": 0.02, "learning_rate": 0.001008057296329454, "loss": 2.9866, "step": 563 }, { "epoch": 0.02, "learning_rate": 0.0010098478066248881, "loss": 2.7968, "step": 564 }, { "epoch": 0.02, "learning_rate": 0.0010116383169203223, "loss": 3.1933, "step": 565 }, { "epoch": 0.02, "learning_rate": 0.0010134288272157566, "loss": 3.2999, "step": 566 }, { "epoch": 0.02, "learning_rate": 0.0010152193375111906, "loss": 3.2938, "step": 567 }, { "epoch": 0.02, "learning_rate": 0.001017009847806625, "loss": 2.9808, "step": 568 }, { "epoch": 0.02, "learning_rate": 0.0010188003581020591, "loss": 3.4899, "step": 569 }, { "epoch": 0.02, "learning_rate": 0.0010205908683974933, "loss": 3.2661, "step": 570 }, { "epoch": 0.02, "learning_rate": 0.0010223813786929274, "loss": 2.9455, "step": 571 }, { "epoch": 0.02, "learning_rate": 0.0010241718889883618, "loss": 3.1972, "step": 572 }, { "epoch": 0.02, "learning_rate": 0.001025962399283796, "loss": 2.9645, "step": 573 }, { "epoch": 0.02, "learning_rate": 0.0010277529095792301, "loss": 3.3339, "step": 574 }, { "epoch": 0.02, "learning_rate": 0.0010295434198746643, "loss": 3.1887, "step": 575 }, { "epoch": 0.02, "learning_rate": 0.0010313339301700987, "loss": 3.1085, "step": 576 }, { "epoch": 0.02, "learning_rate": 0.0010331244404655326, "loss": 3.0069, "step": 577 }, { "epoch": 0.02, "learning_rate": 0.001034914950760967, "loss": 3.3705, "step": 578 }, { "epoch": 0.02, "learning_rate": 0.0010367054610564011, "loss": 3.188, "step": 579 }, { "epoch": 0.02, "learning_rate": 0.0010384959713518353, "loss": 3.1761, "step": 580 }, { "epoch": 0.02, "learning_rate": 0.0010402864816472695, "loss": 3.0234, "step": 581 }, { "epoch": 0.02, "learning_rate": 0.0010420769919427038, "loss": 3.1539, "step": 582 }, { "epoch": 0.02, "learning_rate": 0.0010438675022381378, "loss": 3.2404, "step": 583 }, { "epoch": 0.02, "learning_rate": 0.0010456580125335721, "loss": 3.0502, "step": 584 }, { "epoch": 0.02, "learning_rate": 0.0010474485228290063, "loss": 3.1492, "step": 585 }, { "epoch": 0.02, "learning_rate": 0.0010492390331244407, "loss": 2.9362, "step": 586 }, { "epoch": 0.02, "learning_rate": 0.0010510295434198746, "loss": 3.3083, "step": 587 }, { "epoch": 0.02, "learning_rate": 0.001052820053715309, "loss": 3.0571, "step": 588 }, { "epoch": 0.02, "learning_rate": 0.0010546105640107432, "loss": 2.5231, "step": 589 }, { "epoch": 0.02, "learning_rate": 0.0010564010743061773, "loss": 2.922, "step": 590 }, { "epoch": 0.02, "learning_rate": 0.0010581915846016115, "loss": 2.9979, "step": 591 }, { "epoch": 0.02, "learning_rate": 0.0010599820948970458, "loss": 3.302, "step": 592 }, { "epoch": 0.02, "learning_rate": 0.0010617726051924798, "loss": 3.0749, "step": 593 }, { "epoch": 0.02, "learning_rate": 0.0010635631154879142, "loss": 2.9853, "step": 594 }, { "epoch": 0.02, "learning_rate": 0.0010653536257833483, "loss": 3.1422, "step": 595 }, { "epoch": 0.02, "learning_rate": 0.0010671441360787825, "loss": 2.8182, "step": 596 }, { "epoch": 0.02, "learning_rate": 0.0010689346463742166, "loss": 2.4912, "step": 597 }, { "epoch": 0.02, "learning_rate": 0.001070725156669651, "loss": 2.9133, "step": 598 }, { "epoch": 0.02, "learning_rate": 0.0010725156669650852, "loss": 3.2807, "step": 599 }, { "epoch": 0.02, "learning_rate": 0.0010743061772605193, "loss": 3.0849, "step": 600 }, { "epoch": 0.02, "learning_rate": 0.0010760966875559535, "loss": 2.7954, "step": 601 }, { "epoch": 0.02, "learning_rate": 0.0010778871978513876, "loss": 3.2443, "step": 602 }, { "epoch": 0.02, "learning_rate": 0.0010796777081468218, "loss": 2.5537, "step": 603 }, { "epoch": 0.02, "learning_rate": 0.001081468218442256, "loss": 2.9807, "step": 604 }, { "epoch": 0.02, "learning_rate": 0.0010832587287376903, "loss": 3.3966, "step": 605 }, { "epoch": 0.02, "learning_rate": 0.0010850492390331243, "loss": 3.1741, "step": 606 }, { "epoch": 0.02, "learning_rate": 0.0010868397493285587, "loss": 2.9869, "step": 607 }, { "epoch": 0.02, "learning_rate": 0.0010886302596239928, "loss": 3.0665, "step": 608 }, { "epoch": 0.02, "learning_rate": 0.001090420769919427, "loss": 3.012, "step": 609 }, { "epoch": 0.02, "learning_rate": 0.0010922112802148611, "loss": 3.2066, "step": 610 }, { "epoch": 0.02, "learning_rate": 0.0010940017905102955, "loss": 3.3281, "step": 611 }, { "epoch": 0.02, "learning_rate": 0.0010957923008057297, "loss": 3.0821, "step": 612 }, { "epoch": 0.02, "learning_rate": 0.0010975828111011638, "loss": 2.9335, "step": 613 }, { "epoch": 0.02, "learning_rate": 0.001099373321396598, "loss": 3.2701, "step": 614 }, { "epoch": 0.02, "learning_rate": 0.0011011638316920324, "loss": 3.246, "step": 615 }, { "epoch": 0.02, "learning_rate": 0.0011029543419874663, "loss": 3.0125, "step": 616 }, { "epoch": 0.02, "learning_rate": 0.0011047448522829007, "loss": 2.7121, "step": 617 }, { "epoch": 0.02, "learning_rate": 0.0011065353625783348, "loss": 2.9574, "step": 618 }, { "epoch": 0.02, "learning_rate": 0.001108325872873769, "loss": 3.1381, "step": 619 }, { "epoch": 0.02, "learning_rate": 0.0011101163831692031, "loss": 3.0214, "step": 620 }, { "epoch": 0.02, "learning_rate": 0.0011119068934646375, "loss": 3.0803, "step": 621 }, { "epoch": 0.02, "learning_rate": 0.0011136974037600715, "loss": 3.4239, "step": 622 }, { "epoch": 0.02, "learning_rate": 0.0011154879140555058, "loss": 2.7398, "step": 623 }, { "epoch": 0.02, "learning_rate": 0.00111727842435094, "loss": 3.0272, "step": 624 }, { "epoch": 0.02, "learning_rate": 0.0011190689346463744, "loss": 3.134, "step": 625 }, { "epoch": 0.02, "learning_rate": 0.0011208594449418083, "loss": 2.9826, "step": 626 }, { "epoch": 0.02, "learning_rate": 0.0011226499552372427, "loss": 3.5885, "step": 627 }, { "epoch": 0.02, "learning_rate": 0.0011244404655326768, "loss": 3.1614, "step": 628 }, { "epoch": 0.02, "learning_rate": 0.001126230975828111, "loss": 3.0917, "step": 629 }, { "epoch": 0.02, "learning_rate": 0.0011280214861235452, "loss": 3.2919, "step": 630 }, { "epoch": 0.02, "learning_rate": 0.0011298119964189795, "loss": 2.9722, "step": 631 }, { "epoch": 0.02, "learning_rate": 0.0011316025067144135, "loss": 2.899, "step": 632 }, { "epoch": 0.02, "learning_rate": 0.0011333930170098479, "loss": 3.27, "step": 633 }, { "epoch": 0.02, "learning_rate": 0.001135183527305282, "loss": 2.8951, "step": 634 }, { "epoch": 0.02, "learning_rate": 0.0011369740376007162, "loss": 3.1242, "step": 635 }, { "epoch": 0.02, "learning_rate": 0.0011387645478961503, "loss": 3.1584, "step": 636 }, { "epoch": 0.02, "learning_rate": 0.0011405550581915847, "loss": 2.8446, "step": 637 }, { "epoch": 0.02, "learning_rate": 0.0011423455684870189, "loss": 2.6843, "step": 638 }, { "epoch": 0.02, "learning_rate": 0.001144136078782453, "loss": 2.8268, "step": 639 }, { "epoch": 0.02, "learning_rate": 0.0011459265890778872, "loss": 2.6234, "step": 640 }, { "epoch": 0.02, "learning_rate": 0.0011477170993733216, "loss": 3.113, "step": 641 }, { "epoch": 0.02, "learning_rate": 0.0011495076096687555, "loss": 2.9994, "step": 642 }, { "epoch": 0.02, "learning_rate": 0.0011512981199641899, "loss": 2.7561, "step": 643 }, { "epoch": 0.02, "learning_rate": 0.001153088630259624, "loss": 2.7375, "step": 644 }, { "epoch": 0.02, "learning_rate": 0.0011548791405550582, "loss": 3.0852, "step": 645 }, { "epoch": 0.02, "learning_rate": 0.0011566696508504924, "loss": 3.0991, "step": 646 }, { "epoch": 0.02, "learning_rate": 0.0011584601611459267, "loss": 3.1126, "step": 647 }, { "epoch": 0.02, "learning_rate": 0.0011602506714413607, "loss": 2.9769, "step": 648 }, { "epoch": 0.02, "learning_rate": 0.001162041181736795, "loss": 3.0358, "step": 649 }, { "epoch": 0.02, "learning_rate": 0.0011638316920322292, "loss": 2.8115, "step": 650 }, { "epoch": 0.02, "learning_rate": 0.0011656222023276636, "loss": 3.0637, "step": 651 }, { "epoch": 0.02, "learning_rate": 0.0011674127126230975, "loss": 3.2342, "step": 652 }, { "epoch": 0.02, "learning_rate": 0.001169203222918532, "loss": 3.2154, "step": 653 }, { "epoch": 0.02, "learning_rate": 0.001170993733213966, "loss": 2.9512, "step": 654 }, { "epoch": 0.02, "learning_rate": 0.0011727842435094002, "loss": 3.1556, "step": 655 }, { "epoch": 0.02, "learning_rate": 0.0011745747538048344, "loss": 3.1786, "step": 656 }, { "epoch": 0.02, "learning_rate": 0.0011763652641002687, "loss": 2.9746, "step": 657 }, { "epoch": 0.02, "learning_rate": 0.0011781557743957027, "loss": 2.991, "step": 658 }, { "epoch": 0.02, "learning_rate": 0.001179946284691137, "loss": 3.1472, "step": 659 }, { "epoch": 0.02, "learning_rate": 0.0011817367949865712, "loss": 3.0777, "step": 660 }, { "epoch": 0.02, "learning_rate": 0.0011835273052820054, "loss": 2.9102, "step": 661 }, { "epoch": 0.02, "learning_rate": 0.0011853178155774395, "loss": 3.1299, "step": 662 }, { "epoch": 0.02, "learning_rate": 0.001187108325872874, "loss": 3.5082, "step": 663 }, { "epoch": 0.02, "learning_rate": 0.001188898836168308, "loss": 3.0491, "step": 664 }, { "epoch": 0.02, "learning_rate": 0.0011906893464637422, "loss": 3.1377, "step": 665 }, { "epoch": 0.02, "learning_rate": 0.0011924798567591764, "loss": 3.122, "step": 666 }, { "epoch": 0.02, "learning_rate": 0.0011942703670546108, "loss": 3.2087, "step": 667 }, { "epoch": 0.02, "learning_rate": 0.0011960608773500447, "loss": 2.9683, "step": 668 }, { "epoch": 0.02, "learning_rate": 0.001197851387645479, "loss": 3.0564, "step": 669 }, { "epoch": 0.02, "learning_rate": 0.0011996418979409132, "loss": 2.8713, "step": 670 }, { "epoch": 0.02, "learning_rate": 0.0012014324082363474, "loss": 2.9306, "step": 671 }, { "epoch": 0.02, "learning_rate": 0.0012032229185317816, "loss": 3.0644, "step": 672 }, { "epoch": 0.02, "learning_rate": 0.001205013428827216, "loss": 2.9973, "step": 673 }, { "epoch": 0.02, "learning_rate": 0.0012068039391226499, "loss": 3.1468, "step": 674 }, { "epoch": 0.02, "learning_rate": 0.0012085944494180842, "loss": 3.0212, "step": 675 }, { "epoch": 0.02, "learning_rate": 0.0012103849597135184, "loss": 2.9409, "step": 676 }, { "epoch": 0.02, "learning_rate": 0.0012121754700089528, "loss": 3.2535, "step": 677 }, { "epoch": 0.02, "learning_rate": 0.0012139659803043867, "loss": 3.138, "step": 678 }, { "epoch": 0.02, "learning_rate": 0.001215756490599821, "loss": 3.0041, "step": 679 }, { "epoch": 0.02, "learning_rate": 0.0012175470008952553, "loss": 3.1502, "step": 680 }, { "epoch": 0.02, "learning_rate": 0.0012193375111906894, "loss": 2.9993, "step": 681 }, { "epoch": 0.02, "learning_rate": 0.0012211280214861236, "loss": 2.9221, "step": 682 }, { "epoch": 0.02, "learning_rate": 0.001222918531781558, "loss": 3.2176, "step": 683 }, { "epoch": 0.02, "learning_rate": 0.0012247090420769919, "loss": 3.5158, "step": 684 }, { "epoch": 0.02, "learning_rate": 0.0012264995523724263, "loss": 2.9603, "step": 685 }, { "epoch": 0.02, "learning_rate": 0.0012282900626678604, "loss": 2.869, "step": 686 }, { "epoch": 0.02, "learning_rate": 0.0012300805729632946, "loss": 2.994, "step": 687 }, { "epoch": 0.02, "learning_rate": 0.0012318710832587287, "loss": 3.0858, "step": 688 }, { "epoch": 0.02, "learning_rate": 0.001233661593554163, "loss": 2.9306, "step": 689 }, { "epoch": 0.02, "learning_rate": 0.0012354521038495973, "loss": 2.9132, "step": 690 }, { "epoch": 0.02, "learning_rate": 0.0012372426141450312, "loss": 3.6906, "step": 691 }, { "epoch": 0.02, "learning_rate": 0.0012390331244404656, "loss": 3.3497, "step": 692 }, { "epoch": 0.02, "learning_rate": 0.0012408236347358997, "loss": 2.9572, "step": 693 }, { "epoch": 0.02, "learning_rate": 0.001242614145031334, "loss": 2.937, "step": 694 }, { "epoch": 0.02, "learning_rate": 0.001244404655326768, "loss": 3.0086, "step": 695 }, { "epoch": 0.02, "learning_rate": 0.0012461951656222024, "loss": 2.9799, "step": 696 }, { "epoch": 0.02, "learning_rate": 0.0012479856759176364, "loss": 2.521, "step": 697 }, { "epoch": 0.02, "learning_rate": 0.0012497761862130708, "loss": 3.2311, "step": 698 }, { "epoch": 0.02, "learning_rate": 0.001251566696508505, "loss": 3.0671, "step": 699 }, { "epoch": 0.02, "learning_rate": 0.001253357206803939, "loss": 2.9271, "step": 700 }, { "epoch": 0.02, "learning_rate": 0.0012551477170993732, "loss": 2.8768, "step": 701 }, { "epoch": 0.02, "learning_rate": 0.0012569382273948076, "loss": 3.0956, "step": 702 }, { "epoch": 0.02, "learning_rate": 0.0012587287376902415, "loss": 3.0784, "step": 703 }, { "epoch": 0.02, "learning_rate": 0.001260519247985676, "loss": 2.4724, "step": 704 }, { "epoch": 0.02, "learning_rate": 0.00126230975828111, "loss": 3.0196, "step": 705 }, { "epoch": 0.02, "learning_rate": 0.0012641002685765445, "loss": 2.9604, "step": 706 }, { "epoch": 0.02, "learning_rate": 0.0012658907788719784, "loss": 3.0084, "step": 707 }, { "epoch": 0.02, "learning_rate": 0.0012676812891674128, "loss": 2.7038, "step": 708 }, { "epoch": 0.02, "learning_rate": 0.001269471799462847, "loss": 2.9453, "step": 709 }, { "epoch": 0.02, "learning_rate": 0.001271262309758281, "loss": 3.2443, "step": 710 }, { "epoch": 0.02, "learning_rate": 0.0012730528200537152, "loss": 3.0389, "step": 711 }, { "epoch": 0.02, "learning_rate": 0.0012748433303491496, "loss": 3.2961, "step": 712 }, { "epoch": 0.02, "learning_rate": 0.0012766338406445836, "loss": 3.0314, "step": 713 }, { "epoch": 0.02, "learning_rate": 0.001278424350940018, "loss": 2.9929, "step": 714 }, { "epoch": 0.02, "learning_rate": 0.001280214861235452, "loss": 3.2547, "step": 715 }, { "epoch": 0.02, "learning_rate": 0.0012820053715308863, "loss": 3.4342, "step": 716 }, { "epoch": 0.02, "learning_rate": 0.0012837958818263204, "loss": 3.0363, "step": 717 }, { "epoch": 0.02, "learning_rate": 0.0012855863921217548, "loss": 3.1313, "step": 718 }, { "epoch": 0.02, "learning_rate": 0.001287376902417189, "loss": 2.9444, "step": 719 }, { "epoch": 0.02, "learning_rate": 0.0012891674127126231, "loss": 3.3177, "step": 720 }, { "epoch": 0.02, "learning_rate": 0.0012909579230080573, "loss": 2.9526, "step": 721 }, { "epoch": 0.02, "learning_rate": 0.0012927484333034916, "loss": 3.0659, "step": 722 }, { "epoch": 0.02, "learning_rate": 0.0012945389435989256, "loss": 3.2577, "step": 723 }, { "epoch": 0.02, "learning_rate": 0.00129632945389436, "loss": 2.9366, "step": 724 }, { "epoch": 0.02, "learning_rate": 0.0012981199641897941, "loss": 3.2847, "step": 725 }, { "epoch": 0.02, "learning_rate": 0.0012999104744852283, "loss": 3.0575, "step": 726 }, { "epoch": 0.02, "learning_rate": 0.0013017009847806624, "loss": 3.0766, "step": 727 }, { "epoch": 0.02, "learning_rate": 0.0013034914950760968, "loss": 3.6822, "step": 728 }, { "epoch": 0.02, "learning_rate": 0.0013052820053715308, "loss": 3.1488, "step": 729 }, { "epoch": 0.02, "learning_rate": 0.0013070725156669651, "loss": 3.5179, "step": 730 }, { "epoch": 0.02, "learning_rate": 0.0013088630259623993, "loss": 3.2128, "step": 731 }, { "epoch": 0.02, "learning_rate": 0.0013106535362578337, "loss": 3.0216, "step": 732 }, { "epoch": 0.02, "learning_rate": 0.0013124440465532676, "loss": 3.222, "step": 733 }, { "epoch": 0.02, "learning_rate": 0.001314234556848702, "loss": 3.0193, "step": 734 }, { "epoch": 0.02, "learning_rate": 0.0013160250671441361, "loss": 3.1145, "step": 735 }, { "epoch": 0.02, "learning_rate": 0.0013178155774395703, "loss": 3.1324, "step": 736 }, { "epoch": 0.02, "learning_rate": 0.0013196060877350045, "loss": 3.2207, "step": 737 }, { "epoch": 0.02, "learning_rate": 0.0013213965980304388, "loss": 3.0572, "step": 738 }, { "epoch": 0.02, "learning_rate": 0.0013231871083258728, "loss": 3.135, "step": 739 }, { "epoch": 0.02, "learning_rate": 0.0013249776186213071, "loss": 2.8383, "step": 740 }, { "epoch": 0.02, "learning_rate": 0.0013267681289167413, "loss": 2.9127, "step": 741 }, { "epoch": 0.02, "learning_rate": 0.0013285586392121755, "loss": 3.4213, "step": 742 }, { "epoch": 0.02, "learning_rate": 0.0013303491495076096, "loss": 2.5194, "step": 743 }, { "epoch": 0.02, "learning_rate": 0.001332139659803044, "loss": 3.1198, "step": 744 }, { "epoch": 0.02, "learning_rate": 0.0013339301700984782, "loss": 2.7389, "step": 745 }, { "epoch": 0.02, "learning_rate": 0.0013357206803939123, "loss": 2.8883, "step": 746 }, { "epoch": 0.02, "learning_rate": 0.0013375111906893465, "loss": 3.4741, "step": 747 }, { "epoch": 0.02, "learning_rate": 0.0013393017009847808, "loss": 3.1125, "step": 748 }, { "epoch": 0.02, "learning_rate": 0.0013410922112802148, "loss": 3.1103, "step": 749 }, { "epoch": 0.02, "learning_rate": 0.0013428827215756492, "loss": 3.2014, "step": 750 }, { "epoch": 0.02, "learning_rate": 0.0013446732318710833, "loss": 3.0973, "step": 751 }, { "epoch": 0.02, "learning_rate": 0.0013464637421665175, "loss": 2.5428, "step": 752 }, { "epoch": 0.02, "learning_rate": 0.0013482542524619516, "loss": 2.7931, "step": 753 }, { "epoch": 0.02, "learning_rate": 0.001350044762757386, "loss": 3.3219, "step": 754 }, { "epoch": 0.02, "learning_rate": 0.00135183527305282, "loss": 2.8146, "step": 755 }, { "epoch": 0.02, "learning_rate": 0.0013536257833482543, "loss": 3.0516, "step": 756 }, { "epoch": 0.02, "learning_rate": 0.0013554162936436885, "loss": 3.0369, "step": 757 }, { "epoch": 0.02, "learning_rate": 0.0013572068039391229, "loss": 3.1963, "step": 758 }, { "epoch": 0.02, "learning_rate": 0.0013589973142345568, "loss": 3.1214, "step": 759 }, { "epoch": 0.02, "learning_rate": 0.0013607878245299912, "loss": 3.1769, "step": 760 }, { "epoch": 0.02, "learning_rate": 0.0013625783348254253, "loss": 2.8255, "step": 761 }, { "epoch": 0.02, "learning_rate": 0.0013643688451208595, "loss": 2.8414, "step": 762 }, { "epoch": 0.02, "learning_rate": 0.0013661593554162937, "loss": 3.0994, "step": 763 }, { "epoch": 0.02, "learning_rate": 0.001367949865711728, "loss": 2.89, "step": 764 }, { "epoch": 0.02, "learning_rate": 0.001369740376007162, "loss": 2.7897, "step": 765 }, { "epoch": 0.02, "learning_rate": 0.0013715308863025963, "loss": 2.9747, "step": 766 }, { "epoch": 0.02, "learning_rate": 0.0013733213965980305, "loss": 3.0805, "step": 767 }, { "epoch": 0.02, "learning_rate": 0.0013751119068934647, "loss": 3.0227, "step": 768 }, { "epoch": 0.02, "learning_rate": 0.0013769024171888988, "loss": 3.0051, "step": 769 }, { "epoch": 0.02, "learning_rate": 0.0013786929274843332, "loss": 3.1259, "step": 770 }, { "epoch": 0.02, "learning_rate": 0.0013804834377797674, "loss": 2.9011, "step": 771 }, { "epoch": 0.02, "learning_rate": 0.0013822739480752015, "loss": 3.1323, "step": 772 }, { "epoch": 0.02, "learning_rate": 0.0013840644583706357, "loss": 2.5573, "step": 773 }, { "epoch": 0.02, "learning_rate": 0.0013858549686660698, "loss": 3.338, "step": 774 }, { "epoch": 0.02, "learning_rate": 0.001387645478961504, "loss": 3.1688, "step": 775 }, { "epoch": 0.02, "learning_rate": 0.0013894359892569381, "loss": 3.1004, "step": 776 }, { "epoch": 0.02, "learning_rate": 0.0013912264995523725, "loss": 3.0332, "step": 777 }, { "epoch": 0.02, "learning_rate": 0.0013930170098478065, "loss": 2.6528, "step": 778 }, { "epoch": 0.02, "learning_rate": 0.0013948075201432408, "loss": 3.0754, "step": 779 }, { "epoch": 0.02, "learning_rate": 0.001396598030438675, "loss": 2.8338, "step": 780 }, { "epoch": 0.02, "learning_rate": 0.0013983885407341092, "loss": 3.1009, "step": 781 }, { "epoch": 0.02, "learning_rate": 0.0014001790510295433, "loss": 2.914, "step": 782 }, { "epoch": 0.02, "learning_rate": 0.0014019695613249777, "loss": 3.3243, "step": 783 }, { "epoch": 0.02, "learning_rate": 0.0014037600716204118, "loss": 2.6732, "step": 784 }, { "epoch": 0.02, "learning_rate": 0.001405550581915846, "loss": 2.8511, "step": 785 }, { "epoch": 0.02, "learning_rate": 0.0014073410922112802, "loss": 2.977, "step": 786 }, { "epoch": 0.02, "learning_rate": 0.0014091316025067145, "loss": 2.9137, "step": 787 }, { "epoch": 0.02, "learning_rate": 0.0014109221128021485, "loss": 2.9553, "step": 788 }, { "epoch": 0.02, "learning_rate": 0.0014127126230975829, "loss": 3.3546, "step": 789 }, { "epoch": 0.02, "learning_rate": 0.001414503133393017, "loss": 2.9064, "step": 790 }, { "epoch": 0.02, "learning_rate": 0.0014162936436884512, "loss": 3.1972, "step": 791 }, { "epoch": 0.02, "learning_rate": 0.0014180841539838853, "loss": 2.9635, "step": 792 }, { "epoch": 0.02, "learning_rate": 0.0014198746642793197, "loss": 2.6947, "step": 793 }, { "epoch": 0.02, "learning_rate": 0.0014216651745747536, "loss": 2.8379, "step": 794 }, { "epoch": 0.02, "learning_rate": 0.001423455684870188, "loss": 2.8606, "step": 795 }, { "epoch": 0.02, "learning_rate": 0.0014252461951656222, "loss": 2.8528, "step": 796 }, { "epoch": 0.02, "learning_rate": 0.0014270367054610566, "loss": 3.0627, "step": 797 }, { "epoch": 0.02, "learning_rate": 0.0014288272157564905, "loss": 2.7937, "step": 798 }, { "epoch": 0.02, "learning_rate": 0.0014306177260519249, "loss": 2.7733, "step": 799 }, { "epoch": 0.02, "learning_rate": 0.001432408236347359, "loss": 2.9113, "step": 800 }, { "epoch": 0.02, "learning_rate": 0.0014341987466427932, "loss": 3.1064, "step": 801 }, { "epoch": 0.02, "learning_rate": 0.0014359892569382274, "loss": 3.0906, "step": 802 }, { "epoch": 0.02, "learning_rate": 0.0014377797672336617, "loss": 2.8816, "step": 803 }, { "epoch": 0.02, "learning_rate": 0.0014395702775290957, "loss": 2.9152, "step": 804 }, { "epoch": 0.02, "learning_rate": 0.00144136078782453, "loss": 2.5105, "step": 805 }, { "epoch": 0.02, "learning_rate": 0.0014431512981199642, "loss": 3.1448, "step": 806 }, { "epoch": 0.02, "learning_rate": 0.0014449418084153984, "loss": 2.6824, "step": 807 }, { "epoch": 0.02, "learning_rate": 0.0014467323187108325, "loss": 3.2022, "step": 808 }, { "epoch": 0.02, "learning_rate": 0.001448522829006267, "loss": 2.7443, "step": 809 }, { "epoch": 0.02, "learning_rate": 0.001450313339301701, "loss": 2.9053, "step": 810 }, { "epoch": 0.02, "learning_rate": 0.0014521038495971352, "loss": 3.2299, "step": 811 }, { "epoch": 0.02, "learning_rate": 0.0014538943598925694, "loss": 3.1168, "step": 812 }, { "epoch": 0.02, "learning_rate": 0.0014556848701880037, "loss": 2.8397, "step": 813 }, { "epoch": 0.02, "learning_rate": 0.0014574753804834377, "loss": 3.165, "step": 814 }, { "epoch": 0.02, "learning_rate": 0.001459265890778872, "loss": 3.0899, "step": 815 }, { "epoch": 0.02, "learning_rate": 0.0014610564010743062, "loss": 3.2855, "step": 816 }, { "epoch": 0.02, "learning_rate": 0.0014628469113697404, "loss": 2.6166, "step": 817 }, { "epoch": 0.02, "learning_rate": 0.0014646374216651745, "loss": 2.9365, "step": 818 }, { "epoch": 0.02, "learning_rate": 0.001466427931960609, "loss": 2.5891, "step": 819 }, { "epoch": 0.02, "learning_rate": 0.0014682184422560429, "loss": 2.9735, "step": 820 }, { "epoch": 0.02, "learning_rate": 0.0014700089525514772, "loss": 3.2057, "step": 821 }, { "epoch": 0.02, "learning_rate": 0.0014717994628469114, "loss": 2.9763, "step": 822 }, { "epoch": 0.02, "learning_rate": 0.0014735899731423458, "loss": 2.9591, "step": 823 }, { "epoch": 0.02, "learning_rate": 0.0014753804834377797, "loss": 3.1378, "step": 824 }, { "epoch": 0.02, "learning_rate": 0.001477170993733214, "loss": 2.7631, "step": 825 }, { "epoch": 0.02, "learning_rate": 0.0014789615040286482, "loss": 2.712, "step": 826 }, { "epoch": 0.02, "learning_rate": 0.0014807520143240824, "loss": 2.8613, "step": 827 }, { "epoch": 0.02, "learning_rate": 0.0014825425246195166, "loss": 2.8172, "step": 828 }, { "epoch": 0.02, "learning_rate": 0.001484333034914951, "loss": 3.0149, "step": 829 }, { "epoch": 0.02, "learning_rate": 0.0014861235452103849, "loss": 2.9344, "step": 830 }, { "epoch": 0.02, "learning_rate": 0.0014879140555058192, "loss": 2.8955, "step": 831 }, { "epoch": 0.02, "learning_rate": 0.0014897045658012534, "loss": 3.0717, "step": 832 }, { "epoch": 0.02, "learning_rate": 0.0014914950760966876, "loss": 2.987, "step": 833 }, { "epoch": 0.02, "learning_rate": 0.0014932855863921217, "loss": 2.7203, "step": 834 }, { "epoch": 0.02, "learning_rate": 0.001495076096687556, "loss": 3.0006, "step": 835 }, { "epoch": 0.02, "learning_rate": 0.0014968666069829903, "loss": 2.7462, "step": 836 }, { "epoch": 0.02, "learning_rate": 0.0014986571172784244, "loss": 3.2753, "step": 837 }, { "epoch": 0.02, "learning_rate": 0.0015004476275738586, "loss": 3.0293, "step": 838 }, { "epoch": 0.02, "learning_rate": 0.001502238137869293, "loss": 3.1166, "step": 839 }, { "epoch": 0.02, "learning_rate": 0.0015040286481647269, "loss": 2.9117, "step": 840 }, { "epoch": 0.02, "learning_rate": 0.0015058191584601613, "loss": 3.0017, "step": 841 }, { "epoch": 0.02, "learning_rate": 0.0015076096687555954, "loss": 3.2975, "step": 842 }, { "epoch": 0.02, "learning_rate": 0.0015094001790510296, "loss": 2.6791, "step": 843 }, { "epoch": 0.02, "learning_rate": 0.0015111906893464637, "loss": 3.0283, "step": 844 }, { "epoch": 0.02, "learning_rate": 0.0015129811996418981, "loss": 3.2143, "step": 845 }, { "epoch": 0.02, "learning_rate": 0.001514771709937332, "loss": 2.6444, "step": 846 }, { "epoch": 0.02, "learning_rate": 0.0015165622202327664, "loss": 3.0716, "step": 847 }, { "epoch": 0.02, "learning_rate": 0.0015183527305282006, "loss": 3.3214, "step": 848 }, { "epoch": 0.02, "learning_rate": 0.001520143240823635, "loss": 3.3072, "step": 849 }, { "epoch": 0.02, "learning_rate": 0.001521933751119069, "loss": 3.0511, "step": 850 }, { "epoch": 0.02, "learning_rate": 0.0015237242614145033, "loss": 3.2943, "step": 851 }, { "epoch": 0.02, "learning_rate": 0.0015255147717099374, "loss": 2.6775, "step": 852 }, { "epoch": 0.02, "learning_rate": 0.0015273052820053716, "loss": 3.4816, "step": 853 }, { "epoch": 0.02, "learning_rate": 0.0015290957923008058, "loss": 3.1206, "step": 854 }, { "epoch": 0.02, "learning_rate": 0.0015308863025962401, "loss": 2.6644, "step": 855 }, { "epoch": 0.02, "learning_rate": 0.001532676812891674, "loss": 2.7555, "step": 856 }, { "epoch": 0.02, "learning_rate": 0.0015344673231871084, "loss": 2.8915, "step": 857 }, { "epoch": 0.02, "learning_rate": 0.0015362578334825426, "loss": 3.3381, "step": 858 }, { "epoch": 0.02, "learning_rate": 0.0015380483437779768, "loss": 2.8096, "step": 859 }, { "epoch": 0.02, "learning_rate": 0.001539838854073411, "loss": 2.8366, "step": 860 }, { "epoch": 0.02, "learning_rate": 0.001541629364368845, "loss": 2.9588, "step": 861 }, { "epoch": 0.02, "learning_rate": 0.0015434198746642795, "loss": 3.2669, "step": 862 }, { "epoch": 0.02, "learning_rate": 0.0015452103849597134, "loss": 2.8403, "step": 863 }, { "epoch": 0.02, "learning_rate": 0.0015470008952551478, "loss": 2.6163, "step": 864 }, { "epoch": 0.02, "learning_rate": 0.001548791405550582, "loss": 3.0528, "step": 865 }, { "epoch": 0.02, "learning_rate": 0.001550581915846016, "loss": 2.8563, "step": 866 }, { "epoch": 0.02, "learning_rate": 0.0015523724261414502, "loss": 2.8836, "step": 867 }, { "epoch": 0.02, "learning_rate": 0.0015541629364368846, "loss": 2.9604, "step": 868 }, { "epoch": 0.02, "learning_rate": 0.0015559534467323186, "loss": 3.0629, "step": 869 }, { "epoch": 0.02, "learning_rate": 0.001557743957027753, "loss": 2.8225, "step": 870 }, { "epoch": 0.02, "learning_rate": 0.001559534467323187, "loss": 2.826, "step": 871 }, { "epoch": 0.02, "learning_rate": 0.0015613249776186213, "loss": 2.6514, "step": 872 }, { "epoch": 0.02, "learning_rate": 0.0015631154879140554, "loss": 2.5678, "step": 873 }, { "epoch": 0.02, "learning_rate": 0.0015649059982094898, "loss": 3.4262, "step": 874 }, { "epoch": 0.02, "learning_rate": 0.001566696508504924, "loss": 3.1022, "step": 875 }, { "epoch": 0.02, "learning_rate": 0.001568487018800358, "loss": 3.0311, "step": 876 }, { "epoch": 0.02, "learning_rate": 0.0015702775290957923, "loss": 3.1829, "step": 877 }, { "epoch": 0.02, "learning_rate": 0.0015720680393912266, "loss": 3.0158, "step": 878 }, { "epoch": 0.02, "learning_rate": 0.0015738585496866606, "loss": 2.9941, "step": 879 }, { "epoch": 0.02, "learning_rate": 0.001575649059982095, "loss": 2.9966, "step": 880 }, { "epoch": 0.02, "learning_rate": 0.0015774395702775291, "loss": 3.018, "step": 881 }, { "epoch": 0.02, "learning_rate": 0.0015792300805729633, "loss": 2.5467, "step": 882 }, { "epoch": 0.02, "learning_rate": 0.0015810205908683974, "loss": 2.4611, "step": 883 }, { "epoch": 0.02, "learning_rate": 0.0015828111011638318, "loss": 2.97, "step": 884 }, { "epoch": 0.02, "learning_rate": 0.0015846016114592658, "loss": 2.9436, "step": 885 }, { "epoch": 0.02, "learning_rate": 0.0015863921217547001, "loss": 2.9737, "step": 886 }, { "epoch": 0.02, "learning_rate": 0.0015881826320501343, "loss": 2.7776, "step": 887 }, { "epoch": 0.02, "learning_rate": 0.0015899731423455687, "loss": 2.8749, "step": 888 }, { "epoch": 0.02, "learning_rate": 0.0015917636526410026, "loss": 3.1012, "step": 889 }, { "epoch": 0.02, "learning_rate": 0.001593554162936437, "loss": 3.0227, "step": 890 }, { "epoch": 0.02, "learning_rate": 0.0015953446732318711, "loss": 2.913, "step": 891 }, { "epoch": 0.02, "learning_rate": 0.0015971351835273053, "loss": 2.8145, "step": 892 }, { "epoch": 0.02, "learning_rate": 0.0015989256938227395, "loss": 2.8184, "step": 893 }, { "epoch": 0.02, "learning_rate": 0.0016007162041181738, "loss": 3.052, "step": 894 }, { "epoch": 0.02, "learning_rate": 0.0016025067144136078, "loss": 2.8674, "step": 895 }, { "epoch": 0.02, "learning_rate": 0.0016042972247090421, "loss": 2.8385, "step": 896 }, { "epoch": 0.02, "learning_rate": 0.0016060877350044763, "loss": 2.6831, "step": 897 }, { "epoch": 0.02, "learning_rate": 0.0016078782452999105, "loss": 2.682, "step": 898 }, { "epoch": 0.02, "learning_rate": 0.0016096687555953446, "loss": 3.3527, "step": 899 }, { "epoch": 0.02, "learning_rate": 0.001611459265890779, "loss": 2.8256, "step": 900 }, { "epoch": 0.02, "learning_rate": 0.0016132497761862132, "loss": 3.2997, "step": 901 }, { "epoch": 0.02, "learning_rate": 0.0016150402864816473, "loss": 3.0012, "step": 902 }, { "epoch": 0.02, "learning_rate": 0.0016168307967770815, "loss": 3.1225, "step": 903 }, { "epoch": 0.02, "learning_rate": 0.0016186213070725158, "loss": 2.8413, "step": 904 }, { "epoch": 0.02, "learning_rate": 0.0016204118173679498, "loss": 2.8896, "step": 905 }, { "epoch": 0.02, "learning_rate": 0.0016222023276633842, "loss": 3.1583, "step": 906 }, { "epoch": 0.02, "learning_rate": 0.0016239928379588183, "loss": 2.8161, "step": 907 }, { "epoch": 0.02, "learning_rate": 0.0016257833482542525, "loss": 3.2538, "step": 908 }, { "epoch": 0.02, "learning_rate": 0.0016275738585496866, "loss": 2.8083, "step": 909 }, { "epoch": 0.02, "learning_rate": 0.001629364368845121, "loss": 2.9282, "step": 910 }, { "epoch": 0.02, "learning_rate": 0.001631154879140555, "loss": 2.8539, "step": 911 }, { "epoch": 0.02, "learning_rate": 0.0016329453894359893, "loss": 2.85, "step": 912 }, { "epoch": 0.02, "learning_rate": 0.0016347358997314235, "loss": 2.5489, "step": 913 }, { "epoch": 0.02, "learning_rate": 0.0016365264100268579, "loss": 3.0661, "step": 914 }, { "epoch": 0.02, "learning_rate": 0.0016383169203222918, "loss": 3.2183, "step": 915 }, { "epoch": 0.02, "learning_rate": 0.0016401074306177262, "loss": 2.7266, "step": 916 }, { "epoch": 0.02, "learning_rate": 0.0016418979409131603, "loss": 2.9193, "step": 917 }, { "epoch": 0.02, "learning_rate": 0.0016436884512085945, "loss": 2.8377, "step": 918 }, { "epoch": 0.02, "learning_rate": 0.0016454789615040287, "loss": 3.2445, "step": 919 }, { "epoch": 0.02, "learning_rate": 0.001647269471799463, "loss": 3.0459, "step": 920 }, { "epoch": 0.02, "learning_rate": 0.001649059982094897, "loss": 3.4266, "step": 921 }, { "epoch": 0.02, "learning_rate": 0.0016508504923903313, "loss": 3.2444, "step": 922 }, { "epoch": 0.02, "learning_rate": 0.0016526410026857655, "loss": 2.6663, "step": 923 }, { "epoch": 0.02, "learning_rate": 0.0016544315129811997, "loss": 3.2841, "step": 924 }, { "epoch": 0.02, "learning_rate": 0.0016562220232766338, "loss": 2.8768, "step": 925 }, { "epoch": 0.02, "learning_rate": 0.0016580125335720682, "loss": 3.0439, "step": 926 }, { "epoch": 0.02, "learning_rate": 0.0016598030438675024, "loss": 3.4424, "step": 927 }, { "epoch": 0.02, "learning_rate": 0.0016615935541629365, "loss": 2.6921, "step": 928 }, { "epoch": 0.02, "learning_rate": 0.0016633840644583707, "loss": 3.1254, "step": 929 }, { "epoch": 0.02, "learning_rate": 0.001665174574753805, "loss": 2.9349, "step": 930 }, { "epoch": 0.03, "learning_rate": 0.001666965085049239, "loss": 2.7176, "step": 931 }, { "epoch": 0.03, "learning_rate": 0.0016687555953446734, "loss": 2.9824, "step": 932 }, { "epoch": 0.03, "learning_rate": 0.0016705461056401075, "loss": 3.2495, "step": 933 }, { "epoch": 0.03, "learning_rate": 0.0016723366159355417, "loss": 2.8437, "step": 934 }, { "epoch": 0.03, "learning_rate": 0.0016741271262309758, "loss": 3.143, "step": 935 }, { "epoch": 0.03, "learning_rate": 0.0016759176365264102, "loss": 3.1234, "step": 936 }, { "epoch": 0.03, "learning_rate": 0.0016777081468218442, "loss": 2.6919, "step": 937 }, { "epoch": 0.03, "learning_rate": 0.0016794986571172785, "loss": 3.1395, "step": 938 }, { "epoch": 0.03, "learning_rate": 0.0016812891674127127, "loss": 3.3771, "step": 939 }, { "epoch": 0.03, "learning_rate": 0.001683079677708147, "loss": 2.5294, "step": 940 }, { "epoch": 0.03, "learning_rate": 0.001684870188003581, "loss": 2.8449, "step": 941 }, { "epoch": 0.03, "learning_rate": 0.0016866606982990154, "loss": 2.6461, "step": 942 }, { "epoch": 0.03, "learning_rate": 0.0016884512085944495, "loss": 2.6486, "step": 943 }, { "epoch": 0.03, "learning_rate": 0.0016902417188898837, "loss": 3.0296, "step": 944 }, { "epoch": 0.03, "learning_rate": 0.0016920322291853179, "loss": 2.6314, "step": 945 }, { "epoch": 0.03, "learning_rate": 0.001693822739480752, "loss": 2.8845, "step": 946 }, { "epoch": 0.03, "learning_rate": 0.0016956132497761862, "loss": 2.7511, "step": 947 }, { "epoch": 0.03, "learning_rate": 0.0016974037600716203, "loss": 3.2578, "step": 948 }, { "epoch": 0.03, "learning_rate": 0.0016991942703670547, "loss": 3.0211, "step": 949 }, { "epoch": 0.03, "learning_rate": 0.0017009847806624886, "loss": 2.8322, "step": 950 }, { "epoch": 0.03, "learning_rate": 0.001702775290957923, "loss": 3.3315, "step": 951 }, { "epoch": 0.03, "learning_rate": 0.0017045658012533572, "loss": 3.275, "step": 952 }, { "epoch": 0.03, "learning_rate": 0.0017063563115487916, "loss": 2.7457, "step": 953 }, { "epoch": 0.03, "learning_rate": 0.0017081468218442255, "loss": 2.96, "step": 954 }, { "epoch": 0.03, "learning_rate": 0.0017099373321396599, "loss": 2.8708, "step": 955 }, { "epoch": 0.03, "learning_rate": 0.001711727842435094, "loss": 2.9006, "step": 956 }, { "epoch": 0.03, "learning_rate": 0.0017135183527305282, "loss": 2.6801, "step": 957 }, { "epoch": 0.03, "learning_rate": 0.0017153088630259623, "loss": 2.9447, "step": 958 }, { "epoch": 0.03, "learning_rate": 0.0017170993733213967, "loss": 2.8904, "step": 959 }, { "epoch": 0.03, "learning_rate": 0.0017188898836168307, "loss": 2.9695, "step": 960 }, { "epoch": 0.03, "learning_rate": 0.001720680393912265, "loss": 3.1627, "step": 961 }, { "epoch": 0.03, "learning_rate": 0.0017224709042076992, "loss": 3.0276, "step": 962 }, { "epoch": 0.03, "learning_rate": 0.0017242614145031334, "loss": 2.8813, "step": 963 }, { "epoch": 0.03, "learning_rate": 0.0017260519247985675, "loss": 2.5968, "step": 964 }, { "epoch": 0.03, "learning_rate": 0.001727842435094002, "loss": 2.7712, "step": 965 }, { "epoch": 0.03, "learning_rate": 0.0017296329453894358, "loss": 2.9337, "step": 966 }, { "epoch": 0.03, "learning_rate": 0.0017314234556848702, "loss": 3.1013, "step": 967 }, { "epoch": 0.03, "learning_rate": 0.0017332139659803044, "loss": 2.8767, "step": 968 }, { "epoch": 0.03, "learning_rate": 0.0017350044762757387, "loss": 2.8672, "step": 969 }, { "epoch": 0.03, "learning_rate": 0.0017367949865711727, "loss": 2.642, "step": 970 }, { "epoch": 0.03, "learning_rate": 0.001738585496866607, "loss": 3.3815, "step": 971 }, { "epoch": 0.03, "learning_rate": 0.0017403760071620412, "loss": 3.249, "step": 972 }, { "epoch": 0.03, "learning_rate": 0.0017421665174574754, "loss": 2.9024, "step": 973 }, { "epoch": 0.03, "learning_rate": 0.0017439570277529095, "loss": 2.9573, "step": 974 }, { "epoch": 0.03, "learning_rate": 0.001745747538048344, "loss": 3.0669, "step": 975 }, { "epoch": 0.03, "learning_rate": 0.0017475380483437779, "loss": 2.8647, "step": 976 }, { "epoch": 0.03, "learning_rate": 0.0017493285586392122, "loss": 2.6503, "step": 977 }, { "epoch": 0.03, "learning_rate": 0.0017511190689346464, "loss": 3.2259, "step": 978 }, { "epoch": 0.03, "learning_rate": 0.0017529095792300808, "loss": 3.1582, "step": 979 }, { "epoch": 0.03, "learning_rate": 0.0017547000895255147, "loss": 3.3876, "step": 980 }, { "epoch": 0.03, "learning_rate": 0.001756490599820949, "loss": 3.454, "step": 981 }, { "epoch": 0.03, "learning_rate": 0.0017582811101163832, "loss": 2.9204, "step": 982 }, { "epoch": 0.03, "learning_rate": 0.0017600716204118174, "loss": 2.9245, "step": 983 }, { "epoch": 0.03, "learning_rate": 0.0017618621307072516, "loss": 2.8441, "step": 984 }, { "epoch": 0.03, "learning_rate": 0.001763652641002686, "loss": 2.7282, "step": 985 }, { "epoch": 0.03, "learning_rate": 0.0017654431512981199, "loss": 2.7774, "step": 986 }, { "epoch": 0.03, "learning_rate": 0.0017672336615935542, "loss": 2.7873, "step": 987 }, { "epoch": 0.03, "learning_rate": 0.0017690241718889884, "loss": 3.0489, "step": 988 }, { "epoch": 0.03, "learning_rate": 0.0017708146821844226, "loss": 2.947, "step": 989 }, { "epoch": 0.03, "learning_rate": 0.0017726051924798567, "loss": 2.6735, "step": 990 }, { "epoch": 0.03, "learning_rate": 0.001774395702775291, "loss": 3.0439, "step": 991 }, { "epoch": 0.03, "learning_rate": 0.001776186213070725, "loss": 2.8365, "step": 992 }, { "epoch": 0.03, "learning_rate": 0.0017779767233661594, "loss": 3.2071, "step": 993 }, { "epoch": 0.03, "learning_rate": 0.0017797672336615936, "loss": 2.7233, "step": 994 }, { "epoch": 0.03, "learning_rate": 0.001781557743957028, "loss": 3.0594, "step": 995 }, { "epoch": 0.03, "learning_rate": 0.0017833482542524619, "loss": 3.1834, "step": 996 }, { "epoch": 0.03, "learning_rate": 0.0017851387645478963, "loss": 2.7202, "step": 997 }, { "epoch": 0.03, "learning_rate": 0.0017869292748433304, "loss": 2.7948, "step": 998 }, { "epoch": 0.03, "learning_rate": 0.0017887197851387646, "loss": 2.7038, "step": 999 }, { "epoch": 0.03, "learning_rate": 0.0017905102954341987, "loss": 2.9279, "step": 1000 }, { "epoch": 0.03, "learning_rate": 0.0017923008057296331, "loss": 2.6936, "step": 1001 }, { "epoch": 0.03, "learning_rate": 0.001794091316025067, "loss": 3.1465, "step": 1002 }, { "epoch": 0.03, "learning_rate": 0.0017958818263205014, "loss": 2.8872, "step": 1003 }, { "epoch": 0.03, "learning_rate": 0.0017976723366159356, "loss": 2.869, "step": 1004 }, { "epoch": 0.03, "learning_rate": 0.00179946284691137, "loss": 2.6008, "step": 1005 }, { "epoch": 0.03, "learning_rate": 0.001801253357206804, "loss": 3.3484, "step": 1006 }, { "epoch": 0.03, "learning_rate": 0.0018030438675022383, "loss": 2.735, "step": 1007 }, { "epoch": 0.03, "learning_rate": 0.0018048343777976724, "loss": 3.2924, "step": 1008 }, { "epoch": 0.03, "learning_rate": 0.0018066248880931066, "loss": 2.5632, "step": 1009 }, { "epoch": 0.03, "learning_rate": 0.0018084153983885408, "loss": 2.819, "step": 1010 }, { "epoch": 0.03, "learning_rate": 0.0018102059086839751, "loss": 2.8791, "step": 1011 }, { "epoch": 0.03, "learning_rate": 0.001811996418979409, "loss": 2.5739, "step": 1012 }, { "epoch": 0.03, "learning_rate": 0.0018137869292748434, "loss": 2.8974, "step": 1013 }, { "epoch": 0.03, "learning_rate": 0.0018155774395702776, "loss": 2.6427, "step": 1014 }, { "epoch": 0.03, "learning_rate": 0.0018173679498657118, "loss": 3.1048, "step": 1015 }, { "epoch": 0.03, "learning_rate": 0.001819158460161146, "loss": 2.873, "step": 1016 }, { "epoch": 0.03, "learning_rate": 0.0018209489704565803, "loss": 2.7493, "step": 1017 }, { "epoch": 0.03, "learning_rate": 0.0018227394807520142, "loss": 2.7305, "step": 1018 }, { "epoch": 0.03, "learning_rate": 0.0018245299910474486, "loss": 2.9095, "step": 1019 }, { "epoch": 0.03, "learning_rate": 0.0018263205013428828, "loss": 2.4336, "step": 1020 }, { "epoch": 0.03, "learning_rate": 0.0018281110116383171, "loss": 2.8584, "step": 1021 }, { "epoch": 0.03, "learning_rate": 0.001829901521933751, "loss": 2.8959, "step": 1022 }, { "epoch": 0.03, "learning_rate": 0.0018316920322291855, "loss": 2.5541, "step": 1023 }, { "epoch": 0.03, "learning_rate": 0.0018334825425246196, "loss": 2.7394, "step": 1024 }, { "epoch": 0.03, "learning_rate": 0.0018352730528200538, "loss": 2.9615, "step": 1025 }, { "epoch": 0.03, "learning_rate": 0.001837063563115488, "loss": 3.0935, "step": 1026 }, { "epoch": 0.03, "learning_rate": 0.0018388540734109223, "loss": 2.9139, "step": 1027 }, { "epoch": 0.03, "learning_rate": 0.0018406445837063563, "loss": 2.8732, "step": 1028 }, { "epoch": 0.03, "learning_rate": 0.0018424350940017906, "loss": 3.1139, "step": 1029 }, { "epoch": 0.03, "learning_rate": 0.0018442256042972248, "loss": 3.1814, "step": 1030 }, { "epoch": 0.03, "learning_rate": 0.001846016114592659, "loss": 2.9363, "step": 1031 }, { "epoch": 0.03, "learning_rate": 0.001847806624888093, "loss": 2.9217, "step": 1032 }, { "epoch": 0.03, "learning_rate": 0.0018495971351835273, "loss": 2.826, "step": 1033 }, { "epoch": 0.03, "learning_rate": 0.0018513876454789616, "loss": 3.1802, "step": 1034 }, { "epoch": 0.03, "learning_rate": 0.0018531781557743956, "loss": 3.0625, "step": 1035 }, { "epoch": 0.03, "learning_rate": 0.00185496866606983, "loss": 3.0424, "step": 1036 }, { "epoch": 0.03, "learning_rate": 0.0018567591763652641, "loss": 2.9527, "step": 1037 }, { "epoch": 0.03, "learning_rate": 0.0018585496866606983, "loss": 2.6786, "step": 1038 }, { "epoch": 0.03, "learning_rate": 0.0018603401969561324, "loss": 3.1444, "step": 1039 }, { "epoch": 0.03, "learning_rate": 0.0018621307072515668, "loss": 3.0752, "step": 1040 }, { "epoch": 0.03, "learning_rate": 0.0018639212175470008, "loss": 2.6378, "step": 1041 }, { "epoch": 0.03, "learning_rate": 0.0018657117278424351, "loss": 2.7321, "step": 1042 }, { "epoch": 0.03, "learning_rate": 0.0018675022381378693, "loss": 2.6516, "step": 1043 }, { "epoch": 0.03, "learning_rate": 0.0018692927484333034, "loss": 2.7673, "step": 1044 }, { "epoch": 0.03, "learning_rate": 0.0018710832587287376, "loss": 2.9705, "step": 1045 }, { "epoch": 0.03, "learning_rate": 0.001872873769024172, "loss": 3.1063, "step": 1046 }, { "epoch": 0.03, "learning_rate": 0.0018746642793196061, "loss": 2.8569, "step": 1047 }, { "epoch": 0.03, "learning_rate": 0.0018764547896150403, "loss": 2.8661, "step": 1048 }, { "epoch": 0.03, "learning_rate": 0.0018782452999104745, "loss": 2.9516, "step": 1049 }, { "epoch": 0.03, "learning_rate": 0.0018800358102059088, "loss": 2.9906, "step": 1050 }, { "epoch": 0.03, "learning_rate": 0.0018818263205013428, "loss": 3.1855, "step": 1051 }, { "epoch": 0.03, "learning_rate": 0.0018836168307967771, "loss": 2.7303, "step": 1052 }, { "epoch": 0.03, "learning_rate": 0.0018854073410922113, "loss": 2.846, "step": 1053 }, { "epoch": 0.03, "learning_rate": 0.0018871978513876455, "loss": 2.7051, "step": 1054 }, { "epoch": 0.03, "learning_rate": 0.0018889883616830796, "loss": 3.4048, "step": 1055 }, { "epoch": 0.03, "learning_rate": 0.001890778871978514, "loss": 2.7893, "step": 1056 }, { "epoch": 0.03, "learning_rate": 0.001892569382273948, "loss": 2.9735, "step": 1057 }, { "epoch": 0.03, "learning_rate": 0.0018943598925693823, "loss": 3.1908, "step": 1058 }, { "epoch": 0.03, "learning_rate": 0.0018961504028648165, "loss": 3.1034, "step": 1059 }, { "epoch": 0.03, "learning_rate": 0.0018979409131602508, "loss": 2.8321, "step": 1060 }, { "epoch": 0.03, "learning_rate": 0.0018997314234556848, "loss": 3.3513, "step": 1061 }, { "epoch": 0.03, "learning_rate": 0.0019015219337511192, "loss": 3.0396, "step": 1062 }, { "epoch": 0.03, "learning_rate": 0.0019033124440465533, "loss": 2.84, "step": 1063 }, { "epoch": 0.03, "learning_rate": 0.0019051029543419875, "loss": 3.1624, "step": 1064 }, { "epoch": 0.03, "learning_rate": 0.0019068934646374216, "loss": 3.2421, "step": 1065 }, { "epoch": 0.03, "learning_rate": 0.001908683974932856, "loss": 3.0279, "step": 1066 }, { "epoch": 0.03, "learning_rate": 0.00191047448522829, "loss": 2.9036, "step": 1067 }, { "epoch": 0.03, "learning_rate": 0.0019122649955237243, "loss": 2.9999, "step": 1068 }, { "epoch": 0.03, "learning_rate": 0.0019140555058191585, "loss": 2.931, "step": 1069 }, { "epoch": 0.03, "learning_rate": 0.0019158460161145926, "loss": 3.4281, "step": 1070 }, { "epoch": 0.03, "learning_rate": 0.0019176365264100268, "loss": 3.1558, "step": 1071 }, { "epoch": 0.03, "learning_rate": 0.0019194270367054612, "loss": 3.1037, "step": 1072 }, { "epoch": 0.03, "learning_rate": 0.0019212175470008953, "loss": 2.5736, "step": 1073 }, { "epoch": 0.03, "learning_rate": 0.0019230080572963295, "loss": 3.1556, "step": 1074 }, { "epoch": 0.03, "learning_rate": 0.0019247985675917637, "loss": 2.7147, "step": 1075 }, { "epoch": 0.03, "learning_rate": 0.001926589077887198, "loss": 3.4753, "step": 1076 }, { "epoch": 0.03, "learning_rate": 0.001928379588182632, "loss": 3.0288, "step": 1077 }, { "epoch": 0.03, "learning_rate": 0.0019301700984780663, "loss": 3.2478, "step": 1078 }, { "epoch": 0.03, "learning_rate": 0.0019319606087735005, "loss": 2.8523, "step": 1079 }, { "epoch": 0.03, "learning_rate": 0.0019337511190689347, "loss": 2.9557, "step": 1080 }, { "epoch": 0.03, "learning_rate": 0.0019355416293643688, "loss": 2.9065, "step": 1081 }, { "epoch": 0.03, "learning_rate": 0.0019373321396598032, "loss": 2.9133, "step": 1082 }, { "epoch": 0.03, "learning_rate": 0.0019391226499552371, "loss": 2.7349, "step": 1083 }, { "epoch": 0.03, "learning_rate": 0.0019409131602506715, "loss": 3.676, "step": 1084 }, { "epoch": 0.03, "learning_rate": 0.0019427036705461057, "loss": 2.8303, "step": 1085 }, { "epoch": 0.03, "learning_rate": 0.00194449418084154, "loss": 3.2221, "step": 1086 }, { "epoch": 0.03, "learning_rate": 0.001946284691136974, "loss": 2.9128, "step": 1087 }, { "epoch": 0.03, "learning_rate": 0.0019480752014324084, "loss": 3.1028, "step": 1088 }, { "epoch": 0.03, "learning_rate": 0.0019498657117278425, "loss": 2.6885, "step": 1089 }, { "epoch": 0.03, "learning_rate": 0.0019516562220232767, "loss": 2.8723, "step": 1090 }, { "epoch": 0.03, "learning_rate": 0.001953446732318711, "loss": 3.303, "step": 1091 }, { "epoch": 0.03, "learning_rate": 0.001955237242614145, "loss": 3.0332, "step": 1092 }, { "epoch": 0.03, "learning_rate": 0.0019570277529095794, "loss": 2.9445, "step": 1093 }, { "epoch": 0.03, "learning_rate": 0.0019588182632050135, "loss": 2.816, "step": 1094 }, { "epoch": 0.03, "learning_rate": 0.0019606087735004477, "loss": 2.8821, "step": 1095 }, { "epoch": 0.03, "learning_rate": 0.001962399283795882, "loss": 2.9007, "step": 1096 }, { "epoch": 0.03, "learning_rate": 0.001964189794091316, "loss": 2.7443, "step": 1097 }, { "epoch": 0.03, "learning_rate": 0.00196598030438675, "loss": 2.935, "step": 1098 }, { "epoch": 0.03, "learning_rate": 0.0019677708146821843, "loss": 2.8406, "step": 1099 }, { "epoch": 0.03, "learning_rate": 0.001969561324977619, "loss": 3.154, "step": 1100 }, { "epoch": 0.03, "learning_rate": 0.0019713518352730526, "loss": 2.9782, "step": 1101 }, { "epoch": 0.03, "learning_rate": 0.0019731423455684872, "loss": 2.9354, "step": 1102 }, { "epoch": 0.03, "learning_rate": 0.0019749328558639214, "loss": 3.036, "step": 1103 }, { "epoch": 0.03, "learning_rate": 0.0019767233661593555, "loss": 3.1913, "step": 1104 }, { "epoch": 0.03, "learning_rate": 0.0019785138764547897, "loss": 2.7505, "step": 1105 }, { "epoch": 0.03, "learning_rate": 0.001980304386750224, "loss": 3.0737, "step": 1106 }, { "epoch": 0.03, "learning_rate": 0.001982094897045658, "loss": 2.7583, "step": 1107 }, { "epoch": 0.03, "learning_rate": 0.001983885407341092, "loss": 2.8684, "step": 1108 }, { "epoch": 0.03, "learning_rate": 0.0019856759176365263, "loss": 2.8521, "step": 1109 }, { "epoch": 0.03, "learning_rate": 0.001987466427931961, "loss": 2.8479, "step": 1110 }, { "epoch": 0.03, "learning_rate": 0.0019892569382273947, "loss": 2.6558, "step": 1111 }, { "epoch": 0.03, "learning_rate": 0.0019910474485228292, "loss": 2.7396, "step": 1112 }, { "epoch": 0.03, "learning_rate": 0.0019928379588182634, "loss": 3.167, "step": 1113 }, { "epoch": 0.03, "learning_rate": 0.0019946284691136976, "loss": 2.8742, "step": 1114 }, { "epoch": 0.03, "learning_rate": 0.0019964189794091317, "loss": 2.63, "step": 1115 }, { "epoch": 0.03, "learning_rate": 0.001998209489704566, "loss": 2.8977, "step": 1116 }, { "epoch": 0.03, "learning_rate": 0.002, "loss": 2.9749, "step": 1117 }, { "epoch": 0.03, "learning_rate": 0.0019999999962120895, "loss": 3.1425, "step": 1118 }, { "epoch": 0.03, "learning_rate": 0.0019999999848483575, "loss": 2.9183, "step": 1119 }, { "epoch": 0.03, "learning_rate": 0.001999999965908805, "loss": 2.7834, "step": 1120 }, { "epoch": 0.03, "learning_rate": 0.001999999939393431, "loss": 2.7896, "step": 1121 }, { "epoch": 0.03, "learning_rate": 0.001999999905302236, "loss": 2.7019, "step": 1122 }, { "epoch": 0.03, "learning_rate": 0.001999999863635221, "loss": 3.119, "step": 1123 }, { "epoch": 0.03, "learning_rate": 0.0019999998143923857, "loss": 2.9899, "step": 1124 }, { "epoch": 0.03, "learning_rate": 0.001999999757573731, "loss": 2.9555, "step": 1125 }, { "epoch": 0.03, "learning_rate": 0.0019999996931792563, "loss": 3.2034, "step": 1126 }, { "epoch": 0.03, "learning_rate": 0.001999999621208963, "loss": 3.196, "step": 1127 }, { "epoch": 0.03, "learning_rate": 0.001999999541662851, "loss": 2.9032, "step": 1128 }, { "epoch": 0.03, "learning_rate": 0.0019999994545409215, "loss": 2.8983, "step": 1129 }, { "epoch": 0.03, "learning_rate": 0.0019999993598431754, "loss": 2.9489, "step": 1130 }, { "epoch": 0.03, "learning_rate": 0.001999999257569612, "loss": 3.0402, "step": 1131 }, { "epoch": 0.03, "learning_rate": 0.0019999991477202337, "loss": 2.7653, "step": 1132 }, { "epoch": 0.03, "learning_rate": 0.0019999990302950405, "loss": 3.5214, "step": 1133 }, { "epoch": 0.03, "learning_rate": 0.001999998905294033, "loss": 3.2578, "step": 1134 }, { "epoch": 0.03, "learning_rate": 0.001999998772717213, "loss": 2.9056, "step": 1135 }, { "epoch": 0.03, "learning_rate": 0.0019999986325645812, "loss": 2.6984, "step": 1136 }, { "epoch": 0.03, "learning_rate": 0.0019999984848361385, "loss": 3.0774, "step": 1137 }, { "epoch": 0.03, "learning_rate": 0.001999998329531886, "loss": 3.1433, "step": 1138 }, { "epoch": 0.03, "learning_rate": 0.0019999981666518245, "loss": 3.1302, "step": 1139 }, { "epoch": 0.03, "learning_rate": 0.001999997996195956, "loss": 2.9447, "step": 1140 }, { "epoch": 0.03, "learning_rate": 0.001999997818164282, "loss": 2.8205, "step": 1141 }, { "epoch": 0.03, "learning_rate": 0.0019999976325568024, "loss": 3.0849, "step": 1142 }, { "epoch": 0.03, "learning_rate": 0.0019999974393735197, "loss": 2.986, "step": 1143 }, { "epoch": 0.03, "learning_rate": 0.001999997238614436, "loss": 3.6629, "step": 1144 }, { "epoch": 0.03, "learning_rate": 0.001999997030279551, "loss": 2.9448, "step": 1145 }, { "epoch": 0.03, "learning_rate": 0.001999996814368868, "loss": 3.2355, "step": 1146 }, { "epoch": 0.03, "learning_rate": 0.0019999965908823873, "loss": 3.0837, "step": 1147 }, { "epoch": 0.03, "learning_rate": 0.0019999963598201116, "loss": 2.714, "step": 1148 }, { "epoch": 0.03, "learning_rate": 0.0019999961211820422, "loss": 3.1243, "step": 1149 }, { "epoch": 0.03, "learning_rate": 0.001999995874968181, "loss": 2.8107, "step": 1150 }, { "epoch": 0.03, "learning_rate": 0.0019999956211785297, "loss": 3.0145, "step": 1151 }, { "epoch": 0.03, "learning_rate": 0.0019999953598130904, "loss": 2.8913, "step": 1152 }, { "epoch": 0.03, "learning_rate": 0.001999995090871865, "loss": 2.7985, "step": 1153 }, { "epoch": 0.03, "learning_rate": 0.001999994814354856, "loss": 2.9086, "step": 1154 }, { "epoch": 0.03, "learning_rate": 0.0019999945302620645, "loss": 2.6658, "step": 1155 }, { "epoch": 0.03, "learning_rate": 0.0019999942385934937, "loss": 2.8247, "step": 1156 }, { "epoch": 0.03, "learning_rate": 0.0019999939393491447, "loss": 3.1665, "step": 1157 }, { "epoch": 0.03, "learning_rate": 0.0019999936325290207, "loss": 2.6768, "step": 1158 }, { "epoch": 0.03, "learning_rate": 0.001999993318133124, "loss": 3.1797, "step": 1159 }, { "epoch": 0.03, "learning_rate": 0.001999992996161456, "loss": 2.9376, "step": 1160 }, { "epoch": 0.03, "learning_rate": 0.001999992666614021, "loss": 3.1965, "step": 1161 }, { "epoch": 0.03, "learning_rate": 0.0019999923294908195, "loss": 2.4783, "step": 1162 }, { "epoch": 0.03, "learning_rate": 0.001999991984791855, "loss": 3.0512, "step": 1163 }, { "epoch": 0.03, "learning_rate": 0.00199999163251713, "loss": 2.5984, "step": 1164 }, { "epoch": 0.03, "learning_rate": 0.001999991272666647, "loss": 2.8677, "step": 1165 }, { "epoch": 0.03, "learning_rate": 0.001999990905240409, "loss": 2.7969, "step": 1166 }, { "epoch": 0.03, "learning_rate": 0.0019999905302384192, "loss": 2.9139, "step": 1167 }, { "epoch": 0.03, "learning_rate": 0.00199999014766068, "loss": 3.1149, "step": 1168 }, { "epoch": 0.03, "learning_rate": 0.0019999897575071935, "loss": 3.0267, "step": 1169 }, { "epoch": 0.03, "learning_rate": 0.0019999893597779637, "loss": 2.8127, "step": 1170 }, { "epoch": 0.03, "learning_rate": 0.001999988954472993, "loss": 3.3703, "step": 1171 }, { "epoch": 0.03, "learning_rate": 0.0019999885415922848, "loss": 2.8182, "step": 1172 }, { "epoch": 0.03, "learning_rate": 0.0019999881211358425, "loss": 3.0832, "step": 1173 }, { "epoch": 0.03, "learning_rate": 0.001999987693103669, "loss": 2.8551, "step": 1174 }, { "epoch": 0.03, "learning_rate": 0.0019999872574957673, "loss": 2.8678, "step": 1175 }, { "epoch": 0.03, "learning_rate": 0.001999986814312141, "loss": 2.7804, "step": 1176 }, { "epoch": 0.03, "learning_rate": 0.0019999863635527934, "loss": 2.9687, "step": 1177 }, { "epoch": 0.03, "learning_rate": 0.001999985905217728, "loss": 2.9743, "step": 1178 }, { "epoch": 0.03, "learning_rate": 0.0019999854393069477, "loss": 2.9505, "step": 1179 }, { "epoch": 0.03, "learning_rate": 0.0019999849658204573, "loss": 2.9125, "step": 1180 }, { "epoch": 0.03, "learning_rate": 0.001999984484758259, "loss": 2.9425, "step": 1181 }, { "epoch": 0.03, "learning_rate": 0.001999983996120357, "loss": 3.2007, "step": 1182 }, { "epoch": 0.03, "learning_rate": 0.001999983499906755, "loss": 3.0231, "step": 1183 }, { "epoch": 0.03, "learning_rate": 0.001999982996117457, "loss": 2.7997, "step": 1184 }, { "epoch": 0.03, "learning_rate": 0.001999982484752467, "loss": 2.8039, "step": 1185 }, { "epoch": 0.03, "learning_rate": 0.001999981965811788, "loss": 3.0816, "step": 1186 }, { "epoch": 0.03, "learning_rate": 0.001999981439295424, "loss": 2.9029, "step": 1187 }, { "epoch": 0.03, "learning_rate": 0.0019999809052033803, "loss": 2.8787, "step": 1188 }, { "epoch": 0.03, "learning_rate": 0.001999980363535659, "loss": 3.0539, "step": 1189 }, { "epoch": 0.03, "learning_rate": 0.0019999798142922662, "loss": 2.9659, "step": 1190 }, { "epoch": 0.03, "learning_rate": 0.001999979257473205, "loss": 2.9266, "step": 1191 }, { "epoch": 0.03, "learning_rate": 0.001999978693078479, "loss": 2.87, "step": 1192 }, { "epoch": 0.03, "learning_rate": 0.001999978121108094, "loss": 3.0472, "step": 1193 }, { "epoch": 0.03, "learning_rate": 0.001999977541562053, "loss": 2.7997, "step": 1194 }, { "epoch": 0.03, "learning_rate": 0.001999976954440361, "loss": 2.6606, "step": 1195 }, { "epoch": 0.03, "learning_rate": 0.0019999763597430224, "loss": 2.8011, "step": 1196 }, { "epoch": 0.03, "learning_rate": 0.0019999757574700417, "loss": 2.9374, "step": 1197 }, { "epoch": 0.03, "learning_rate": 0.0019999751476214235, "loss": 2.5555, "step": 1198 }, { "epoch": 0.03, "learning_rate": 0.0019999745301971725, "loss": 3.1096, "step": 1199 }, { "epoch": 0.03, "learning_rate": 0.001999973905197293, "loss": 3.0763, "step": 1200 }, { "epoch": 0.03, "learning_rate": 0.00199997327262179, "loss": 2.6316, "step": 1201 }, { "epoch": 0.03, "learning_rate": 0.0019999726324706683, "loss": 2.7488, "step": 1202 }, { "epoch": 0.03, "learning_rate": 0.0019999719847439332, "loss": 2.8125, "step": 1203 }, { "epoch": 0.03, "learning_rate": 0.0019999713294415883, "loss": 2.6011, "step": 1204 }, { "epoch": 0.03, "learning_rate": 0.0019999706665636396, "loss": 2.6733, "step": 1205 }, { "epoch": 0.03, "learning_rate": 0.0019999699961100923, "loss": 2.6388, "step": 1206 }, { "epoch": 0.03, "learning_rate": 0.0019999693180809508, "loss": 2.8553, "step": 1207 }, { "epoch": 0.03, "learning_rate": 0.0019999686324762207, "loss": 2.9952, "step": 1208 }, { "epoch": 0.03, "learning_rate": 0.0019999679392959067, "loss": 2.8009, "step": 1209 }, { "epoch": 0.03, "learning_rate": 0.0019999672385400146, "loss": 2.8607, "step": 1210 }, { "epoch": 0.03, "learning_rate": 0.0019999665302085495, "loss": 2.7209, "step": 1211 }, { "epoch": 0.03, "learning_rate": 0.0019999658143015167, "loss": 2.698, "step": 1212 }, { "epoch": 0.03, "learning_rate": 0.0019999650908189216, "loss": 2.9869, "step": 1213 }, { "epoch": 0.03, "learning_rate": 0.00199996435976077, "loss": 2.8562, "step": 1214 }, { "epoch": 0.03, "learning_rate": 0.001999963621127067, "loss": 3.2848, "step": 1215 }, { "epoch": 0.03, "learning_rate": 0.0019999628749178184, "loss": 3.2375, "step": 1216 }, { "epoch": 0.03, "learning_rate": 0.0019999621211330295, "loss": 2.4662, "step": 1217 }, { "epoch": 0.03, "learning_rate": 0.0019999613597727066, "loss": 2.8367, "step": 1218 }, { "epoch": 0.03, "learning_rate": 0.0019999605908368554, "loss": 2.8597, "step": 1219 }, { "epoch": 0.03, "learning_rate": 0.0019999598143254816, "loss": 2.5766, "step": 1220 }, { "epoch": 0.03, "learning_rate": 0.0019999590302385906, "loss": 3.0469, "step": 1221 }, { "epoch": 0.03, "learning_rate": 0.001999958238576189, "loss": 2.6589, "step": 1222 }, { "epoch": 0.03, "learning_rate": 0.0019999574393382825, "loss": 2.8247, "step": 1223 }, { "epoch": 0.03, "learning_rate": 0.0019999566325248773, "loss": 3.0435, "step": 1224 }, { "epoch": 0.03, "learning_rate": 0.0019999558181359794, "loss": 2.628, "step": 1225 }, { "epoch": 0.03, "learning_rate": 0.001999954996171595, "loss": 2.5943, "step": 1226 }, { "epoch": 0.03, "learning_rate": 0.0019999541666317305, "loss": 3.0959, "step": 1227 }, { "epoch": 0.03, "learning_rate": 0.0019999533295163917, "loss": 3.0264, "step": 1228 }, { "epoch": 0.03, "learning_rate": 0.0019999524848255856, "loss": 2.9397, "step": 1229 }, { "epoch": 0.03, "learning_rate": 0.0019999516325593177, "loss": 3.0662, "step": 1230 }, { "epoch": 0.03, "learning_rate": 0.0019999507727175955, "loss": 2.3912, "step": 1231 }, { "epoch": 0.03, "learning_rate": 0.001999949905300425, "loss": 2.4548, "step": 1232 }, { "epoch": 0.03, "learning_rate": 0.0019999490303078122, "loss": 3.1918, "step": 1233 }, { "epoch": 0.03, "learning_rate": 0.001999948147739765, "loss": 2.65, "step": 1234 }, { "epoch": 0.03, "learning_rate": 0.001999947257596289, "loss": 2.7047, "step": 1235 }, { "epoch": 0.03, "learning_rate": 0.0019999463598773916, "loss": 3.2376, "step": 1236 }, { "epoch": 0.03, "learning_rate": 0.0019999454545830794, "loss": 2.9711, "step": 1237 }, { "epoch": 0.03, "learning_rate": 0.0019999445417133587, "loss": 2.9668, "step": 1238 }, { "epoch": 0.03, "learning_rate": 0.0019999436212682375, "loss": 2.8738, "step": 1239 }, { "epoch": 0.03, "learning_rate": 0.0019999426932477225, "loss": 2.9608, "step": 1240 }, { "epoch": 0.03, "learning_rate": 0.0019999417576518196, "loss": 3.0064, "step": 1241 }, { "epoch": 0.03, "learning_rate": 0.001999940814480537, "loss": 2.827, "step": 1242 }, { "epoch": 0.03, "learning_rate": 0.001999939863733882, "loss": 3.0879, "step": 1243 }, { "epoch": 0.03, "learning_rate": 0.0019999389054118607, "loss": 3.152, "step": 1244 }, { "epoch": 0.03, "learning_rate": 0.001999937939514481, "loss": 2.6625, "step": 1245 }, { "epoch": 0.03, "learning_rate": 0.0019999369660417504, "loss": 2.8919, "step": 1246 }, { "epoch": 0.03, "learning_rate": 0.001999935984993677, "loss": 2.6727, "step": 1247 }, { "epoch": 0.03, "learning_rate": 0.0019999349963702663, "loss": 2.8761, "step": 1248 }, { "epoch": 0.03, "learning_rate": 0.001999934000171527, "loss": 2.8317, "step": 1249 }, { "epoch": 0.03, "learning_rate": 0.0019999329963974665, "loss": 2.9054, "step": 1250 }, { "epoch": 0.03, "learning_rate": 0.0019999319850480925, "loss": 2.546, "step": 1251 }, { "epoch": 0.03, "learning_rate": 0.001999930966123413, "loss": 2.7971, "step": 1252 }, { "epoch": 0.03, "learning_rate": 0.0019999299396234343, "loss": 2.9784, "step": 1253 }, { "epoch": 0.03, "learning_rate": 0.001999928905548166, "loss": 2.7557, "step": 1254 }, { "epoch": 0.03, "learning_rate": 0.0019999278638976148, "loss": 2.8206, "step": 1255 }, { "epoch": 0.03, "learning_rate": 0.001999926814671789, "loss": 2.9786, "step": 1256 }, { "epoch": 0.03, "learning_rate": 0.0019999257578706964, "loss": 2.8422, "step": 1257 }, { "epoch": 0.03, "learning_rate": 0.0019999246934943446, "loss": 3.1958, "step": 1258 }, { "epoch": 0.03, "learning_rate": 0.0019999236215427424, "loss": 3.1506, "step": 1259 }, { "epoch": 0.03, "learning_rate": 0.0019999225420158978, "loss": 2.4664, "step": 1260 }, { "epoch": 0.03, "learning_rate": 0.0019999214549138184, "loss": 2.5269, "step": 1261 }, { "epoch": 0.03, "learning_rate": 0.001999920360236513, "loss": 2.7856, "step": 1262 }, { "epoch": 0.03, "learning_rate": 0.00199991925798399, "loss": 2.8098, "step": 1263 }, { "epoch": 0.03, "learning_rate": 0.001999918148156257, "loss": 3.2093, "step": 1264 }, { "epoch": 0.03, "learning_rate": 0.001999917030753323, "loss": 2.5819, "step": 1265 }, { "epoch": 0.03, "learning_rate": 0.0019999159057751967, "loss": 2.7041, "step": 1266 }, { "epoch": 0.03, "learning_rate": 0.001999914773221886, "loss": 2.7555, "step": 1267 }, { "epoch": 0.03, "learning_rate": 0.0019999136330933996, "loss": 3.1786, "step": 1268 }, { "epoch": 0.03, "learning_rate": 0.0019999124853897466, "loss": 2.7484, "step": 1269 }, { "epoch": 0.03, "learning_rate": 0.001999911330110935, "loss": 2.7464, "step": 1270 }, { "epoch": 0.03, "learning_rate": 0.0019999101672569745, "loss": 2.9189, "step": 1271 }, { "epoch": 0.03, "learning_rate": 0.0019999089968278727, "loss": 2.9194, "step": 1272 }, { "epoch": 0.03, "learning_rate": 0.0019999078188236395, "loss": 2.8013, "step": 1273 }, { "epoch": 0.03, "learning_rate": 0.001999906633244283, "loss": 3.0153, "step": 1274 }, { "epoch": 0.03, "learning_rate": 0.0019999054400898133, "loss": 3.3401, "step": 1275 }, { "epoch": 0.03, "learning_rate": 0.001999904239360238, "loss": 2.9717, "step": 1276 }, { "epoch": 0.03, "learning_rate": 0.0019999030310555678, "loss": 3.1726, "step": 1277 }, { "epoch": 0.03, "learning_rate": 0.00199990181517581, "loss": 2.7197, "step": 1278 }, { "epoch": 0.03, "learning_rate": 0.001999900591720976, "loss": 3.2331, "step": 1279 }, { "epoch": 0.03, "learning_rate": 0.0019998993606910732, "loss": 2.9033, "step": 1280 }, { "epoch": 0.03, "learning_rate": 0.0019998981220861116, "loss": 2.6118, "step": 1281 }, { "epoch": 0.03, "learning_rate": 0.0019998968759061004, "loss": 3.1069, "step": 1282 }, { "epoch": 0.03, "learning_rate": 0.0019998956221510497, "loss": 3.0714, "step": 1283 }, { "epoch": 0.03, "learning_rate": 0.001999894360820968, "loss": 3.0514, "step": 1284 }, { "epoch": 0.03, "learning_rate": 0.001999893091915866, "loss": 2.8793, "step": 1285 }, { "epoch": 0.03, "learning_rate": 0.001999891815435752, "loss": 3.3485, "step": 1286 }, { "epoch": 0.03, "learning_rate": 0.0019998905313806372, "loss": 3.1146, "step": 1287 }, { "epoch": 0.03, "learning_rate": 0.0019998892397505297, "loss": 3.3144, "step": 1288 }, { "epoch": 0.03, "learning_rate": 0.0019998879405454402, "loss": 3.1459, "step": 1289 }, { "epoch": 0.03, "learning_rate": 0.001999886633765379, "loss": 2.4777, "step": 1290 }, { "epoch": 0.03, "learning_rate": 0.001999885319410355, "loss": 3.0799, "step": 1291 }, { "epoch": 0.03, "learning_rate": 0.0019998839974803787, "loss": 2.8337, "step": 1292 }, { "epoch": 0.03, "learning_rate": 0.0019998826679754602, "loss": 2.969, "step": 1293 }, { "epoch": 0.03, "learning_rate": 0.001999881330895609, "loss": 3.0193, "step": 1294 }, { "epoch": 0.03, "learning_rate": 0.0019998799862408355, "loss": 3.0109, "step": 1295 }, { "epoch": 0.03, "learning_rate": 0.0019998786340111505, "loss": 2.77, "step": 1296 }, { "epoch": 0.03, "learning_rate": 0.0019998772742065634, "loss": 3.4924, "step": 1297 }, { "epoch": 0.03, "learning_rate": 0.0019998759068270847, "loss": 2.668, "step": 1298 }, { "epoch": 0.03, "learning_rate": 0.001999874531872725, "loss": 2.7906, "step": 1299 }, { "epoch": 0.03, "learning_rate": 0.001999873149343495, "loss": 3.2527, "step": 1300 }, { "epoch": 0.03, "learning_rate": 0.0019998717592394043, "loss": 2.8467, "step": 1301 }, { "epoch": 0.03, "learning_rate": 0.0019998703615604642, "loss": 2.6914, "step": 1302 }, { "epoch": 0.04, "learning_rate": 0.001999868956306685, "loss": 2.9083, "step": 1303 }, { "epoch": 0.04, "learning_rate": 0.0019998675434780774, "loss": 2.5864, "step": 1304 }, { "epoch": 0.04, "learning_rate": 0.001999866123074652, "loss": 2.7229, "step": 1305 }, { "epoch": 0.04, "learning_rate": 0.0019998646950964193, "loss": 2.784, "step": 1306 }, { "epoch": 0.04, "learning_rate": 0.0019998632595433904, "loss": 2.5536, "step": 1307 }, { "epoch": 0.04, "learning_rate": 0.0019998618164155765, "loss": 3.3115, "step": 1308 }, { "epoch": 0.04, "learning_rate": 0.001999860365712988, "loss": 2.5575, "step": 1309 }, { "epoch": 0.04, "learning_rate": 0.0019998589074356364, "loss": 2.6609, "step": 1310 }, { "epoch": 0.04, "learning_rate": 0.0019998574415835326, "loss": 3.0747, "step": 1311 }, { "epoch": 0.04, "learning_rate": 0.0019998559681566872, "loss": 2.8851, "step": 1312 }, { "epoch": 0.04, "learning_rate": 0.001999854487155112, "loss": 3.0783, "step": 1313 }, { "epoch": 0.04, "learning_rate": 0.0019998529985788176, "loss": 2.6849, "step": 1314 }, { "epoch": 0.04, "learning_rate": 0.001999851502427816, "loss": 2.6236, "step": 1315 }, { "epoch": 0.04, "learning_rate": 0.001999849998702118, "loss": 2.5926, "step": 1316 }, { "epoch": 0.04, "learning_rate": 0.001999848487401735, "loss": 2.5699, "step": 1317 }, { "epoch": 0.04, "learning_rate": 0.001999846968526679, "loss": 2.9969, "step": 1318 }, { "epoch": 0.04, "learning_rate": 0.001999845442076961, "loss": 2.7043, "step": 1319 }, { "epoch": 0.04, "learning_rate": 0.0019998439080525926, "loss": 2.7663, "step": 1320 }, { "epoch": 0.04, "learning_rate": 0.0019998423664535857, "loss": 3.2165, "step": 1321 }, { "epoch": 0.04, "learning_rate": 0.0019998408172799517, "loss": 2.8078, "step": 1322 }, { "epoch": 0.04, "learning_rate": 0.0019998392605317023, "loss": 2.9601, "step": 1323 }, { "epoch": 0.04, "learning_rate": 0.0019998376962088497, "loss": 3.1027, "step": 1324 }, { "epoch": 0.04, "learning_rate": 0.001999836124311405, "loss": 3.0329, "step": 1325 }, { "epoch": 0.04, "learning_rate": 0.001999834544839381, "loss": 2.6057, "step": 1326 }, { "epoch": 0.04, "learning_rate": 0.001999832957792789, "loss": 2.7164, "step": 1327 }, { "epoch": 0.04, "learning_rate": 0.0019998313631716413, "loss": 2.6172, "step": 1328 }, { "epoch": 0.04, "learning_rate": 0.00199982976097595, "loss": 2.8235, "step": 1329 }, { "epoch": 0.04, "learning_rate": 0.001999828151205727, "loss": 2.937, "step": 1330 }, { "epoch": 0.04, "learning_rate": 0.001999826533860985, "loss": 2.7739, "step": 1331 }, { "epoch": 0.04, "learning_rate": 0.0019998249089417356, "loss": 2.3878, "step": 1332 }, { "epoch": 0.04, "learning_rate": 0.0019998232764479916, "loss": 2.8733, "step": 1333 }, { "epoch": 0.04, "learning_rate": 0.0019998216363797654, "loss": 2.5033, "step": 1334 }, { "epoch": 0.04, "learning_rate": 0.001999819988737069, "loss": 2.8802, "step": 1335 }, { "epoch": 0.04, "learning_rate": 0.0019998183335199152, "loss": 2.9811, "step": 1336 }, { "epoch": 0.04, "learning_rate": 0.0019998166707283164, "loss": 2.6408, "step": 1337 }, { "epoch": 0.04, "learning_rate": 0.001999815000362285, "loss": 3.0855, "step": 1338 }, { "epoch": 0.04, "learning_rate": 0.0019998133224218345, "loss": 2.8536, "step": 1339 }, { "epoch": 0.04, "learning_rate": 0.0019998116369069766, "loss": 2.8703, "step": 1340 }, { "epoch": 0.04, "learning_rate": 0.001999809943817725, "loss": 2.9552, "step": 1341 }, { "epoch": 0.04, "learning_rate": 0.0019998082431540915, "loss": 2.6681, "step": 1342 }, { "epoch": 0.04, "learning_rate": 0.0019998065349160895, "loss": 2.8055, "step": 1343 }, { "epoch": 0.04, "learning_rate": 0.0019998048191037323, "loss": 2.9019, "step": 1344 }, { "epoch": 0.04, "learning_rate": 0.001999803095717032, "loss": 2.9657, "step": 1345 }, { "epoch": 0.04, "learning_rate": 0.0019998013647560026, "loss": 3.0961, "step": 1346 }, { "epoch": 0.04, "learning_rate": 0.0019997996262206565, "loss": 3.0134, "step": 1347 }, { "epoch": 0.04, "learning_rate": 0.0019997978801110073, "loss": 3.0921, "step": 1348 }, { "epoch": 0.04, "learning_rate": 0.0019997961264270683, "loss": 2.5515, "step": 1349 }, { "epoch": 0.04, "learning_rate": 0.0019997943651688527, "loss": 2.9707, "step": 1350 }, { "epoch": 0.04, "learning_rate": 0.0019997925963363733, "loss": 2.6662, "step": 1351 }, { "epoch": 0.04, "learning_rate": 0.001999790819929644, "loss": 2.6812, "step": 1352 }, { "epoch": 0.04, "learning_rate": 0.0019997890359486786, "loss": 2.8992, "step": 1353 }, { "epoch": 0.04, "learning_rate": 0.00199978724439349, "loss": 2.8392, "step": 1354 }, { "epoch": 0.04, "learning_rate": 0.001999785445264092, "loss": 2.7888, "step": 1355 }, { "epoch": 0.04, "learning_rate": 0.001999783638560498, "loss": 3.0361, "step": 1356 }, { "epoch": 0.04, "learning_rate": 0.0019997818242827223, "loss": 2.6704, "step": 1357 }, { "epoch": 0.04, "learning_rate": 0.001999780002430778, "loss": 2.7503, "step": 1358 }, { "epoch": 0.04, "learning_rate": 0.001999778173004679, "loss": 3.3698, "step": 1359 }, { "epoch": 0.04, "learning_rate": 0.0019997763360044395, "loss": 2.8362, "step": 1360 }, { "epoch": 0.04, "learning_rate": 0.001999774491430073, "loss": 3.0043, "step": 1361 }, { "epoch": 0.04, "learning_rate": 0.001999772639281594, "loss": 3.0097, "step": 1362 }, { "epoch": 0.04, "learning_rate": 0.001999770779559016, "loss": 2.7871, "step": 1363 }, { "epoch": 0.04, "learning_rate": 0.001999768912262353, "loss": 2.9092, "step": 1364 }, { "epoch": 0.04, "learning_rate": 0.0019997670373916206, "loss": 3.1781, "step": 1365 }, { "epoch": 0.04, "learning_rate": 0.0019997651549468307, "loss": 2.634, "step": 1366 }, { "epoch": 0.04, "learning_rate": 0.001999763264927999, "loss": 3.4233, "step": 1367 }, { "epoch": 0.04, "learning_rate": 0.00199976136733514, "loss": 2.7768, "step": 1368 }, { "epoch": 0.04, "learning_rate": 0.0019997594621682675, "loss": 2.74, "step": 1369 }, { "epoch": 0.04, "learning_rate": 0.0019997575494273955, "loss": 2.6148, "step": 1370 }, { "epoch": 0.04, "learning_rate": 0.0019997556291125396, "loss": 2.9645, "step": 1371 }, { "epoch": 0.04, "learning_rate": 0.0019997537012237136, "loss": 2.8581, "step": 1372 }, { "epoch": 0.04, "learning_rate": 0.0019997517657609322, "loss": 2.9786, "step": 1373 }, { "epoch": 0.04, "learning_rate": 0.0019997498227242107, "loss": 2.6835, "step": 1374 }, { "epoch": 0.04, "learning_rate": 0.0019997478721135624, "loss": 3.0417, "step": 1375 }, { "epoch": 0.04, "learning_rate": 0.0019997459139290035, "loss": 3.0083, "step": 1376 }, { "epoch": 0.04, "learning_rate": 0.0019997439481705486, "loss": 2.4723, "step": 1377 }, { "epoch": 0.04, "learning_rate": 0.0019997419748382116, "loss": 2.9175, "step": 1378 }, { "epoch": 0.04, "learning_rate": 0.0019997399939320083, "loss": 2.7924, "step": 1379 }, { "epoch": 0.04, "learning_rate": 0.001999738005451954, "loss": 3.4902, "step": 1380 }, { "epoch": 0.04, "learning_rate": 0.001999736009398063, "loss": 3.3801, "step": 1381 }, { "epoch": 0.04, "learning_rate": 0.0019997340057703508, "loss": 2.8904, "step": 1382 }, { "epoch": 0.04, "learning_rate": 0.001999731994568832, "loss": 2.9636, "step": 1383 }, { "epoch": 0.04, "learning_rate": 0.001999729975793523, "loss": 3.1288, "step": 1384 }, { "epoch": 0.04, "learning_rate": 0.001999727949444438, "loss": 3.2563, "step": 1385 }, { "epoch": 0.04, "learning_rate": 0.001999725915521593, "loss": 2.834, "step": 1386 }, { "epoch": 0.04, "learning_rate": 0.0019997238740250035, "loss": 2.8556, "step": 1387 }, { "epoch": 0.04, "learning_rate": 0.0019997218249546843, "loss": 2.8761, "step": 1388 }, { "epoch": 0.04, "learning_rate": 0.0019997197683106513, "loss": 2.7639, "step": 1389 }, { "epoch": 0.04, "learning_rate": 0.00199971770409292, "loss": 2.9818, "step": 1390 }, { "epoch": 0.04, "learning_rate": 0.0019997156323015063, "loss": 2.9367, "step": 1391 }, { "epoch": 0.04, "learning_rate": 0.0019997135529364256, "loss": 2.8783, "step": 1392 }, { "epoch": 0.04, "learning_rate": 0.001999711465997694, "loss": 2.8165, "step": 1393 }, { "epoch": 0.04, "learning_rate": 0.0019997093714853266, "loss": 2.9865, "step": 1394 }, { "epoch": 0.04, "learning_rate": 0.00199970726939934, "loss": 2.5012, "step": 1395 }, { "epoch": 0.04, "learning_rate": 0.00199970515973975, "loss": 2.5434, "step": 1396 }, { "epoch": 0.04, "learning_rate": 0.0019997030425065723, "loss": 2.5984, "step": 1397 }, { "epoch": 0.04, "learning_rate": 0.001999700917699823, "loss": 3.3116, "step": 1398 }, { "epoch": 0.04, "learning_rate": 0.0019996987853195185, "loss": 2.9377, "step": 1399 }, { "epoch": 0.04, "learning_rate": 0.0019996966453656746, "loss": 3.2011, "step": 1400 }, { "epoch": 0.04, "learning_rate": 0.0019996944978383072, "loss": 2.5413, "step": 1401 }, { "epoch": 0.04, "learning_rate": 0.0019996923427374334, "loss": 2.8906, "step": 1402 }, { "epoch": 0.04, "learning_rate": 0.001999690180063069, "loss": 2.8754, "step": 1403 }, { "epoch": 0.04, "learning_rate": 0.001999688009815231, "loss": 3.1375, "step": 1404 }, { "epoch": 0.04, "learning_rate": 0.001999685831993935, "loss": 2.9557, "step": 1405 }, { "epoch": 0.04, "learning_rate": 0.0019996836465991977, "loss": 2.6098, "step": 1406 }, { "epoch": 0.04, "learning_rate": 0.001999681453631036, "loss": 2.7846, "step": 1407 }, { "epoch": 0.04, "learning_rate": 0.001999679253089467, "loss": 3.1259, "step": 1408 }, { "epoch": 0.04, "learning_rate": 0.0019996770449745055, "loss": 2.9872, "step": 1409 }, { "epoch": 0.04, "learning_rate": 0.00199967482928617, "loss": 2.9399, "step": 1410 }, { "epoch": 0.04, "learning_rate": 0.0019996726060244768, "loss": 3.4218, "step": 1411 }, { "epoch": 0.04, "learning_rate": 0.0019996703751894427, "loss": 3.1421, "step": 1412 }, { "epoch": 0.04, "learning_rate": 0.0019996681367810843, "loss": 2.9771, "step": 1413 }, { "epoch": 0.04, "learning_rate": 0.001999665890799419, "loss": 2.8324, "step": 1414 }, { "epoch": 0.04, "learning_rate": 0.001999663637244464, "loss": 3.2396, "step": 1415 }, { "epoch": 0.04, "learning_rate": 0.001999661376116235, "loss": 2.8275, "step": 1416 }, { "epoch": 0.04, "learning_rate": 0.001999659107414751, "loss": 2.7838, "step": 1417 }, { "epoch": 0.04, "learning_rate": 0.001999656831140028, "loss": 3.1974, "step": 1418 }, { "epoch": 0.04, "learning_rate": 0.0019996545472920836, "loss": 3.1402, "step": 1419 }, { "epoch": 0.04, "learning_rate": 0.0019996522558709353, "loss": 2.811, "step": 1420 }, { "epoch": 0.04, "learning_rate": 0.0019996499568766, "loss": 3.1677, "step": 1421 }, { "epoch": 0.04, "learning_rate": 0.0019996476503090954, "loss": 3.0191, "step": 1422 }, { "epoch": 0.04, "learning_rate": 0.001999645336168439, "loss": 2.7674, "step": 1423 }, { "epoch": 0.04, "learning_rate": 0.001999643014454648, "loss": 3.0761, "step": 1424 }, { "epoch": 0.04, "learning_rate": 0.0019996406851677403, "loss": 3.1134, "step": 1425 }, { "epoch": 0.04, "learning_rate": 0.001999638348307734, "loss": 3.0296, "step": 1426 }, { "epoch": 0.04, "learning_rate": 0.0019996360038746458, "loss": 2.6557, "step": 1427 }, { "epoch": 0.04, "learning_rate": 0.001999633651868494, "loss": 2.9687, "step": 1428 }, { "epoch": 0.04, "learning_rate": 0.0019996312922892965, "loss": 3.0993, "step": 1429 }, { "epoch": 0.04, "learning_rate": 0.001999628925137071, "loss": 2.8018, "step": 1430 }, { "epoch": 0.04, "learning_rate": 0.001999626550411835, "loss": 2.3903, "step": 1431 }, { "epoch": 0.04, "learning_rate": 0.0019996241681136074, "loss": 3.1338, "step": 1432 }, { "epoch": 0.04, "learning_rate": 0.001999621778242406, "loss": 3.0022, "step": 1433 }, { "epoch": 0.04, "learning_rate": 0.0019996193807982486, "loss": 2.8303, "step": 1434 }, { "epoch": 0.04, "learning_rate": 0.0019996169757811534, "loss": 2.6689, "step": 1435 }, { "epoch": 0.04, "learning_rate": 0.001999614563191139, "loss": 2.799, "step": 1436 }, { "epoch": 0.04, "learning_rate": 0.001999612143028223, "loss": 2.9938, "step": 1437 }, { "epoch": 0.04, "learning_rate": 0.001999609715292424, "loss": 2.997, "step": 1438 }, { "epoch": 0.04, "learning_rate": 0.0019996072799837606, "loss": 2.786, "step": 1439 }, { "epoch": 0.04, "learning_rate": 0.0019996048371022515, "loss": 2.9408, "step": 1440 }, { "epoch": 0.04, "learning_rate": 0.0019996023866479147, "loss": 2.4544, "step": 1441 }, { "epoch": 0.04, "learning_rate": 0.001999599928620769, "loss": 2.8305, "step": 1442 }, { "epoch": 0.04, "learning_rate": 0.0019995974630208327, "loss": 2.8828, "step": 1443 }, { "epoch": 0.04, "learning_rate": 0.001999594989848125, "loss": 2.7325, "step": 1444 }, { "epoch": 0.04, "learning_rate": 0.0019995925091026642, "loss": 3.09, "step": 1445 }, { "epoch": 0.04, "learning_rate": 0.001999590020784469, "loss": 2.8552, "step": 1446 }, { "epoch": 0.04, "learning_rate": 0.0019995875248935593, "loss": 2.6562, "step": 1447 }, { "epoch": 0.04, "learning_rate": 0.0019995850214299528, "loss": 2.6824, "step": 1448 }, { "epoch": 0.04, "learning_rate": 0.001999582510393669, "loss": 2.6042, "step": 1449 }, { "epoch": 0.04, "learning_rate": 0.0019995799917847264, "loss": 2.7103, "step": 1450 }, { "epoch": 0.04, "learning_rate": 0.001999577465603145, "loss": 2.8546, "step": 1451 }, { "epoch": 0.04, "learning_rate": 0.001999574931848943, "loss": 2.9495, "step": 1452 }, { "epoch": 0.04, "learning_rate": 0.00199957239052214, "loss": 2.8197, "step": 1453 }, { "epoch": 0.04, "learning_rate": 0.0019995698416227555, "loss": 3.147, "step": 1454 }, { "epoch": 0.04, "learning_rate": 0.0019995672851508086, "loss": 3.1393, "step": 1455 }, { "epoch": 0.04, "learning_rate": 0.0019995647211063184, "loss": 3.0409, "step": 1456 }, { "epoch": 0.04, "learning_rate": 0.001999562149489305, "loss": 2.9292, "step": 1457 }, { "epoch": 0.04, "learning_rate": 0.001999559570299787, "loss": 3.154, "step": 1458 }, { "epoch": 0.04, "learning_rate": 0.001999556983537785, "loss": 2.4761, "step": 1459 }, { "epoch": 0.04, "learning_rate": 0.0019995543892033173, "loss": 2.9878, "step": 1460 }, { "epoch": 0.04, "learning_rate": 0.0019995517872964047, "loss": 2.889, "step": 1461 }, { "epoch": 0.04, "learning_rate": 0.0019995491778170664, "loss": 2.9205, "step": 1462 }, { "epoch": 0.04, "learning_rate": 0.0019995465607653222, "loss": 3.1088, "step": 1463 }, { "epoch": 0.04, "learning_rate": 0.0019995439361411922, "loss": 2.7724, "step": 1464 }, { "epoch": 0.04, "learning_rate": 0.001999541303944696, "loss": 2.9197, "step": 1465 }, { "epoch": 0.04, "learning_rate": 0.001999538664175853, "loss": 2.812, "step": 1466 }, { "epoch": 0.04, "learning_rate": 0.0019995360168346844, "loss": 2.6169, "step": 1467 }, { "epoch": 0.04, "learning_rate": 0.001999533361921209, "loss": 2.9549, "step": 1468 }, { "epoch": 0.04, "learning_rate": 0.001999530699435448, "loss": 3.1839, "step": 1469 }, { "epoch": 0.04, "learning_rate": 0.001999528029377421, "loss": 2.698, "step": 1470 }, { "epoch": 0.04, "learning_rate": 0.0019995253517471486, "loss": 2.7872, "step": 1471 }, { "epoch": 0.04, "learning_rate": 0.0019995226665446507, "loss": 2.9934, "step": 1472 }, { "epoch": 0.04, "learning_rate": 0.0019995199737699474, "loss": 3.0643, "step": 1473 }, { "epoch": 0.04, "learning_rate": 0.0019995172734230604, "loss": 2.7782, "step": 1474 }, { "epoch": 0.04, "learning_rate": 0.001999514565504008, "loss": 2.5235, "step": 1475 }, { "epoch": 0.04, "learning_rate": 0.001999511850012813, "loss": 3.0801, "step": 1476 }, { "epoch": 0.04, "learning_rate": 0.0019995091269494943, "loss": 3.082, "step": 1477 }, { "epoch": 0.04, "learning_rate": 0.0019995063963140734, "loss": 3.1533, "step": 1478 }, { "epoch": 0.04, "learning_rate": 0.0019995036581065707, "loss": 2.9027, "step": 1479 }, { "epoch": 0.04, "learning_rate": 0.001999500912327007, "loss": 3.0734, "step": 1480 }, { "epoch": 0.04, "learning_rate": 0.0019994981589754033, "loss": 2.8553, "step": 1481 }, { "epoch": 0.04, "learning_rate": 0.0019994953980517795, "loss": 3.0899, "step": 1482 }, { "epoch": 0.04, "learning_rate": 0.001999492629556158, "loss": 2.7635, "step": 1483 }, { "epoch": 0.04, "learning_rate": 0.0019994898534885586, "loss": 2.8954, "step": 1484 }, { "epoch": 0.04, "learning_rate": 0.001999487069849003, "loss": 2.8104, "step": 1485 }, { "epoch": 0.04, "learning_rate": 0.001999484278637512, "loss": 2.8462, "step": 1486 }, { "epoch": 0.04, "learning_rate": 0.001999481479854107, "loss": 2.6616, "step": 1487 }, { "epoch": 0.04, "learning_rate": 0.0019994786734988087, "loss": 3.0784, "step": 1488 }, { "epoch": 0.04, "learning_rate": 0.001999475859571639, "loss": 2.8823, "step": 1489 }, { "epoch": 0.04, "learning_rate": 0.0019994730380726183, "loss": 2.6074, "step": 1490 }, { "epoch": 0.04, "learning_rate": 0.0019994702090017687, "loss": 3.1529, "step": 1491 }, { "epoch": 0.04, "learning_rate": 0.001999467372359112, "loss": 2.9082, "step": 1492 }, { "epoch": 0.04, "learning_rate": 0.0019994645281446685, "loss": 2.6926, "step": 1493 }, { "epoch": 0.04, "learning_rate": 0.001999461676358461, "loss": 3.0139, "step": 1494 }, { "epoch": 0.04, "learning_rate": 0.00199945881700051, "loss": 2.7144, "step": 1495 }, { "epoch": 0.04, "learning_rate": 0.001999455950070838, "loss": 2.9919, "step": 1496 }, { "epoch": 0.04, "learning_rate": 0.0019994530755694665, "loss": 3.0589, "step": 1497 }, { "epoch": 0.04, "learning_rate": 0.001999450193496417, "loss": 2.525, "step": 1498 }, { "epoch": 0.04, "learning_rate": 0.0019994473038517117, "loss": 3.0936, "step": 1499 }, { "epoch": 0.04, "learning_rate": 0.001999444406635372, "loss": 2.9935, "step": 1500 }, { "epoch": 0.04, "learning_rate": 0.0019994415018474206, "loss": 3.1907, "step": 1501 }, { "epoch": 0.04, "learning_rate": 0.0019994385894878787, "loss": 2.9784, "step": 1502 }, { "epoch": 0.04, "learning_rate": 0.001999435669556769, "loss": 2.7818, "step": 1503 }, { "epoch": 0.04, "learning_rate": 0.0019994327420541132, "loss": 3.1642, "step": 1504 }, { "epoch": 0.04, "learning_rate": 0.001999429806979934, "loss": 2.4861, "step": 1505 }, { "epoch": 0.04, "learning_rate": 0.0019994268643342525, "loss": 2.7742, "step": 1506 }, { "epoch": 0.04, "learning_rate": 0.001999423914117092, "loss": 2.8266, "step": 1507 }, { "epoch": 0.04, "learning_rate": 0.0019994209563284748, "loss": 3.039, "step": 1508 }, { "epoch": 0.04, "learning_rate": 0.001999417990968423, "loss": 2.9491, "step": 1509 }, { "epoch": 0.04, "learning_rate": 0.0019994150180369596, "loss": 2.8708, "step": 1510 }, { "epoch": 0.04, "learning_rate": 0.001999412037534106, "loss": 3.2076, "step": 1511 }, { "epoch": 0.04, "learning_rate": 0.001999409049459886, "loss": 2.645, "step": 1512 }, { "epoch": 0.04, "learning_rate": 0.0019994060538143215, "loss": 2.8996, "step": 1513 }, { "epoch": 0.04, "learning_rate": 0.0019994030505974354, "loss": 2.9736, "step": 1514 }, { "epoch": 0.04, "learning_rate": 0.0019994000398092506, "loss": 2.8554, "step": 1515 }, { "epoch": 0.04, "learning_rate": 0.00199939702144979, "loss": 2.8253, "step": 1516 }, { "epoch": 0.04, "learning_rate": 0.0019993939955190755, "loss": 2.8682, "step": 1517 }, { "epoch": 0.04, "learning_rate": 0.0019993909620171315, "loss": 2.4629, "step": 1518 }, { "epoch": 0.04, "learning_rate": 0.00199938792094398, "loss": 2.7425, "step": 1519 }, { "epoch": 0.04, "learning_rate": 0.0019993848722996443, "loss": 2.9556, "step": 1520 }, { "epoch": 0.04, "learning_rate": 0.001999381816084147, "loss": 2.6609, "step": 1521 }, { "epoch": 0.04, "learning_rate": 0.0019993787522975125, "loss": 2.9513, "step": 1522 }, { "epoch": 0.04, "learning_rate": 0.0019993756809397628, "loss": 2.443, "step": 1523 }, { "epoch": 0.04, "learning_rate": 0.0019993726020109217, "loss": 3.1615, "step": 1524 }, { "epoch": 0.04, "learning_rate": 0.0019993695155110123, "loss": 2.9854, "step": 1525 }, { "epoch": 0.04, "learning_rate": 0.0019993664214400584, "loss": 2.5698, "step": 1526 }, { "epoch": 0.04, "learning_rate": 0.001999363319798083, "loss": 2.9871, "step": 1527 }, { "epoch": 0.04, "learning_rate": 0.0019993602105851096, "loss": 2.8094, "step": 1528 }, { "epoch": 0.04, "learning_rate": 0.0019993570938011624, "loss": 3.1691, "step": 1529 }, { "epoch": 0.04, "learning_rate": 0.0019993539694462643, "loss": 3.0746, "step": 1530 }, { "epoch": 0.04, "learning_rate": 0.001999350837520439, "loss": 2.4342, "step": 1531 }, { "epoch": 0.04, "learning_rate": 0.0019993476980237107, "loss": 3.0124, "step": 1532 }, { "epoch": 0.04, "learning_rate": 0.0019993445509561025, "loss": 2.2792, "step": 1533 }, { "epoch": 0.04, "learning_rate": 0.001999341396317639, "loss": 3.2041, "step": 1534 }, { "epoch": 0.04, "learning_rate": 0.0019993382341083436, "loss": 2.5778, "step": 1535 }, { "epoch": 0.04, "learning_rate": 0.0019993350643282403, "loss": 2.7523, "step": 1536 }, { "epoch": 0.04, "learning_rate": 0.0019993318869773536, "loss": 2.9986, "step": 1537 }, { "epoch": 0.04, "learning_rate": 0.001999328702055707, "loss": 2.8356, "step": 1538 }, { "epoch": 0.04, "learning_rate": 0.001999325509563325, "loss": 2.6104, "step": 1539 }, { "epoch": 0.04, "learning_rate": 0.001999322309500231, "loss": 2.6056, "step": 1540 }, { "epoch": 0.04, "learning_rate": 0.0019993191018664504, "loss": 2.8982, "step": 1541 }, { "epoch": 0.04, "learning_rate": 0.0019993158866620066, "loss": 2.7298, "step": 1542 }, { "epoch": 0.04, "learning_rate": 0.0019993126638869247, "loss": 3.0955, "step": 1543 }, { "epoch": 0.04, "learning_rate": 0.0019993094335412284, "loss": 2.905, "step": 1544 }, { "epoch": 0.04, "learning_rate": 0.0019993061956249426, "loss": 2.9576, "step": 1545 }, { "epoch": 0.04, "learning_rate": 0.0019993029501380916, "loss": 2.8779, "step": 1546 }, { "epoch": 0.04, "learning_rate": 0.0019992996970807004, "loss": 3.1305, "step": 1547 }, { "epoch": 0.04, "learning_rate": 0.001999296436452793, "loss": 3.3541, "step": 1548 }, { "epoch": 0.04, "learning_rate": 0.001999293168254395, "loss": 3.1718, "step": 1549 }, { "epoch": 0.04, "learning_rate": 0.00199928989248553, "loss": 2.5306, "step": 1550 }, { "epoch": 0.04, "learning_rate": 0.0019992866091462233, "loss": 3.0099, "step": 1551 }, { "epoch": 0.04, "learning_rate": 0.0019992833182365007, "loss": 2.8949, "step": 1552 }, { "epoch": 0.04, "learning_rate": 0.0019992800197563857, "loss": 2.9873, "step": 1553 }, { "epoch": 0.04, "learning_rate": 0.001999276713705904, "loss": 2.6588, "step": 1554 }, { "epoch": 0.04, "learning_rate": 0.0019992734000850807, "loss": 2.8188, "step": 1555 }, { "epoch": 0.04, "learning_rate": 0.001999270078893941, "loss": 3.1787, "step": 1556 }, { "epoch": 0.04, "learning_rate": 0.0019992667501325095, "loss": 2.6552, "step": 1557 }, { "epoch": 0.04, "learning_rate": 0.001999263413800812, "loss": 2.5115, "step": 1558 }, { "epoch": 0.04, "learning_rate": 0.0019992600698988732, "loss": 3.1082, "step": 1559 }, { "epoch": 0.04, "learning_rate": 0.0019992567184267188, "loss": 2.522, "step": 1560 }, { "epoch": 0.04, "learning_rate": 0.0019992533593843746, "loss": 2.85, "step": 1561 }, { "epoch": 0.04, "learning_rate": 0.001999249992771865, "loss": 2.747, "step": 1562 }, { "epoch": 0.04, "learning_rate": 0.001999246618589217, "loss": 2.9731, "step": 1563 }, { "epoch": 0.04, "learning_rate": 0.0019992432368364545, "loss": 2.897, "step": 1564 }, { "epoch": 0.04, "learning_rate": 0.001999239847513604, "loss": 2.8791, "step": 1565 }, { "epoch": 0.04, "learning_rate": 0.0019992364506206907, "loss": 2.8465, "step": 1566 }, { "epoch": 0.04, "learning_rate": 0.0019992330461577417, "loss": 2.5468, "step": 1567 }, { "epoch": 0.04, "learning_rate": 0.001999229634124781, "loss": 2.7057, "step": 1568 }, { "epoch": 0.04, "learning_rate": 0.001999226214521835, "loss": 3.2449, "step": 1569 }, { "epoch": 0.04, "learning_rate": 0.0019992227873489306, "loss": 2.9148, "step": 1570 }, { "epoch": 0.04, "learning_rate": 0.0019992193526060928, "loss": 2.7879, "step": 1571 }, { "epoch": 0.04, "learning_rate": 0.0019992159102933476, "loss": 2.7559, "step": 1572 }, { "epoch": 0.04, "learning_rate": 0.0019992124604107215, "loss": 3.1414, "step": 1573 }, { "epoch": 0.04, "learning_rate": 0.0019992090029582405, "loss": 3.3364, "step": 1574 }, { "epoch": 0.04, "learning_rate": 0.0019992055379359306, "loss": 2.8609, "step": 1575 }, { "epoch": 0.04, "learning_rate": 0.0019992020653438183, "loss": 2.933, "step": 1576 }, { "epoch": 0.04, "learning_rate": 0.0019991985851819296, "loss": 3.0689, "step": 1577 }, { "epoch": 0.04, "learning_rate": 0.001999195097450291, "loss": 3.1145, "step": 1578 }, { "epoch": 0.04, "learning_rate": 0.0019991916021489292, "loss": 2.4657, "step": 1579 }, { "epoch": 0.04, "learning_rate": 0.00199918809927787, "loss": 2.7365, "step": 1580 }, { "epoch": 0.04, "learning_rate": 0.001999184588837141, "loss": 2.7793, "step": 1581 }, { "epoch": 0.04, "learning_rate": 0.001999181070826768, "loss": 2.9834, "step": 1582 }, { "epoch": 0.04, "learning_rate": 0.001999177545246778, "loss": 2.7329, "step": 1583 }, { "epoch": 0.04, "learning_rate": 0.001999174012097197, "loss": 2.7422, "step": 1584 }, { "epoch": 0.04, "learning_rate": 0.001999170471378053, "loss": 3.0553, "step": 1585 }, { "epoch": 0.04, "learning_rate": 0.001999166923089372, "loss": 3.0621, "step": 1586 }, { "epoch": 0.04, "learning_rate": 0.0019991633672311808, "loss": 2.6618, "step": 1587 }, { "epoch": 0.04, "learning_rate": 0.0019991598038035067, "loss": 2.7598, "step": 1588 }, { "epoch": 0.04, "learning_rate": 0.001999156232806376, "loss": 3.1684, "step": 1589 }, { "epoch": 0.04, "learning_rate": 0.001999152654239817, "loss": 3.0665, "step": 1590 }, { "epoch": 0.04, "learning_rate": 0.001999149068103856, "loss": 2.7844, "step": 1591 }, { "epoch": 0.04, "learning_rate": 0.0019991454743985204, "loss": 2.8478, "step": 1592 }, { "epoch": 0.04, "learning_rate": 0.001999141873123837, "loss": 2.997, "step": 1593 }, { "epoch": 0.04, "learning_rate": 0.0019991382642798334, "loss": 2.7922, "step": 1594 }, { "epoch": 0.04, "learning_rate": 0.001999134647866537, "loss": 2.7528, "step": 1595 }, { "epoch": 0.04, "learning_rate": 0.0019991310238839754, "loss": 2.7292, "step": 1596 }, { "epoch": 0.04, "learning_rate": 0.0019991273923321757, "loss": 2.7342, "step": 1597 }, { "epoch": 0.04, "learning_rate": 0.001999123753211165, "loss": 2.9659, "step": 1598 }, { "epoch": 0.04, "learning_rate": 0.0019991201065209722, "loss": 2.6273, "step": 1599 }, { "epoch": 0.04, "learning_rate": 0.0019991164522616236, "loss": 3.0449, "step": 1600 }, { "epoch": 0.04, "learning_rate": 0.0019991127904331473, "loss": 2.7548, "step": 1601 }, { "epoch": 0.04, "learning_rate": 0.001999109121035571, "loss": 3.1649, "step": 1602 }, { "epoch": 0.04, "learning_rate": 0.0019991054440689233, "loss": 2.7291, "step": 1603 }, { "epoch": 0.04, "learning_rate": 0.001999101759533231, "loss": 3.0354, "step": 1604 }, { "epoch": 0.04, "learning_rate": 0.0019990980674285223, "loss": 3.0352, "step": 1605 }, { "epoch": 0.04, "learning_rate": 0.001999094367754825, "loss": 3.1124, "step": 1606 }, { "epoch": 0.04, "learning_rate": 0.0019990906605121678, "loss": 3.1904, "step": 1607 }, { "epoch": 0.04, "learning_rate": 0.0019990869457005784, "loss": 2.6837, "step": 1608 }, { "epoch": 0.04, "learning_rate": 0.0019990832233200847, "loss": 3.1758, "step": 1609 }, { "epoch": 0.04, "learning_rate": 0.0019990794933707153, "loss": 2.9678, "step": 1610 }, { "epoch": 0.04, "learning_rate": 0.0019990757558524985, "loss": 2.8735, "step": 1611 }, { "epoch": 0.04, "learning_rate": 0.001999072010765462, "loss": 2.9952, "step": 1612 }, { "epoch": 0.04, "learning_rate": 0.001999068258109635, "loss": 2.513, "step": 1613 }, { "epoch": 0.04, "learning_rate": 0.001999064497885045, "loss": 3.0562, "step": 1614 }, { "epoch": 0.04, "learning_rate": 0.001999060730091721, "loss": 3.588, "step": 1615 }, { "epoch": 0.04, "learning_rate": 0.001999056954729692, "loss": 2.7885, "step": 1616 }, { "epoch": 0.04, "learning_rate": 0.0019990531717989854, "loss": 2.8912, "step": 1617 }, { "epoch": 0.04, "learning_rate": 0.001999049381299631, "loss": 2.8587, "step": 1618 }, { "epoch": 0.04, "learning_rate": 0.001999045583231657, "loss": 3.2204, "step": 1619 }, { "epoch": 0.04, "learning_rate": 0.0019990417775950925, "loss": 2.6306, "step": 1620 }, { "epoch": 0.04, "learning_rate": 0.0019990379643899663, "loss": 2.3184, "step": 1621 }, { "epoch": 0.04, "learning_rate": 0.0019990341436163066, "loss": 2.5457, "step": 1622 }, { "epoch": 0.04, "learning_rate": 0.001999030315274143, "loss": 2.8431, "step": 1623 }, { "epoch": 0.04, "learning_rate": 0.0019990264793635043, "loss": 3.0813, "step": 1624 }, { "epoch": 0.04, "learning_rate": 0.0019990226358844194, "loss": 2.7094, "step": 1625 }, { "epoch": 0.04, "learning_rate": 0.001999018784836918, "loss": 2.7376, "step": 1626 }, { "epoch": 0.04, "learning_rate": 0.0019990149262210286, "loss": 2.7035, "step": 1627 }, { "epoch": 0.04, "learning_rate": 0.001999011060036781, "loss": 2.4618, "step": 1628 }, { "epoch": 0.04, "learning_rate": 0.001999007186284204, "loss": 2.8328, "step": 1629 }, { "epoch": 0.04, "learning_rate": 0.0019990033049633272, "loss": 2.7363, "step": 1630 }, { "epoch": 0.04, "learning_rate": 0.0019989994160741803, "loss": 2.5647, "step": 1631 }, { "epoch": 0.04, "learning_rate": 0.0019989955196167922, "loss": 3.1807, "step": 1632 }, { "epoch": 0.04, "learning_rate": 0.0019989916155911925, "loss": 3.4666, "step": 1633 }, { "epoch": 0.04, "learning_rate": 0.001998987703997411, "loss": 2.9107, "step": 1634 }, { "epoch": 0.04, "learning_rate": 0.001998983784835477, "loss": 2.9844, "step": 1635 }, { "epoch": 0.04, "learning_rate": 0.0019989798581054206, "loss": 2.5932, "step": 1636 }, { "epoch": 0.04, "learning_rate": 0.0019989759238072716, "loss": 2.6929, "step": 1637 }, { "epoch": 0.04, "learning_rate": 0.0019989719819410597, "loss": 3.2339, "step": 1638 }, { "epoch": 0.04, "learning_rate": 0.001998968032506815, "loss": 2.6642, "step": 1639 }, { "epoch": 0.04, "learning_rate": 0.0019989640755045664, "loss": 2.7299, "step": 1640 }, { "epoch": 0.04, "learning_rate": 0.0019989601109343443, "loss": 2.8709, "step": 1641 }, { "epoch": 0.04, "learning_rate": 0.0019989561387961795, "loss": 2.8538, "step": 1642 }, { "epoch": 0.04, "learning_rate": 0.001998952159090102, "loss": 2.8624, "step": 1643 }, { "epoch": 0.04, "learning_rate": 0.0019989481718161407, "loss": 2.6502, "step": 1644 }, { "epoch": 0.04, "learning_rate": 0.001998944176974327, "loss": 2.9571, "step": 1645 }, { "epoch": 0.04, "learning_rate": 0.001998940174564691, "loss": 2.983, "step": 1646 }, { "epoch": 0.04, "learning_rate": 0.0019989361645872624, "loss": 2.8402, "step": 1647 }, { "epoch": 0.04, "learning_rate": 0.0019989321470420722, "loss": 2.6918, "step": 1648 }, { "epoch": 0.04, "learning_rate": 0.0019989281219291504, "loss": 2.8259, "step": 1649 }, { "epoch": 0.04, "learning_rate": 0.0019989240892485283, "loss": 2.9407, "step": 1650 }, { "epoch": 0.04, "learning_rate": 0.0019989200490002357, "loss": 2.7441, "step": 1651 }, { "epoch": 0.04, "learning_rate": 0.0019989160011843034, "loss": 2.9407, "step": 1652 }, { "epoch": 0.04, "learning_rate": 0.001998911945800762, "loss": 2.8579, "step": 1653 }, { "epoch": 0.04, "learning_rate": 0.001998907882849642, "loss": 2.8634, "step": 1654 }, { "epoch": 0.04, "learning_rate": 0.001998903812330975, "loss": 2.8216, "step": 1655 }, { "epoch": 0.04, "learning_rate": 0.001998899734244791, "loss": 2.643, "step": 1656 }, { "epoch": 0.04, "learning_rate": 0.0019988956485911214, "loss": 2.8727, "step": 1657 }, { "epoch": 0.04, "learning_rate": 0.0019988915553699966, "loss": 2.8918, "step": 1658 }, { "epoch": 0.04, "learning_rate": 0.0019988874545814484, "loss": 2.7076, "step": 1659 }, { "epoch": 0.04, "learning_rate": 0.0019988833462255074, "loss": 2.6934, "step": 1660 }, { "epoch": 0.04, "learning_rate": 0.0019988792303022042, "loss": 2.3923, "step": 1661 }, { "epoch": 0.04, "learning_rate": 0.001998875106811571, "loss": 2.8971, "step": 1662 }, { "epoch": 0.04, "learning_rate": 0.0019988709757536387, "loss": 2.8688, "step": 1663 }, { "epoch": 0.04, "learning_rate": 0.001998866837128438, "loss": 3.0989, "step": 1664 }, { "epoch": 0.04, "learning_rate": 0.001998862690936001, "loss": 3.1674, "step": 1665 }, { "epoch": 0.04, "learning_rate": 0.0019988585371763586, "loss": 2.8349, "step": 1666 }, { "epoch": 0.04, "learning_rate": 0.001998854375849543, "loss": 3.2202, "step": 1667 }, { "epoch": 0.04, "learning_rate": 0.0019988502069555845, "loss": 2.8359, "step": 1668 }, { "epoch": 0.04, "learning_rate": 0.001998846030494516, "loss": 2.8951, "step": 1669 }, { "epoch": 0.04, "learning_rate": 0.0019988418464663683, "loss": 3.1392, "step": 1670 }, { "epoch": 0.04, "learning_rate": 0.001998837654871173, "loss": 2.8785, "step": 1671 }, { "epoch": 0.04, "learning_rate": 0.001998833455708963, "loss": 2.7998, "step": 1672 }, { "epoch": 0.04, "learning_rate": 0.0019988292489797692, "loss": 2.8977, "step": 1673 }, { "epoch": 0.04, "learning_rate": 0.0019988250346836232, "loss": 3.3858, "step": 1674 }, { "epoch": 0.05, "learning_rate": 0.0019988208128205575, "loss": 2.3873, "step": 1675 }, { "epoch": 0.05, "learning_rate": 0.0019988165833906037, "loss": 3.0469, "step": 1676 }, { "epoch": 0.05, "learning_rate": 0.0019988123463937943, "loss": 2.9506, "step": 1677 }, { "epoch": 0.05, "learning_rate": 0.0019988081018301605, "loss": 2.9591, "step": 1678 }, { "epoch": 0.05, "learning_rate": 0.001998803849699736, "loss": 2.8589, "step": 1679 }, { "epoch": 0.05, "learning_rate": 0.0019987995900025515, "loss": 2.7771, "step": 1680 }, { "epoch": 0.05, "learning_rate": 0.0019987953227386403, "loss": 2.768, "step": 1681 }, { "epoch": 0.05, "learning_rate": 0.0019987910479080336, "loss": 3.0573, "step": 1682 }, { "epoch": 0.05, "learning_rate": 0.0019987867655107652, "loss": 3.4222, "step": 1683 }, { "epoch": 0.05, "learning_rate": 0.001998782475546867, "loss": 2.6892, "step": 1684 }, { "epoch": 0.05, "learning_rate": 0.0019987781780163704, "loss": 3.0156, "step": 1685 }, { "epoch": 0.05, "learning_rate": 0.00199877387291931, "loss": 2.8697, "step": 1686 }, { "epoch": 0.05, "learning_rate": 0.0019987695602557165, "loss": 2.4811, "step": 1687 }, { "epoch": 0.05, "learning_rate": 0.0019987652400256235, "loss": 3.1867, "step": 1688 }, { "epoch": 0.05, "learning_rate": 0.0019987609122290636, "loss": 2.9187, "step": 1689 }, { "epoch": 0.05, "learning_rate": 0.0019987565768660696, "loss": 2.9649, "step": 1690 }, { "epoch": 0.05, "learning_rate": 0.001998752233936674, "loss": 3.2325, "step": 1691 }, { "epoch": 0.05, "learning_rate": 0.001998747883440911, "loss": 2.7362, "step": 1692 }, { "epoch": 0.05, "learning_rate": 0.001998743525378812, "loss": 2.7889, "step": 1693 }, { "epoch": 0.05, "learning_rate": 0.0019987391597504106, "loss": 3.134, "step": 1694 }, { "epoch": 0.05, "learning_rate": 0.00199873478655574, "loss": 3.0704, "step": 1695 }, { "epoch": 0.05, "learning_rate": 0.001998730405794833, "loss": 3.1504, "step": 1696 }, { "epoch": 0.05, "learning_rate": 0.001998726017467723, "loss": 3.0714, "step": 1697 }, { "epoch": 0.05, "learning_rate": 0.0019987216215744436, "loss": 2.928, "step": 1698 }, { "epoch": 0.05, "learning_rate": 0.0019987172181150275, "loss": 2.7301, "step": 1699 }, { "epoch": 0.05, "learning_rate": 0.0019987128070895082, "loss": 2.7671, "step": 1700 }, { "epoch": 0.05, "learning_rate": 0.0019987083884979192, "loss": 3.246, "step": 1701 }, { "epoch": 0.05, "learning_rate": 0.0019987039623402944, "loss": 2.6545, "step": 1702 }, { "epoch": 0.05, "learning_rate": 0.0019986995286166665, "loss": 2.8913, "step": 1703 }, { "epoch": 0.05, "learning_rate": 0.00199869508732707, "loss": 2.9406, "step": 1704 }, { "epoch": 0.05, "learning_rate": 0.001998690638471538, "loss": 3.0397, "step": 1705 }, { "epoch": 0.05, "learning_rate": 0.0019986861820501037, "loss": 2.6531, "step": 1706 }, { "epoch": 0.05, "learning_rate": 0.001998681718062802, "loss": 2.5684, "step": 1707 }, { "epoch": 0.05, "learning_rate": 0.001998677246509666, "loss": 2.9343, "step": 1708 }, { "epoch": 0.05, "learning_rate": 0.0019986727673907295, "loss": 2.7437, "step": 1709 }, { "epoch": 0.05, "learning_rate": 0.001998668280706027, "loss": 2.8168, "step": 1710 }, { "epoch": 0.05, "learning_rate": 0.001998663786455592, "loss": 2.9227, "step": 1711 }, { "epoch": 0.05, "learning_rate": 0.0019986592846394586, "loss": 2.6833, "step": 1712 }, { "epoch": 0.05, "learning_rate": 0.0019986547752576613, "loss": 2.6201, "step": 1713 }, { "epoch": 0.05, "learning_rate": 0.0019986502583102337, "loss": 2.6198, "step": 1714 }, { "epoch": 0.05, "learning_rate": 0.0019986457337972103, "loss": 2.8344, "step": 1715 }, { "epoch": 0.05, "learning_rate": 0.0019986412017186255, "loss": 3.4667, "step": 1716 }, { "epoch": 0.05, "learning_rate": 0.0019986366620745135, "loss": 3.0254, "step": 1717 }, { "epoch": 0.05, "learning_rate": 0.0019986321148649086, "loss": 2.7318, "step": 1718 }, { "epoch": 0.05, "learning_rate": 0.001998627560089845, "loss": 2.5557, "step": 1719 }, { "epoch": 0.05, "learning_rate": 0.0019986229977493578, "loss": 3.0843, "step": 1720 }, { "epoch": 0.05, "learning_rate": 0.0019986184278434817, "loss": 2.637, "step": 1721 }, { "epoch": 0.05, "learning_rate": 0.0019986138503722507, "loss": 2.8174, "step": 1722 }, { "epoch": 0.05, "learning_rate": 0.0019986092653356997, "loss": 2.6955, "step": 1723 }, { "epoch": 0.05, "learning_rate": 0.001998604672733863, "loss": 2.7417, "step": 1724 }, { "epoch": 0.05, "learning_rate": 0.0019986000725667765, "loss": 2.7141, "step": 1725 }, { "epoch": 0.05, "learning_rate": 0.001998595464834474, "loss": 2.8898, "step": 1726 }, { "epoch": 0.05, "learning_rate": 0.001998590849536991, "loss": 2.6636, "step": 1727 }, { "epoch": 0.05, "learning_rate": 0.001998586226674362, "loss": 2.8533, "step": 1728 }, { "epoch": 0.05, "learning_rate": 0.001998581596246622, "loss": 2.4759, "step": 1729 }, { "epoch": 0.05, "learning_rate": 0.0019985769582538068, "loss": 2.8612, "step": 1730 }, { "epoch": 0.05, "learning_rate": 0.0019985723126959513, "loss": 3.0251, "step": 1731 }, { "epoch": 0.05, "learning_rate": 0.0019985676595730903, "loss": 2.7068, "step": 1732 }, { "epoch": 0.05, "learning_rate": 0.001998562998885259, "loss": 2.8676, "step": 1733 }, { "epoch": 0.05, "learning_rate": 0.001998558330632493, "loss": 2.7703, "step": 1734 }, { "epoch": 0.05, "learning_rate": 0.001998553654814828, "loss": 2.6781, "step": 1735 }, { "epoch": 0.05, "learning_rate": 0.0019985489714322985, "loss": 2.9408, "step": 1736 }, { "epoch": 0.05, "learning_rate": 0.001998544280484941, "loss": 2.7877, "step": 1737 }, { "epoch": 0.05, "learning_rate": 0.0019985395819727904, "loss": 2.6007, "step": 1738 }, { "epoch": 0.05, "learning_rate": 0.0019985348758958825, "loss": 2.4615, "step": 1739 }, { "epoch": 0.05, "learning_rate": 0.0019985301622542522, "loss": 2.8027, "step": 1740 }, { "epoch": 0.05, "learning_rate": 0.0019985254410479366, "loss": 3.0887, "step": 1741 }, { "epoch": 0.05, "learning_rate": 0.001998520712276971, "loss": 2.6071, "step": 1742 }, { "epoch": 0.05, "learning_rate": 0.001998515975941391, "loss": 2.7821, "step": 1743 }, { "epoch": 0.05, "learning_rate": 0.001998511232041232, "loss": 2.3928, "step": 1744 }, { "epoch": 0.05, "learning_rate": 0.0019985064805765305, "loss": 3.3893, "step": 1745 }, { "epoch": 0.05, "learning_rate": 0.0019985017215473225, "loss": 2.6929, "step": 1746 }, { "epoch": 0.05, "learning_rate": 0.0019984969549536437, "loss": 2.9088, "step": 1747 }, { "epoch": 0.05, "learning_rate": 0.001998492180795531, "loss": 2.3833, "step": 1748 }, { "epoch": 0.05, "learning_rate": 0.0019984873990730196, "loss": 3.1816, "step": 1749 }, { "epoch": 0.05, "learning_rate": 0.0019984826097861467, "loss": 2.6441, "step": 1750 }, { "epoch": 0.05, "learning_rate": 0.001998477812934948, "loss": 2.861, "step": 1751 }, { "epoch": 0.05, "learning_rate": 0.001998473008519459, "loss": 2.7383, "step": 1752 }, { "epoch": 0.05, "learning_rate": 0.001998468196539718, "loss": 2.6858, "step": 1753 }, { "epoch": 0.05, "learning_rate": 0.00199846337699576, "loss": 2.6086, "step": 1754 }, { "epoch": 0.05, "learning_rate": 0.001998458549887622, "loss": 2.6797, "step": 1755 }, { "epoch": 0.05, "learning_rate": 0.001998453715215341, "loss": 2.6442, "step": 1756 }, { "epoch": 0.05, "learning_rate": 0.0019984488729789525, "loss": 2.9596, "step": 1757 }, { "epoch": 0.05, "learning_rate": 0.001998444023178494, "loss": 2.6035, "step": 1758 }, { "epoch": 0.05, "learning_rate": 0.001998439165814002, "loss": 2.6452, "step": 1759 }, { "epoch": 0.05, "learning_rate": 0.001998434300885514, "loss": 2.5269, "step": 1760 }, { "epoch": 0.05, "learning_rate": 0.0019984294283930657, "loss": 2.8362, "step": 1761 }, { "epoch": 0.05, "learning_rate": 0.0019984245483366946, "loss": 2.9294, "step": 1762 }, { "epoch": 0.05, "learning_rate": 0.0019984196607164377, "loss": 3.1863, "step": 1763 }, { "epoch": 0.05, "learning_rate": 0.001998414765532332, "loss": 2.7258, "step": 1764 }, { "epoch": 0.05, "learning_rate": 0.0019984098627844143, "loss": 3.0457, "step": 1765 }, { "epoch": 0.05, "learning_rate": 0.0019984049524727223, "loss": 2.8481, "step": 1766 }, { "epoch": 0.05, "learning_rate": 0.001998400034597293, "loss": 2.708, "step": 1767 }, { "epoch": 0.05, "learning_rate": 0.001998395109158163, "loss": 3.1834, "step": 1768 }, { "epoch": 0.05, "learning_rate": 0.0019983901761553703, "loss": 3.1202, "step": 1769 }, { "epoch": 0.05, "learning_rate": 0.001998385235588952, "loss": 3.0453, "step": 1770 }, { "epoch": 0.05, "learning_rate": 0.001998380287458946, "loss": 3.1017, "step": 1771 }, { "epoch": 0.05, "learning_rate": 0.0019983753317653896, "loss": 2.9096, "step": 1772 }, { "epoch": 0.05, "learning_rate": 0.00199837036850832, "loss": 2.4446, "step": 1773 }, { "epoch": 0.05, "learning_rate": 0.001998365397687775, "loss": 2.5367, "step": 1774 }, { "epoch": 0.05, "learning_rate": 0.0019983604193037916, "loss": 2.6367, "step": 1775 }, { "epoch": 0.05, "learning_rate": 0.0019983554333564088, "loss": 2.7868, "step": 1776 }, { "epoch": 0.05, "learning_rate": 0.0019983504398456637, "loss": 2.7784, "step": 1777 }, { "epoch": 0.05, "learning_rate": 0.001998345438771594, "loss": 2.4809, "step": 1778 }, { "epoch": 0.05, "learning_rate": 0.0019983404301342376, "loss": 2.8778, "step": 1779 }, { "epoch": 0.05, "learning_rate": 0.001998335413933633, "loss": 2.7322, "step": 1780 }, { "epoch": 0.05, "learning_rate": 0.0019983303901698174, "loss": 2.733, "step": 1781 }, { "epoch": 0.05, "learning_rate": 0.0019983253588428296, "loss": 2.7295, "step": 1782 }, { "epoch": 0.05, "learning_rate": 0.001998320319952707, "loss": 2.5242, "step": 1783 }, { "epoch": 0.05, "learning_rate": 0.0019983152734994888, "loss": 3.0823, "step": 1784 }, { "epoch": 0.05, "learning_rate": 0.001998310219483212, "loss": 2.8737, "step": 1785 }, { "epoch": 0.05, "learning_rate": 0.0019983051579039153, "loss": 3.1568, "step": 1786 }, { "epoch": 0.05, "learning_rate": 0.0019983000887616375, "loss": 2.6464, "step": 1787 }, { "epoch": 0.05, "learning_rate": 0.001998295012056417, "loss": 2.8134, "step": 1788 }, { "epoch": 0.05, "learning_rate": 0.0019982899277882914, "loss": 2.8553, "step": 1789 }, { "epoch": 0.05, "learning_rate": 0.0019982848359573003, "loss": 3.0366, "step": 1790 }, { "epoch": 0.05, "learning_rate": 0.001998279736563481, "loss": 2.8851, "step": 1791 }, { "epoch": 0.05, "learning_rate": 0.0019982746296068736, "loss": 2.5262, "step": 1792 }, { "epoch": 0.05, "learning_rate": 0.001998269515087516, "loss": 2.7852, "step": 1793 }, { "epoch": 0.05, "learning_rate": 0.001998264393005447, "loss": 2.7035, "step": 1794 }, { "epoch": 0.05, "learning_rate": 0.001998259263360705, "loss": 2.5145, "step": 1795 }, { "epoch": 0.05, "learning_rate": 0.0019982541261533296, "loss": 2.5449, "step": 1796 }, { "epoch": 0.05, "learning_rate": 0.0019982489813833593, "loss": 2.7808, "step": 1797 }, { "epoch": 0.05, "learning_rate": 0.0019982438290508334, "loss": 3.1054, "step": 1798 }, { "epoch": 0.05, "learning_rate": 0.0019982386691557905, "loss": 2.7113, "step": 1799 }, { "epoch": 0.05, "learning_rate": 0.00199823350169827, "loss": 3.2727, "step": 1800 }, { "epoch": 0.05, "learning_rate": 0.001998228326678311, "loss": 2.5443, "step": 1801 }, { "epoch": 0.05, "learning_rate": 0.001998223144095953, "loss": 2.992, "step": 1802 }, { "epoch": 0.05, "learning_rate": 0.0019982179539512345, "loss": 3.1139, "step": 1803 }, { "epoch": 0.05, "learning_rate": 0.0019982127562441954, "loss": 2.7633, "step": 1804 }, { "epoch": 0.05, "learning_rate": 0.0019982075509748748, "loss": 2.936, "step": 1805 }, { "epoch": 0.05, "learning_rate": 0.001998202338143312, "loss": 2.9104, "step": 1806 }, { "epoch": 0.05, "learning_rate": 0.0019981971177495473, "loss": 2.695, "step": 1807 }, { "epoch": 0.05, "learning_rate": 0.0019981918897936197, "loss": 2.7997, "step": 1808 }, { "epoch": 0.05, "learning_rate": 0.0019981866542755685, "loss": 3.2795, "step": 1809 }, { "epoch": 0.05, "learning_rate": 0.0019981814111954335, "loss": 3.1697, "step": 1810 }, { "epoch": 0.05, "learning_rate": 0.0019981761605532547, "loss": 2.8074, "step": 1811 }, { "epoch": 0.05, "learning_rate": 0.001998170902349072, "loss": 2.6948, "step": 1812 }, { "epoch": 0.05, "learning_rate": 0.001998165636582925, "loss": 2.6208, "step": 1813 }, { "epoch": 0.05, "learning_rate": 0.0019981603632548534, "loss": 2.8715, "step": 1814 }, { "epoch": 0.05, "learning_rate": 0.001998155082364897, "loss": 2.8582, "step": 1815 }, { "epoch": 0.05, "learning_rate": 0.001998149793913097, "loss": 2.5973, "step": 1816 }, { "epoch": 0.05, "learning_rate": 0.001998144497899492, "loss": 3.1958, "step": 1817 }, { "epoch": 0.05, "learning_rate": 0.001998139194324123, "loss": 2.8599, "step": 1818 }, { "epoch": 0.05, "learning_rate": 0.00199813388318703, "loss": 2.7628, "step": 1819 }, { "epoch": 0.05, "learning_rate": 0.0019981285644882526, "loss": 2.8071, "step": 1820 }, { "epoch": 0.05, "learning_rate": 0.001998123238227832, "loss": 2.37, "step": 1821 }, { "epoch": 0.05, "learning_rate": 0.0019981179044058083, "loss": 3.072, "step": 1822 }, { "epoch": 0.05, "learning_rate": 0.001998112563022222, "loss": 2.9442, "step": 1823 }, { "epoch": 0.05, "learning_rate": 0.001998107214077113, "loss": 2.8431, "step": 1824 }, { "epoch": 0.05, "learning_rate": 0.0019981018575705224, "loss": 2.7609, "step": 1825 }, { "epoch": 0.05, "learning_rate": 0.00199809649350249, "loss": 3.1401, "step": 1826 }, { "epoch": 0.05, "learning_rate": 0.0019980911218730577, "loss": 2.9083, "step": 1827 }, { "epoch": 0.05, "learning_rate": 0.0019980857426822652, "loss": 2.591, "step": 1828 }, { "epoch": 0.05, "learning_rate": 0.0019980803559301536, "loss": 2.7771, "step": 1829 }, { "epoch": 0.05, "learning_rate": 0.0019980749616167635, "loss": 2.8968, "step": 1830 }, { "epoch": 0.05, "learning_rate": 0.001998069559742136, "loss": 2.6468, "step": 1831 }, { "epoch": 0.05, "learning_rate": 0.0019980641503063125, "loss": 2.6874, "step": 1832 }, { "epoch": 0.05, "learning_rate": 0.0019980587333093326, "loss": 3.0189, "step": 1833 }, { "epoch": 0.05, "learning_rate": 0.001998053308751239, "loss": 2.5762, "step": 1834 }, { "epoch": 0.05, "learning_rate": 0.0019980478766320714, "loss": 2.4389, "step": 1835 }, { "epoch": 0.05, "learning_rate": 0.0019980424369518716, "loss": 2.9877, "step": 1836 }, { "epoch": 0.05, "learning_rate": 0.001998036989710681, "loss": 3.3394, "step": 1837 }, { "epoch": 0.05, "learning_rate": 0.00199803153490854, "loss": 2.59, "step": 1838 }, { "epoch": 0.05, "learning_rate": 0.0019980260725454913, "loss": 2.9254, "step": 1839 }, { "epoch": 0.05, "learning_rate": 0.0019980206026215747, "loss": 3.1287, "step": 1840 }, { "epoch": 0.05, "learning_rate": 0.001998015125136833, "loss": 2.7006, "step": 1841 }, { "epoch": 0.05, "learning_rate": 0.001998009640091307, "loss": 3.0041, "step": 1842 }, { "epoch": 0.05, "learning_rate": 0.0019980041474850383, "loss": 2.9366, "step": 1843 }, { "epoch": 0.05, "learning_rate": 0.001997998647318069, "loss": 2.8577, "step": 1844 }, { "epoch": 0.05, "learning_rate": 0.00199799313959044, "loss": 2.9256, "step": 1845 }, { "epoch": 0.05, "learning_rate": 0.0019979876243021934, "loss": 2.9447, "step": 1846 }, { "epoch": 0.05, "learning_rate": 0.001997982101453371, "loss": 2.8549, "step": 1847 }, { "epoch": 0.05, "learning_rate": 0.001997976571044015, "loss": 2.824, "step": 1848 }, { "epoch": 0.05, "learning_rate": 0.001997971033074166, "loss": 2.6333, "step": 1849 }, { "epoch": 0.05, "learning_rate": 0.0019979654875438677, "loss": 2.7787, "step": 1850 }, { "epoch": 0.05, "learning_rate": 0.0019979599344531612, "loss": 2.9168, "step": 1851 }, { "epoch": 0.05, "learning_rate": 0.0019979543738020884, "loss": 2.6115, "step": 1852 }, { "epoch": 0.05, "learning_rate": 0.0019979488055906916, "loss": 2.9989, "step": 1853 }, { "epoch": 0.05, "learning_rate": 0.0019979432298190135, "loss": 2.9002, "step": 1854 }, { "epoch": 0.05, "learning_rate": 0.0019979376464870956, "loss": 3.2029, "step": 1855 }, { "epoch": 0.05, "learning_rate": 0.001997932055594981, "loss": 2.9142, "step": 1856 }, { "epoch": 0.05, "learning_rate": 0.0019979264571427105, "loss": 2.8584, "step": 1857 }, { "epoch": 0.05, "learning_rate": 0.0019979208511303284, "loss": 2.1321, "step": 1858 }, { "epoch": 0.05, "learning_rate": 0.001997915237557876, "loss": 2.6193, "step": 1859 }, { "epoch": 0.05, "learning_rate": 0.0019979096164253964, "loss": 2.5298, "step": 1860 }, { "epoch": 0.05, "learning_rate": 0.001997903987732932, "loss": 2.9495, "step": 1861 }, { "epoch": 0.05, "learning_rate": 0.001997898351480525, "loss": 2.5816, "step": 1862 }, { "epoch": 0.05, "learning_rate": 0.001997892707668219, "loss": 2.8783, "step": 1863 }, { "epoch": 0.05, "learning_rate": 0.0019978870562960558, "loss": 3.0689, "step": 1864 }, { "epoch": 0.05, "learning_rate": 0.001997881397364079, "loss": 2.8519, "step": 1865 }, { "epoch": 0.05, "learning_rate": 0.001997875730872331, "loss": 2.5599, "step": 1866 }, { "epoch": 0.05, "learning_rate": 0.001997870056820855, "loss": 2.8927, "step": 1867 }, { "epoch": 0.05, "learning_rate": 0.001997864375209694, "loss": 2.9058, "step": 1868 }, { "epoch": 0.05, "learning_rate": 0.00199785868603889, "loss": 2.944, "step": 1869 }, { "epoch": 0.05, "learning_rate": 0.001997852989308488, "loss": 2.7083, "step": 1870 }, { "epoch": 0.05, "learning_rate": 0.0019978472850185297, "loss": 3.2299, "step": 1871 }, { "epoch": 0.05, "learning_rate": 0.001997841573169059, "loss": 2.8256, "step": 1872 }, { "epoch": 0.05, "learning_rate": 0.0019978358537601185, "loss": 3.0618, "step": 1873 }, { "epoch": 0.05, "learning_rate": 0.0019978301267917524, "loss": 3.1095, "step": 1874 }, { "epoch": 0.05, "learning_rate": 0.0019978243922640034, "loss": 2.8965, "step": 1875 }, { "epoch": 0.05, "learning_rate": 0.0019978186501769155, "loss": 2.4917, "step": 1876 }, { "epoch": 0.05, "learning_rate": 0.0019978129005305315, "loss": 2.9198, "step": 1877 }, { "epoch": 0.05, "learning_rate": 0.0019978071433248957, "loss": 2.8914, "step": 1878 }, { "epoch": 0.05, "learning_rate": 0.0019978013785600514, "loss": 2.8512, "step": 1879 }, { "epoch": 0.05, "learning_rate": 0.001997795606236042, "loss": 2.8375, "step": 1880 }, { "epoch": 0.05, "learning_rate": 0.0019977898263529117, "loss": 2.8641, "step": 1881 }, { "epoch": 0.05, "learning_rate": 0.001997784038910704, "loss": 2.7096, "step": 1882 }, { "epoch": 0.05, "learning_rate": 0.0019977782439094625, "loss": 2.7567, "step": 1883 }, { "epoch": 0.05, "learning_rate": 0.0019977724413492316, "loss": 2.7765, "step": 1884 }, { "epoch": 0.05, "learning_rate": 0.001997766631230055, "loss": 3.1232, "step": 1885 }, { "epoch": 0.05, "learning_rate": 0.001997760813551977, "loss": 2.945, "step": 1886 }, { "epoch": 0.05, "learning_rate": 0.0019977549883150414, "loss": 2.8077, "step": 1887 }, { "epoch": 0.05, "learning_rate": 0.0019977491555192924, "loss": 2.6374, "step": 1888 }, { "epoch": 0.05, "learning_rate": 0.001997743315164774, "loss": 3.0483, "step": 1889 }, { "epoch": 0.05, "learning_rate": 0.0019977374672515307, "loss": 2.9014, "step": 1890 }, { "epoch": 0.05, "learning_rate": 0.001997731611779607, "loss": 2.7937, "step": 1891 }, { "epoch": 0.05, "learning_rate": 0.0019977257487490464, "loss": 3.0215, "step": 1892 }, { "epoch": 0.05, "learning_rate": 0.0019977198781598944, "loss": 2.6075, "step": 1893 }, { "epoch": 0.05, "learning_rate": 0.001997714000012195, "loss": 3.069, "step": 1894 }, { "epoch": 0.05, "learning_rate": 0.0019977081143059926, "loss": 2.7008, "step": 1895 }, { "epoch": 0.05, "learning_rate": 0.001997702221041332, "loss": 2.6834, "step": 1896 }, { "epoch": 0.05, "learning_rate": 0.001997696320218257, "loss": 3.0137, "step": 1897 }, { "epoch": 0.05, "learning_rate": 0.001997690411836814, "loss": 2.7183, "step": 1898 }, { "epoch": 0.05, "learning_rate": 0.0019976844958970465, "loss": 2.6533, "step": 1899 }, { "epoch": 0.05, "learning_rate": 0.0019976785723989994, "loss": 2.7753, "step": 1900 }, { "epoch": 0.05, "learning_rate": 0.0019976726413427183, "loss": 2.3633, "step": 1901 }, { "epoch": 0.05, "learning_rate": 0.001997666702728247, "loss": 2.6457, "step": 1902 }, { "epoch": 0.05, "learning_rate": 0.0019976607565556316, "loss": 2.8491, "step": 1903 }, { "epoch": 0.05, "learning_rate": 0.0019976548028249165, "loss": 2.5504, "step": 1904 }, { "epoch": 0.05, "learning_rate": 0.001997648841536147, "loss": 2.8482, "step": 1905 }, { "epoch": 0.05, "learning_rate": 0.0019976428726893682, "loss": 2.6483, "step": 1906 }, { "epoch": 0.05, "learning_rate": 0.0019976368962846256, "loss": 2.6992, "step": 1907 }, { "epoch": 0.05, "learning_rate": 0.001997630912321964, "loss": 2.8879, "step": 1908 }, { "epoch": 0.05, "learning_rate": 0.001997624920801429, "loss": 2.7602, "step": 1909 }, { "epoch": 0.05, "learning_rate": 0.001997618921723066, "loss": 2.8241, "step": 1910 }, { "epoch": 0.05, "learning_rate": 0.00199761291508692, "loss": 2.9222, "step": 1911 }, { "epoch": 0.05, "learning_rate": 0.0019976069008930375, "loss": 2.9785, "step": 1912 }, { "epoch": 0.05, "learning_rate": 0.001997600879141463, "loss": 3.0147, "step": 1913 }, { "epoch": 0.05, "learning_rate": 0.0019975948498322433, "loss": 2.9349, "step": 1914 }, { "epoch": 0.05, "learning_rate": 0.0019975888129654226, "loss": 2.8122, "step": 1915 }, { "epoch": 0.05, "learning_rate": 0.0019975827685410476, "loss": 2.8762, "step": 1916 }, { "epoch": 0.05, "learning_rate": 0.0019975767165591645, "loss": 2.9978, "step": 1917 }, { "epoch": 0.05, "learning_rate": 0.0019975706570198176, "loss": 2.8431, "step": 1918 }, { "epoch": 0.05, "learning_rate": 0.0019975645899230547, "loss": 2.4982, "step": 1919 }, { "epoch": 0.05, "learning_rate": 0.0019975585152689204, "loss": 2.9408, "step": 1920 }, { "epoch": 0.05, "learning_rate": 0.0019975524330574606, "loss": 3.0953, "step": 1921 }, { "epoch": 0.05, "learning_rate": 0.0019975463432887228, "loss": 2.8843, "step": 1922 }, { "epoch": 0.05, "learning_rate": 0.001997540245962752, "loss": 2.9161, "step": 1923 }, { "epoch": 0.05, "learning_rate": 0.001997534141079594, "loss": 2.8599, "step": 1924 }, { "epoch": 0.05, "learning_rate": 0.0019975280286392964, "loss": 3.0401, "step": 1925 }, { "epoch": 0.05, "learning_rate": 0.0019975219086419043, "loss": 2.7202, "step": 1926 }, { "epoch": 0.05, "learning_rate": 0.0019975157810874647, "loss": 2.4962, "step": 1927 }, { "epoch": 0.05, "learning_rate": 0.001997509645976024, "loss": 2.5702, "step": 1928 }, { "epoch": 0.05, "learning_rate": 0.001997503503307629, "loss": 3.082, "step": 1929 }, { "epoch": 0.05, "learning_rate": 0.001997497353082325, "loss": 2.7735, "step": 1930 }, { "epoch": 0.05, "learning_rate": 0.00199749119530016, "loss": 3.0067, "step": 1931 }, { "epoch": 0.05, "learning_rate": 0.0019974850299611796, "loss": 2.9538, "step": 1932 }, { "epoch": 0.05, "learning_rate": 0.0019974788570654312, "loss": 3.0499, "step": 1933 }, { "epoch": 0.05, "learning_rate": 0.001997472676612961, "loss": 2.9369, "step": 1934 }, { "epoch": 0.05, "learning_rate": 0.001997466488603817, "loss": 2.9496, "step": 1935 }, { "epoch": 0.05, "learning_rate": 0.0019974602930380443, "loss": 2.8444, "step": 1936 }, { "epoch": 0.05, "learning_rate": 0.001997454089915691, "loss": 2.4895, "step": 1937 }, { "epoch": 0.05, "learning_rate": 0.001997447879236804, "loss": 2.7256, "step": 1938 }, { "epoch": 0.05, "learning_rate": 0.0019974416610014298, "loss": 2.7024, "step": 1939 }, { "epoch": 0.05, "learning_rate": 0.0019974354352096163, "loss": 2.6854, "step": 1940 }, { "epoch": 0.05, "learning_rate": 0.00199742920186141, "loss": 3.0669, "step": 1941 }, { "epoch": 0.05, "learning_rate": 0.001997422960956859, "loss": 2.8602, "step": 1942 }, { "epoch": 0.05, "learning_rate": 0.0019974167124960094, "loss": 2.7803, "step": 1943 }, { "epoch": 0.05, "learning_rate": 0.0019974104564789087, "loss": 2.9741, "step": 1944 }, { "epoch": 0.05, "learning_rate": 0.0019974041929056055, "loss": 2.5993, "step": 1945 }, { "epoch": 0.05, "learning_rate": 0.001997397921776146, "loss": 3.1145, "step": 1946 }, { "epoch": 0.05, "learning_rate": 0.0019973916430905785, "loss": 3.1246, "step": 1947 }, { "epoch": 0.05, "learning_rate": 0.00199738535684895, "loss": 2.5878, "step": 1948 }, { "epoch": 0.05, "learning_rate": 0.0019973790630513086, "loss": 3.0138, "step": 1949 }, { "epoch": 0.05, "learning_rate": 0.0019973727616977013, "loss": 3.1366, "step": 1950 }, { "epoch": 0.05, "learning_rate": 0.0019973664527881767, "loss": 2.7241, "step": 1951 }, { "epoch": 0.05, "learning_rate": 0.001997360136322782, "loss": 2.8098, "step": 1952 }, { "epoch": 0.05, "learning_rate": 0.0019973538123015653, "loss": 2.7962, "step": 1953 }, { "epoch": 0.05, "learning_rate": 0.001997347480724574, "loss": 2.7725, "step": 1954 }, { "epoch": 0.05, "learning_rate": 0.001997341141591857, "loss": 2.7954, "step": 1955 }, { "epoch": 0.05, "learning_rate": 0.0019973347949034615, "loss": 2.3947, "step": 1956 }, { "epoch": 0.05, "learning_rate": 0.001997328440659436, "loss": 2.8603, "step": 1957 }, { "epoch": 0.05, "learning_rate": 0.0019973220788598285, "loss": 2.9391, "step": 1958 }, { "epoch": 0.05, "learning_rate": 0.0019973157095046876, "loss": 2.4217, "step": 1959 }, { "epoch": 0.05, "learning_rate": 0.001997309332594061, "loss": 2.6561, "step": 1960 }, { "epoch": 0.05, "learning_rate": 0.001997302948127997, "loss": 2.849, "step": 1961 }, { "epoch": 0.05, "learning_rate": 0.001997296556106544, "loss": 3.0462, "step": 1962 }, { "epoch": 0.05, "learning_rate": 0.001997290156529751, "loss": 3.1549, "step": 1963 }, { "epoch": 0.05, "learning_rate": 0.001997283749397666, "loss": 3.2162, "step": 1964 }, { "epoch": 0.05, "learning_rate": 0.0019972773347103376, "loss": 2.8907, "step": 1965 }, { "epoch": 0.05, "learning_rate": 0.001997270912467814, "loss": 2.5736, "step": 1966 }, { "epoch": 0.05, "learning_rate": 0.001997264482670145, "loss": 3.219, "step": 1967 }, { "epoch": 0.05, "learning_rate": 0.001997258045317378, "loss": 2.861, "step": 1968 }, { "epoch": 0.05, "learning_rate": 0.0019972516004095626, "loss": 3.2263, "step": 1969 }, { "epoch": 0.05, "learning_rate": 0.0019972451479467472, "loss": 2.4631, "step": 1970 }, { "epoch": 0.05, "learning_rate": 0.001997238687928981, "loss": 2.8785, "step": 1971 }, { "epoch": 0.05, "learning_rate": 0.001997232220356313, "loss": 2.9942, "step": 1972 }, { "epoch": 0.05, "learning_rate": 0.0019972257452287915, "loss": 2.7119, "step": 1973 }, { "epoch": 0.05, "learning_rate": 0.001997219262546466, "loss": 2.948, "step": 1974 }, { "epoch": 0.05, "learning_rate": 0.001997212772309386, "loss": 2.6886, "step": 1975 }, { "epoch": 0.05, "learning_rate": 0.0019972062745176006, "loss": 2.5574, "step": 1976 }, { "epoch": 0.05, "learning_rate": 0.001997199769171158, "loss": 2.6944, "step": 1977 }, { "epoch": 0.05, "learning_rate": 0.001997193256270109, "loss": 3.1517, "step": 1978 }, { "epoch": 0.05, "learning_rate": 0.0019971867358145015, "loss": 2.752, "step": 1979 }, { "epoch": 0.05, "learning_rate": 0.001997180207804386, "loss": 2.9976, "step": 1980 }, { "epoch": 0.05, "learning_rate": 0.0019971736722398117, "loss": 2.6925, "step": 1981 }, { "epoch": 0.05, "learning_rate": 0.0019971671291208275, "loss": 2.7261, "step": 1982 }, { "epoch": 0.05, "learning_rate": 0.0019971605784474835, "loss": 2.8049, "step": 1983 }, { "epoch": 0.05, "learning_rate": 0.001997154020219829, "loss": 3.024, "step": 1984 }, { "epoch": 0.05, "learning_rate": 0.0019971474544379143, "loss": 2.7105, "step": 1985 }, { "epoch": 0.05, "learning_rate": 0.0019971408811017884, "loss": 2.8783, "step": 1986 }, { "epoch": 0.05, "learning_rate": 0.0019971343002115017, "loss": 2.5883, "step": 1987 }, { "epoch": 0.05, "learning_rate": 0.001997127711767104, "loss": 2.7866, "step": 1988 }, { "epoch": 0.05, "learning_rate": 0.001997121115768645, "loss": 3.1235, "step": 1989 }, { "epoch": 0.05, "learning_rate": 0.0019971145122161743, "loss": 3.1523, "step": 1990 }, { "epoch": 0.05, "learning_rate": 0.0019971079011097425, "loss": 3.1567, "step": 1991 }, { "epoch": 0.05, "learning_rate": 0.0019971012824493996, "loss": 2.5797, "step": 1992 }, { "epoch": 0.05, "learning_rate": 0.0019970946562351956, "loss": 2.5439, "step": 1993 }, { "epoch": 0.05, "learning_rate": 0.0019970880224671806, "loss": 2.6609, "step": 1994 }, { "epoch": 0.05, "learning_rate": 0.0019970813811454055, "loss": 2.938, "step": 1995 }, { "epoch": 0.05, "learning_rate": 0.0019970747322699198, "loss": 2.7239, "step": 1996 }, { "epoch": 0.05, "learning_rate": 0.001997068075840774, "loss": 2.3321, "step": 1997 }, { "epoch": 0.05, "learning_rate": 0.001997061411858019, "loss": 2.6589, "step": 1998 }, { "epoch": 0.05, "learning_rate": 0.001997054740321705, "loss": 3.1178, "step": 1999 }, { "epoch": 0.05, "learning_rate": 0.0019970480612318824, "loss": 2.8503, "step": 2000 }, { "epoch": 0.05, "learning_rate": 0.0019970413745886016, "loss": 3.0627, "step": 2001 }, { "epoch": 0.05, "learning_rate": 0.001997034680391914, "loss": 2.8551, "step": 2002 }, { "epoch": 0.05, "learning_rate": 0.00199702797864187, "loss": 2.6894, "step": 2003 }, { "epoch": 0.05, "learning_rate": 0.0019970212693385205, "loss": 2.727, "step": 2004 }, { "epoch": 0.05, "learning_rate": 0.0019970145524819158, "loss": 3.014, "step": 2005 }, { "epoch": 0.05, "learning_rate": 0.001997007828072107, "loss": 2.9502, "step": 2006 }, { "epoch": 0.05, "learning_rate": 0.0019970010961091454, "loss": 3.0361, "step": 2007 }, { "epoch": 0.05, "learning_rate": 0.0019969943565930812, "loss": 3.0235, "step": 2008 }, { "epoch": 0.05, "learning_rate": 0.0019969876095239664, "loss": 2.5668, "step": 2009 }, { "epoch": 0.05, "learning_rate": 0.0019969808549018518, "loss": 2.764, "step": 2010 }, { "epoch": 0.05, "learning_rate": 0.0019969740927267884, "loss": 2.7708, "step": 2011 }, { "epoch": 0.05, "learning_rate": 0.0019969673229988274, "loss": 2.7648, "step": 2012 }, { "epoch": 0.05, "learning_rate": 0.00199696054571802, "loss": 2.6781, "step": 2013 }, { "epoch": 0.05, "learning_rate": 0.0019969537608844185, "loss": 2.7545, "step": 2014 }, { "epoch": 0.05, "learning_rate": 0.001996946968498073, "loss": 2.7652, "step": 2015 }, { "epoch": 0.05, "learning_rate": 0.0019969401685590357, "loss": 2.5507, "step": 2016 }, { "epoch": 0.05, "learning_rate": 0.0019969333610673577, "loss": 2.6272, "step": 2017 }, { "epoch": 0.05, "learning_rate": 0.001996926546023091, "loss": 2.9188, "step": 2018 }, { "epoch": 0.05, "learning_rate": 0.001996919723426287, "loss": 2.9995, "step": 2019 }, { "epoch": 0.05, "learning_rate": 0.001996912893276997, "loss": 2.5156, "step": 2020 }, { "epoch": 0.05, "learning_rate": 0.0019969060555752737, "loss": 2.9522, "step": 2021 }, { "epoch": 0.05, "learning_rate": 0.001996899210321168, "loss": 2.4323, "step": 2022 }, { "epoch": 0.05, "learning_rate": 0.0019968923575147323, "loss": 3.0898, "step": 2023 }, { "epoch": 0.05, "learning_rate": 0.0019968854971560185, "loss": 3.2194, "step": 2024 }, { "epoch": 0.05, "learning_rate": 0.001996878629245078, "loss": 2.8018, "step": 2025 }, { "epoch": 0.05, "learning_rate": 0.0019968717537819634, "loss": 3.0727, "step": 2026 }, { "epoch": 0.05, "learning_rate": 0.0019968648707667266, "loss": 3.222, "step": 2027 }, { "epoch": 0.05, "learning_rate": 0.0019968579801994198, "loss": 2.7597, "step": 2028 }, { "epoch": 0.05, "learning_rate": 0.0019968510820800953, "loss": 2.6686, "step": 2029 }, { "epoch": 0.05, "learning_rate": 0.001996844176408805, "loss": 2.7049, "step": 2030 }, { "epoch": 0.05, "learning_rate": 0.0019968372631856014, "loss": 2.6205, "step": 2031 }, { "epoch": 0.05, "learning_rate": 0.0019968303424105368, "loss": 2.8364, "step": 2032 }, { "epoch": 0.05, "learning_rate": 0.0019968234140836645, "loss": 2.9604, "step": 2033 }, { "epoch": 0.05, "learning_rate": 0.0019968164782050352, "loss": 2.9718, "step": 2034 }, { "epoch": 0.05, "learning_rate": 0.0019968095347747033, "loss": 3.0416, "step": 2035 }, { "epoch": 0.05, "learning_rate": 0.00199680258379272, "loss": 2.8741, "step": 2036 }, { "epoch": 0.05, "learning_rate": 0.0019967956252591387, "loss": 2.2744, "step": 2037 }, { "epoch": 0.05, "learning_rate": 0.0019967886591740125, "loss": 2.7854, "step": 2038 }, { "epoch": 0.05, "learning_rate": 0.001996781685537393, "loss": 2.894, "step": 2039 }, { "epoch": 0.05, "learning_rate": 0.001996774704349334, "loss": 2.5911, "step": 2040 }, { "epoch": 0.05, "learning_rate": 0.0019967677156098877, "loss": 2.7939, "step": 2041 }, { "epoch": 0.05, "learning_rate": 0.0019967607193191075, "loss": 3.0415, "step": 2042 }, { "epoch": 0.05, "learning_rate": 0.001996753715477046, "loss": 2.7561, "step": 2043 }, { "epoch": 0.05, "learning_rate": 0.001996746704083757, "loss": 3.1339, "step": 2044 }, { "epoch": 0.05, "learning_rate": 0.0019967396851392934, "loss": 2.7436, "step": 2045 }, { "epoch": 0.05, "learning_rate": 0.001996732658643708, "loss": 2.7953, "step": 2046 }, { "epoch": 0.06, "learning_rate": 0.0019967256245970537, "loss": 2.7518, "step": 2047 }, { "epoch": 0.06, "learning_rate": 0.0019967185829993846, "loss": 2.9534, "step": 2048 }, { "epoch": 0.06, "learning_rate": 0.001996711533850754, "loss": 2.844, "step": 2049 }, { "epoch": 0.06, "learning_rate": 0.0019967044771512146, "loss": 2.493, "step": 2050 }, { "epoch": 0.06, "learning_rate": 0.00199669741290082, "loss": 2.8768, "step": 2051 }, { "epoch": 0.06, "learning_rate": 0.0019966903410996244, "loss": 2.8139, "step": 2052 }, { "epoch": 0.06, "learning_rate": 0.001996683261747681, "loss": 3.1238, "step": 2053 }, { "epoch": 0.06, "learning_rate": 0.001996676174845043, "loss": 2.9652, "step": 2054 }, { "epoch": 0.06, "learning_rate": 0.0019966690803917653, "loss": 3.1645, "step": 2055 }, { "epoch": 0.06, "learning_rate": 0.0019966619783879, "loss": 2.8045, "step": 2056 }, { "epoch": 0.06, "learning_rate": 0.001996654868833502, "loss": 2.8223, "step": 2057 }, { "epoch": 0.06, "learning_rate": 0.0019966477517286254, "loss": 2.4568, "step": 2058 }, { "epoch": 0.06, "learning_rate": 0.001996640627073323, "loss": 2.5419, "step": 2059 }, { "epoch": 0.06, "learning_rate": 0.0019966334948676497, "loss": 2.9998, "step": 2060 }, { "epoch": 0.06, "learning_rate": 0.0019966263551116593, "loss": 2.6605, "step": 2061 }, { "epoch": 0.06, "learning_rate": 0.001996619207805405, "loss": 2.5751, "step": 2062 }, { "epoch": 0.06, "learning_rate": 0.001996612052948943, "loss": 3.1641, "step": 2063 }, { "epoch": 0.06, "learning_rate": 0.0019966048905423256, "loss": 2.6089, "step": 2064 }, { "epoch": 0.06, "learning_rate": 0.001996597720585608, "loss": 2.8678, "step": 2065 }, { "epoch": 0.06, "learning_rate": 0.0019965905430788435, "loss": 2.8812, "step": 2066 }, { "epoch": 0.06, "learning_rate": 0.001996583358022088, "loss": 2.6249, "step": 2067 }, { "epoch": 0.06, "learning_rate": 0.001996576165415395, "loss": 2.3869, "step": 2068 }, { "epoch": 0.06, "learning_rate": 0.001996568965258819, "loss": 2.8696, "step": 2069 }, { "epoch": 0.06, "learning_rate": 0.0019965617575524145, "loss": 2.2363, "step": 2070 }, { "epoch": 0.06, "learning_rate": 0.0019965545422962368, "loss": 2.3706, "step": 2071 }, { "epoch": 0.06, "learning_rate": 0.0019965473194903396, "loss": 2.845, "step": 2072 }, { "epoch": 0.06, "learning_rate": 0.0019965400891347783, "loss": 3.0845, "step": 2073 }, { "epoch": 0.06, "learning_rate": 0.0019965328512296073, "loss": 3.0613, "step": 2074 }, { "epoch": 0.06, "learning_rate": 0.001996525605774882, "loss": 3.1499, "step": 2075 }, { "epoch": 0.06, "learning_rate": 0.0019965183527706565, "loss": 2.6527, "step": 2076 }, { "epoch": 0.06, "learning_rate": 0.001996511092216986, "loss": 2.8932, "step": 2077 }, { "epoch": 0.06, "learning_rate": 0.0019965038241139257, "loss": 2.6175, "step": 2078 }, { "epoch": 0.06, "learning_rate": 0.001996496548461531, "loss": 2.7421, "step": 2079 }, { "epoch": 0.06, "learning_rate": 0.001996489265259856, "loss": 2.9444, "step": 2080 }, { "epoch": 0.06, "learning_rate": 0.0019964819745089566, "loss": 2.6927, "step": 2081 }, { "epoch": 0.06, "learning_rate": 0.001996474676208888, "loss": 2.7078, "step": 2082 }, { "epoch": 0.06, "learning_rate": 0.001996467370359706, "loss": 3.1547, "step": 2083 }, { "epoch": 0.06, "learning_rate": 0.001996460056961465, "loss": 2.7827, "step": 2084 }, { "epoch": 0.06, "learning_rate": 0.00199645273601422, "loss": 2.9695, "step": 2085 }, { "epoch": 0.06, "learning_rate": 0.0019964454075180283, "loss": 2.5496, "step": 2086 }, { "epoch": 0.06, "learning_rate": 0.0019964380714729436, "loss": 2.5433, "step": 2087 }, { "epoch": 0.06, "learning_rate": 0.0019964307278790227, "loss": 3.2312, "step": 2088 }, { "epoch": 0.06, "learning_rate": 0.0019964233767363203, "loss": 2.5426, "step": 2089 }, { "epoch": 0.06, "learning_rate": 0.0019964160180448933, "loss": 2.7488, "step": 2090 }, { "epoch": 0.06, "learning_rate": 0.0019964086518047958, "loss": 3.2688, "step": 2091 }, { "epoch": 0.06, "learning_rate": 0.001996401278016085, "loss": 2.9066, "step": 2092 }, { "epoch": 0.06, "learning_rate": 0.001996393896678816, "loss": 2.714, "step": 2093 }, { "epoch": 0.06, "learning_rate": 0.001996386507793045, "loss": 2.6382, "step": 2094 }, { "epoch": 0.06, "learning_rate": 0.001996379111358828, "loss": 2.6086, "step": 2095 }, { "epoch": 0.06, "learning_rate": 0.0019963717073762212, "loss": 3.1445, "step": 2096 }, { "epoch": 0.06, "learning_rate": 0.00199636429584528, "loss": 2.8523, "step": 2097 }, { "epoch": 0.06, "learning_rate": 0.0019963568767660616, "loss": 2.7037, "step": 2098 }, { "epoch": 0.06, "learning_rate": 0.0019963494501386214, "loss": 2.9941, "step": 2099 }, { "epoch": 0.06, "learning_rate": 0.001996342015963016, "loss": 2.9889, "step": 2100 }, { "epoch": 0.06, "learning_rate": 0.0019963345742393017, "loss": 2.8459, "step": 2101 }, { "epoch": 0.06, "learning_rate": 0.0019963271249675346, "loss": 2.6386, "step": 2102 }, { "epoch": 0.06, "learning_rate": 0.001996319668147771, "loss": 3.0664, "step": 2103 }, { "epoch": 0.06, "learning_rate": 0.001996312203780068, "loss": 2.8785, "step": 2104 }, { "epoch": 0.06, "learning_rate": 0.001996304731864482, "loss": 2.5148, "step": 2105 }, { "epoch": 0.06, "learning_rate": 0.0019962972524010694, "loss": 3.0653, "step": 2106 }, { "epoch": 0.06, "learning_rate": 0.001996289765389887, "loss": 2.9035, "step": 2107 }, { "epoch": 0.06, "learning_rate": 0.001996282270830991, "loss": 2.5889, "step": 2108 }, { "epoch": 0.06, "learning_rate": 0.0019962747687244393, "loss": 3.0461, "step": 2109 }, { "epoch": 0.06, "learning_rate": 0.001996267259070288, "loss": 2.6274, "step": 2110 }, { "epoch": 0.06, "learning_rate": 0.0019962597418685937, "loss": 2.7539, "step": 2111 }, { "epoch": 0.06, "learning_rate": 0.0019962522171194136, "loss": 2.7723, "step": 2112 }, { "epoch": 0.06, "learning_rate": 0.001996244684822805, "loss": 2.7917, "step": 2113 }, { "epoch": 0.06, "learning_rate": 0.001996237144978825, "loss": 2.9063, "step": 2114 }, { "epoch": 0.06, "learning_rate": 0.0019962295975875306, "loss": 3.0254, "step": 2115 }, { "epoch": 0.06, "learning_rate": 0.0019962220426489787, "loss": 2.853, "step": 2116 }, { "epoch": 0.06, "learning_rate": 0.0019962144801632265, "loss": 2.6408, "step": 2117 }, { "epoch": 0.06, "learning_rate": 0.0019962069101303317, "loss": 2.5941, "step": 2118 }, { "epoch": 0.06, "learning_rate": 0.0019961993325503516, "loss": 2.9851, "step": 2119 }, { "epoch": 0.06, "learning_rate": 0.001996191747423343, "loss": 2.6825, "step": 2120 }, { "epoch": 0.06, "learning_rate": 0.001996184154749364, "loss": 3.1246, "step": 2121 }, { "epoch": 0.06, "learning_rate": 0.0019961765545284723, "loss": 2.7171, "step": 2122 }, { "epoch": 0.06, "learning_rate": 0.0019961689467607245, "loss": 2.7922, "step": 2123 }, { "epoch": 0.06, "learning_rate": 0.0019961613314461793, "loss": 2.8149, "step": 2124 }, { "epoch": 0.06, "learning_rate": 0.001996153708584894, "loss": 3.3053, "step": 2125 }, { "epoch": 0.06, "learning_rate": 0.001996146078176926, "loss": 2.6468, "step": 2126 }, { "epoch": 0.06, "learning_rate": 0.0019961384402223336, "loss": 2.8887, "step": 2127 }, { "epoch": 0.06, "learning_rate": 0.0019961307947211743, "loss": 2.7715, "step": 2128 }, { "epoch": 0.06, "learning_rate": 0.0019961231416735065, "loss": 2.6371, "step": 2129 }, { "epoch": 0.06, "learning_rate": 0.0019961154810793874, "loss": 2.8091, "step": 2130 }, { "epoch": 0.06, "learning_rate": 0.001996107812938876, "loss": 2.7698, "step": 2131 }, { "epoch": 0.06, "learning_rate": 0.00199610013725203, "loss": 2.7005, "step": 2132 }, { "epoch": 0.06, "learning_rate": 0.0019960924540189068, "loss": 2.7664, "step": 2133 }, { "epoch": 0.06, "learning_rate": 0.0019960847632395657, "loss": 2.6488, "step": 2134 }, { "epoch": 0.06, "learning_rate": 0.0019960770649140643, "loss": 3.0448, "step": 2135 }, { "epoch": 0.06, "learning_rate": 0.0019960693590424616, "loss": 2.8539, "step": 2136 }, { "epoch": 0.06, "learning_rate": 0.001996061645624815, "loss": 3.1429, "step": 2137 }, { "epoch": 0.06, "learning_rate": 0.0019960539246611834, "loss": 2.7301, "step": 2138 }, { "epoch": 0.06, "learning_rate": 0.0019960461961516258, "loss": 2.845, "step": 2139 }, { "epoch": 0.06, "learning_rate": 0.0019960384600961997, "loss": 3.3301, "step": 2140 }, { "epoch": 0.06, "learning_rate": 0.001996030716494965, "loss": 2.9531, "step": 2141 }, { "epoch": 0.06, "learning_rate": 0.001996022965347979, "loss": 2.799, "step": 2142 }, { "epoch": 0.06, "learning_rate": 0.0019960152066553017, "loss": 2.7145, "step": 2143 }, { "epoch": 0.06, "learning_rate": 0.001996007440416991, "loss": 2.903, "step": 2144 }, { "epoch": 0.06, "learning_rate": 0.001995999666633106, "loss": 3.0377, "step": 2145 }, { "epoch": 0.06, "learning_rate": 0.0019959918853037057, "loss": 2.4841, "step": 2146 }, { "epoch": 0.06, "learning_rate": 0.0019959840964288485, "loss": 3.2182, "step": 2147 }, { "epoch": 0.06, "learning_rate": 0.0019959763000085944, "loss": 2.7259, "step": 2148 }, { "epoch": 0.06, "learning_rate": 0.0019959684960430013, "loss": 2.6242, "step": 2149 }, { "epoch": 0.06, "learning_rate": 0.0019959606845321295, "loss": 2.6076, "step": 2150 }, { "epoch": 0.06, "learning_rate": 0.0019959528654760377, "loss": 2.8651, "step": 2151 }, { "epoch": 0.06, "learning_rate": 0.0019959450388747847, "loss": 2.617, "step": 2152 }, { "epoch": 0.06, "learning_rate": 0.0019959372047284297, "loss": 2.761, "step": 2153 }, { "epoch": 0.06, "learning_rate": 0.001995929363037033, "loss": 2.7912, "step": 2154 }, { "epoch": 0.06, "learning_rate": 0.001995921513800654, "loss": 2.3618, "step": 2155 }, { "epoch": 0.06, "learning_rate": 0.001995913657019351, "loss": 2.6787, "step": 2156 }, { "epoch": 0.06, "learning_rate": 0.0019959057926931846, "loss": 2.6737, "step": 2157 }, { "epoch": 0.06, "learning_rate": 0.0019958979208222136, "loss": 2.9766, "step": 2158 }, { "epoch": 0.06, "learning_rate": 0.001995890041406498, "loss": 2.9028, "step": 2159 }, { "epoch": 0.06, "learning_rate": 0.001995882154446098, "loss": 3.0548, "step": 2160 }, { "epoch": 0.06, "learning_rate": 0.001995874259941072, "loss": 2.8039, "step": 2161 }, { "epoch": 0.06, "learning_rate": 0.0019958663578914814, "loss": 2.6879, "step": 2162 }, { "epoch": 0.06, "learning_rate": 0.001995858448297385, "loss": 3.0272, "step": 2163 }, { "epoch": 0.06, "learning_rate": 0.001995850531158843, "loss": 3.0323, "step": 2164 }, { "epoch": 0.06, "learning_rate": 0.0019958426064759153, "loss": 2.9016, "step": 2165 }, { "epoch": 0.06, "learning_rate": 0.0019958346742486627, "loss": 2.9241, "step": 2166 }, { "epoch": 0.06, "learning_rate": 0.001995826734477144, "loss": 2.7083, "step": 2167 }, { "epoch": 0.06, "learning_rate": 0.00199581878716142, "loss": 2.8336, "step": 2168 }, { "epoch": 0.06, "learning_rate": 0.0019958108323015512, "loss": 2.7479, "step": 2169 }, { "epoch": 0.06, "learning_rate": 0.0019958028698975976, "loss": 3.2046, "step": 2170 }, { "epoch": 0.06, "learning_rate": 0.0019957948999496196, "loss": 2.7919, "step": 2171 }, { "epoch": 0.06, "learning_rate": 0.001995786922457677, "loss": 2.8801, "step": 2172 }, { "epoch": 0.06, "learning_rate": 0.001995778937421831, "loss": 3.0158, "step": 2173 }, { "epoch": 0.06, "learning_rate": 0.0019957709448421416, "loss": 3.034, "step": 2174 }, { "epoch": 0.06, "learning_rate": 0.0019957629447186695, "loss": 2.5651, "step": 2175 }, { "epoch": 0.06, "learning_rate": 0.0019957549370514757, "loss": 3.105, "step": 2176 }, { "epoch": 0.06, "learning_rate": 0.0019957469218406204, "loss": 3.135, "step": 2177 }, { "epoch": 0.06, "learning_rate": 0.0019957388990861644, "loss": 2.7758, "step": 2178 }, { "epoch": 0.06, "learning_rate": 0.0019957308687881684, "loss": 3.1466, "step": 2179 }, { "epoch": 0.06, "learning_rate": 0.0019957228309466935, "loss": 2.4891, "step": 2180 }, { "epoch": 0.06, "learning_rate": 0.0019957147855618005, "loss": 2.7536, "step": 2181 }, { "epoch": 0.06, "learning_rate": 0.0019957067326335505, "loss": 2.7089, "step": 2182 }, { "epoch": 0.06, "learning_rate": 0.0019956986721620038, "loss": 2.8617, "step": 2183 }, { "epoch": 0.06, "learning_rate": 0.0019956906041472223, "loss": 2.6073, "step": 2184 }, { "epoch": 0.06, "learning_rate": 0.0019956825285892665, "loss": 3.3853, "step": 2185 }, { "epoch": 0.06, "learning_rate": 0.001995674445488198, "loss": 2.7644, "step": 2186 }, { "epoch": 0.06, "learning_rate": 0.0019956663548440783, "loss": 2.9356, "step": 2187 }, { "epoch": 0.06, "learning_rate": 0.001995658256656968, "loss": 2.7007, "step": 2188 }, { "epoch": 0.06, "learning_rate": 0.001995650150926929, "loss": 3.0687, "step": 2189 }, { "epoch": 0.06, "learning_rate": 0.001995642037654022, "loss": 2.8285, "step": 2190 }, { "epoch": 0.06, "learning_rate": 0.001995633916838309, "loss": 2.1878, "step": 2191 }, { "epoch": 0.06, "learning_rate": 0.0019956257884798517, "loss": 2.9442, "step": 2192 }, { "epoch": 0.06, "learning_rate": 0.0019956176525787114, "loss": 2.9831, "step": 2193 }, { "epoch": 0.06, "learning_rate": 0.0019956095091349497, "loss": 3.029, "step": 2194 }, { "epoch": 0.06, "learning_rate": 0.0019956013581486284, "loss": 3.0275, "step": 2195 }, { "epoch": 0.06, "learning_rate": 0.0019955931996198093, "loss": 2.4828, "step": 2196 }, { "epoch": 0.06, "learning_rate": 0.0019955850335485535, "loss": 2.6415, "step": 2197 }, { "epoch": 0.06, "learning_rate": 0.0019955768599349243, "loss": 2.736, "step": 2198 }, { "epoch": 0.06, "learning_rate": 0.0019955686787789823, "loss": 2.5895, "step": 2199 }, { "epoch": 0.06, "learning_rate": 0.00199556049008079, "loss": 2.8211, "step": 2200 }, { "epoch": 0.06, "learning_rate": 0.0019955522938404097, "loss": 2.4397, "step": 2201 }, { "epoch": 0.06, "learning_rate": 0.001995544090057903, "loss": 3.1412, "step": 2202 }, { "epoch": 0.06, "learning_rate": 0.0019955358787333323, "loss": 3.1634, "step": 2203 }, { "epoch": 0.06, "learning_rate": 0.00199552765986676, "loss": 2.7798, "step": 2204 }, { "epoch": 0.06, "learning_rate": 0.001995519433458248, "loss": 2.604, "step": 2205 }, { "epoch": 0.06, "learning_rate": 0.0019955111995078587, "loss": 2.7305, "step": 2206 }, { "epoch": 0.06, "learning_rate": 0.0019955029580156543, "loss": 2.8538, "step": 2207 }, { "epoch": 0.06, "learning_rate": 0.0019954947089816976, "loss": 2.9137, "step": 2208 }, { "epoch": 0.06, "learning_rate": 0.001995486452406051, "loss": 3.0387, "step": 2209 }, { "epoch": 0.06, "learning_rate": 0.001995478188288777, "loss": 2.4801, "step": 2210 }, { "epoch": 0.06, "learning_rate": 0.0019954699166299383, "loss": 2.8574, "step": 2211 }, { "epoch": 0.06, "learning_rate": 0.001995461637429598, "loss": 2.5834, "step": 2212 }, { "epoch": 0.06, "learning_rate": 0.0019954533506878172, "loss": 3.075, "step": 2213 }, { "epoch": 0.06, "learning_rate": 0.0019954450564046607, "loss": 3.0393, "step": 2214 }, { "epoch": 0.06, "learning_rate": 0.0019954367545801897, "loss": 2.6239, "step": 2215 }, { "epoch": 0.06, "learning_rate": 0.0019954284452144686, "loss": 2.5561, "step": 2216 }, { "epoch": 0.06, "learning_rate": 0.001995420128307559, "loss": 2.9435, "step": 2217 }, { "epoch": 0.06, "learning_rate": 0.0019954118038595244, "loss": 2.8972, "step": 2218 }, { "epoch": 0.06, "learning_rate": 0.0019954034718704283, "loss": 2.5333, "step": 2219 }, { "epoch": 0.06, "learning_rate": 0.001995395132340333, "loss": 2.6042, "step": 2220 }, { "epoch": 0.06, "learning_rate": 0.0019953867852693027, "loss": 2.8396, "step": 2221 }, { "epoch": 0.06, "learning_rate": 0.0019953784306574, "loss": 2.6469, "step": 2222 }, { "epoch": 0.06, "learning_rate": 0.0019953700685046882, "loss": 2.7308, "step": 2223 }, { "epoch": 0.06, "learning_rate": 0.0019953616988112304, "loss": 2.5318, "step": 2224 }, { "epoch": 0.06, "learning_rate": 0.0019953533215770905, "loss": 2.7843, "step": 2225 }, { "epoch": 0.06, "learning_rate": 0.001995344936802332, "loss": 2.5107, "step": 2226 }, { "epoch": 0.06, "learning_rate": 0.001995336544487018, "loss": 2.6721, "step": 2227 }, { "epoch": 0.06, "learning_rate": 0.001995328144631212, "loss": 2.611, "step": 2228 }, { "epoch": 0.06, "learning_rate": 0.0019953197372349785, "loss": 3.0056, "step": 2229 }, { "epoch": 0.06, "learning_rate": 0.0019953113222983803, "loss": 2.7378, "step": 2230 }, { "epoch": 0.06, "learning_rate": 0.0019953028998214817, "loss": 3.0848, "step": 2231 }, { "epoch": 0.06, "learning_rate": 0.001995294469804346, "loss": 2.6001, "step": 2232 }, { "epoch": 0.06, "learning_rate": 0.0019952860322470373, "loss": 2.8921, "step": 2233 }, { "epoch": 0.06, "learning_rate": 0.00199527758714962, "loss": 2.9936, "step": 2234 }, { "epoch": 0.06, "learning_rate": 0.001995269134512157, "loss": 2.6814, "step": 2235 }, { "epoch": 0.06, "learning_rate": 0.0019952606743347135, "loss": 2.7512, "step": 2236 }, { "epoch": 0.06, "learning_rate": 0.001995252206617353, "loss": 2.6847, "step": 2237 }, { "epoch": 0.06, "learning_rate": 0.0019952437313601394, "loss": 3.1203, "step": 2238 }, { "epoch": 0.06, "learning_rate": 0.0019952352485631377, "loss": 2.6418, "step": 2239 }, { "epoch": 0.06, "learning_rate": 0.001995226758226411, "loss": 3.1745, "step": 2240 }, { "epoch": 0.06, "learning_rate": 0.001995218260350025, "loss": 3.1448, "step": 2241 }, { "epoch": 0.06, "learning_rate": 0.001995209754934043, "loss": 2.8123, "step": 2242 }, { "epoch": 0.06, "learning_rate": 0.00199520124197853, "loss": 2.738, "step": 2243 }, { "epoch": 0.06, "learning_rate": 0.0019951927214835502, "loss": 2.7789, "step": 2244 }, { "epoch": 0.06, "learning_rate": 0.0019951841934491682, "loss": 2.8158, "step": 2245 }, { "epoch": 0.06, "learning_rate": 0.001995175657875449, "loss": 2.6999, "step": 2246 }, { "epoch": 0.06, "learning_rate": 0.001995167114762457, "loss": 2.8063, "step": 2247 }, { "epoch": 0.06, "learning_rate": 0.0019951585641102563, "loss": 2.4463, "step": 2248 }, { "epoch": 0.06, "learning_rate": 0.0019951500059189123, "loss": 2.5255, "step": 2249 }, { "epoch": 0.06, "learning_rate": 0.00199514144018849, "loss": 2.9931, "step": 2250 }, { "epoch": 0.06, "learning_rate": 0.001995132866919054, "loss": 2.7217, "step": 2251 }, { "epoch": 0.06, "learning_rate": 0.0019951242861106695, "loss": 3.0981, "step": 2252 }, { "epoch": 0.06, "learning_rate": 0.0019951156977634013, "loss": 2.577, "step": 2253 }, { "epoch": 0.06, "learning_rate": 0.001995107101877314, "loss": 2.9445, "step": 2254 }, { "epoch": 0.06, "learning_rate": 0.001995098498452474, "loss": 3.1221, "step": 2255 }, { "epoch": 0.06, "learning_rate": 0.001995089887488945, "loss": 2.4225, "step": 2256 }, { "epoch": 0.06, "learning_rate": 0.0019950812689867935, "loss": 2.8956, "step": 2257 }, { "epoch": 0.06, "learning_rate": 0.001995072642946084, "loss": 3.0158, "step": 2258 }, { "epoch": 0.06, "learning_rate": 0.001995064009366882, "loss": 2.7999, "step": 2259 }, { "epoch": 0.06, "learning_rate": 0.0019950553682492526, "loss": 2.8506, "step": 2260 }, { "epoch": 0.06, "learning_rate": 0.001995046719593262, "loss": 2.7676, "step": 2261 }, { "epoch": 0.06, "learning_rate": 0.0019950380633989755, "loss": 2.9672, "step": 2262 }, { "epoch": 0.06, "learning_rate": 0.001995029399666458, "loss": 2.4978, "step": 2263 }, { "epoch": 0.06, "learning_rate": 0.001995020728395776, "loss": 2.9062, "step": 2264 }, { "epoch": 0.06, "learning_rate": 0.001995012049586995, "loss": 3.0989, "step": 2265 }, { "epoch": 0.06, "learning_rate": 0.00199500336324018, "loss": 2.6399, "step": 2266 }, { "epoch": 0.06, "learning_rate": 0.0019949946693553983, "loss": 2.929, "step": 2267 }, { "epoch": 0.06, "learning_rate": 0.0019949859679327143, "loss": 2.4775, "step": 2268 }, { "epoch": 0.06, "learning_rate": 0.0019949772589721946, "loss": 2.627, "step": 2269 }, { "epoch": 0.06, "learning_rate": 0.001994968542473905, "loss": 2.7476, "step": 2270 }, { "epoch": 0.06, "learning_rate": 0.0019949598184379118, "loss": 2.8707, "step": 2271 }, { "epoch": 0.06, "learning_rate": 0.001994951086864281, "loss": 2.5743, "step": 2272 }, { "epoch": 0.06, "learning_rate": 0.0019949423477530785, "loss": 2.8464, "step": 2273 }, { "epoch": 0.06, "learning_rate": 0.0019949336011043702, "loss": 2.8016, "step": 2274 }, { "epoch": 0.06, "learning_rate": 0.0019949248469182234, "loss": 2.8936, "step": 2275 }, { "epoch": 0.06, "learning_rate": 0.0019949160851947035, "loss": 2.8859, "step": 2276 }, { "epoch": 0.06, "learning_rate": 0.0019949073159338773, "loss": 2.9238, "step": 2277 }, { "epoch": 0.06, "learning_rate": 0.0019948985391358112, "loss": 2.9748, "step": 2278 }, { "epoch": 0.06, "learning_rate": 0.0019948897548005716, "loss": 2.5524, "step": 2279 }, { "epoch": 0.06, "learning_rate": 0.0019948809629282255, "loss": 2.8966, "step": 2280 }, { "epoch": 0.06, "learning_rate": 0.0019948721635188386, "loss": 2.8617, "step": 2281 }, { "epoch": 0.06, "learning_rate": 0.0019948633565724785, "loss": 2.4892, "step": 2282 }, { "epoch": 0.06, "learning_rate": 0.0019948545420892107, "loss": 2.8929, "step": 2283 }, { "epoch": 0.06, "learning_rate": 0.001994845720069103, "loss": 2.6042, "step": 2284 }, { "epoch": 0.06, "learning_rate": 0.0019948368905122224, "loss": 2.5556, "step": 2285 }, { "epoch": 0.06, "learning_rate": 0.0019948280534186355, "loss": 2.9526, "step": 2286 }, { "epoch": 0.06, "learning_rate": 0.0019948192087884085, "loss": 3.2162, "step": 2287 }, { "epoch": 0.06, "learning_rate": 0.0019948103566216095, "loss": 2.8858, "step": 2288 }, { "epoch": 0.06, "learning_rate": 0.0019948014969183047, "loss": 2.6611, "step": 2289 }, { "epoch": 0.06, "learning_rate": 0.001994792629678562, "loss": 2.5204, "step": 2290 }, { "epoch": 0.06, "learning_rate": 0.0019947837549024483, "loss": 2.5977, "step": 2291 }, { "epoch": 0.06, "learning_rate": 0.00199477487259003, "loss": 2.8131, "step": 2292 }, { "epoch": 0.06, "learning_rate": 0.0019947659827413756, "loss": 3.2264, "step": 2293 }, { "epoch": 0.06, "learning_rate": 0.001994757085356552, "loss": 2.8277, "step": 2294 }, { "epoch": 0.06, "learning_rate": 0.0019947481804356263, "loss": 2.7785, "step": 2295 }, { "epoch": 0.06, "learning_rate": 0.0019947392679786667, "loss": 2.6507, "step": 2296 }, { "epoch": 0.06, "learning_rate": 0.0019947303479857397, "loss": 2.832, "step": 2297 }, { "epoch": 0.06, "learning_rate": 0.001994721420456914, "loss": 3.1029, "step": 2298 }, { "epoch": 0.06, "learning_rate": 0.0019947124853922564, "loss": 2.897, "step": 2299 }, { "epoch": 0.06, "learning_rate": 0.0019947035427918345, "loss": 2.826, "step": 2300 }, { "epoch": 0.06, "learning_rate": 0.001994694592655717, "loss": 2.5857, "step": 2301 }, { "epoch": 0.06, "learning_rate": 0.0019946856349839707, "loss": 2.6009, "step": 2302 }, { "epoch": 0.06, "learning_rate": 0.0019946766697766637, "loss": 2.7131, "step": 2303 }, { "epoch": 0.06, "learning_rate": 0.0019946676970338645, "loss": 2.5523, "step": 2304 }, { "epoch": 0.06, "learning_rate": 0.0019946587167556404, "loss": 2.5988, "step": 2305 }, { "epoch": 0.06, "learning_rate": 0.00199464972894206, "loss": 2.8648, "step": 2306 }, { "epoch": 0.06, "learning_rate": 0.0019946407335931907, "loss": 2.8734, "step": 2307 }, { "epoch": 0.06, "learning_rate": 0.0019946317307091015, "loss": 3.1284, "step": 2308 }, { "epoch": 0.06, "learning_rate": 0.0019946227202898596, "loss": 2.7491, "step": 2309 }, { "epoch": 0.06, "learning_rate": 0.001994613702335534, "loss": 2.6043, "step": 2310 }, { "epoch": 0.06, "learning_rate": 0.001994604676846193, "loss": 3.0981, "step": 2311 }, { "epoch": 0.06, "learning_rate": 0.0019945956438219047, "loss": 2.6945, "step": 2312 }, { "epoch": 0.06, "learning_rate": 0.0019945866032627375, "loss": 2.9068, "step": 2313 }, { "epoch": 0.06, "learning_rate": 0.00199457755516876, "loss": 2.6476, "step": 2314 }, { "epoch": 0.06, "learning_rate": 0.001994568499540041, "loss": 2.5155, "step": 2315 }, { "epoch": 0.06, "learning_rate": 0.0019945594363766483, "loss": 2.456, "step": 2316 }, { "epoch": 0.06, "learning_rate": 0.0019945503656786517, "loss": 2.8663, "step": 2317 }, { "epoch": 0.06, "learning_rate": 0.001994541287446119, "loss": 2.8839, "step": 2318 }, { "epoch": 0.06, "learning_rate": 0.0019945322016791194, "loss": 2.5429, "step": 2319 }, { "epoch": 0.06, "learning_rate": 0.0019945231083777215, "loss": 3.098, "step": 2320 }, { "epoch": 0.06, "learning_rate": 0.0019945140075419946, "loss": 2.7139, "step": 2321 }, { "epoch": 0.06, "learning_rate": 0.0019945048991720075, "loss": 2.4705, "step": 2322 }, { "epoch": 0.06, "learning_rate": 0.001994495783267829, "loss": 2.8588, "step": 2323 }, { "epoch": 0.06, "learning_rate": 0.001994486659829528, "loss": 2.5016, "step": 2324 }, { "epoch": 0.06, "learning_rate": 0.001994477528857174, "loss": 2.9993, "step": 2325 }, { "epoch": 0.06, "learning_rate": 0.001994468390350836, "loss": 3.0917, "step": 2326 }, { "epoch": 0.06, "learning_rate": 0.0019944592443105836, "loss": 2.5175, "step": 2327 }, { "epoch": 0.06, "learning_rate": 0.001994450090736485, "loss": 2.8276, "step": 2328 }, { "epoch": 0.06, "learning_rate": 0.0019944409296286107, "loss": 2.7417, "step": 2329 }, { "epoch": 0.06, "learning_rate": 0.00199443176098703, "loss": 2.7238, "step": 2330 }, { "epoch": 0.06, "learning_rate": 0.0019944225848118114, "loss": 2.5964, "step": 2331 }, { "epoch": 0.06, "learning_rate": 0.001994413401103026, "loss": 3.0807, "step": 2332 }, { "epoch": 0.06, "learning_rate": 0.0019944042098607416, "loss": 3.1858, "step": 2333 }, { "epoch": 0.06, "learning_rate": 0.001994395011085029, "loss": 2.7963, "step": 2334 }, { "epoch": 0.06, "learning_rate": 0.0019943858047759577, "loss": 2.9776, "step": 2335 }, { "epoch": 0.06, "learning_rate": 0.0019943765909335976, "loss": 3.0794, "step": 2336 }, { "epoch": 0.06, "learning_rate": 0.001994367369558018, "loss": 2.7251, "step": 2337 }, { "epoch": 0.06, "learning_rate": 0.001994358140649289, "loss": 3.0079, "step": 2338 }, { "epoch": 0.06, "learning_rate": 0.00199434890420748, "loss": 2.6884, "step": 2339 }, { "epoch": 0.06, "learning_rate": 0.001994339660232662, "loss": 2.8847, "step": 2340 }, { "epoch": 0.06, "learning_rate": 0.0019943304087249045, "loss": 2.5932, "step": 2341 }, { "epoch": 0.06, "learning_rate": 0.0019943211496842774, "loss": 2.8078, "step": 2342 }, { "epoch": 0.06, "learning_rate": 0.001994311883110851, "loss": 2.9885, "step": 2343 }, { "epoch": 0.06, "learning_rate": 0.0019943026090046955, "loss": 2.8847, "step": 2344 }, { "epoch": 0.06, "learning_rate": 0.001994293327365881, "loss": 2.4523, "step": 2345 }, { "epoch": 0.06, "learning_rate": 0.0019942840381944786, "loss": 2.3038, "step": 2346 }, { "epoch": 0.06, "learning_rate": 0.0019942747414905576, "loss": 3.168, "step": 2347 }, { "epoch": 0.06, "learning_rate": 0.0019942654372541893, "loss": 2.8451, "step": 2348 }, { "epoch": 0.06, "learning_rate": 0.001994256125485444, "loss": 2.6426, "step": 2349 }, { "epoch": 0.06, "learning_rate": 0.0019942468061843917, "loss": 2.814, "step": 2350 }, { "epoch": 0.06, "learning_rate": 0.001994237479351103, "loss": 3.0313, "step": 2351 }, { "epoch": 0.06, "learning_rate": 0.0019942281449856496, "loss": 2.6301, "step": 2352 }, { "epoch": 0.06, "learning_rate": 0.001994218803088101, "loss": 2.6797, "step": 2353 }, { "epoch": 0.06, "learning_rate": 0.0019942094536585285, "loss": 2.6767, "step": 2354 }, { "epoch": 0.06, "learning_rate": 0.001994200096697003, "loss": 2.9605, "step": 2355 }, { "epoch": 0.06, "learning_rate": 0.001994190732203596, "loss": 2.7411, "step": 2356 }, { "epoch": 0.06, "learning_rate": 0.0019941813601783765, "loss": 2.2678, "step": 2357 }, { "epoch": 0.06, "learning_rate": 0.0019941719806214177, "loss": 2.95, "step": 2358 }, { "epoch": 0.06, "learning_rate": 0.0019941625935327896, "loss": 2.8636, "step": 2359 }, { "epoch": 0.06, "learning_rate": 0.0019941531989125633, "loss": 2.878, "step": 2360 }, { "epoch": 0.06, "learning_rate": 0.00199414379676081, "loss": 2.8547, "step": 2361 }, { "epoch": 0.06, "learning_rate": 0.001994134387077601, "loss": 3.1232, "step": 2362 }, { "epoch": 0.06, "learning_rate": 0.001994124969863008, "loss": 2.8023, "step": 2363 }, { "epoch": 0.06, "learning_rate": 0.0019941155451171015, "loss": 2.5569, "step": 2364 }, { "epoch": 0.06, "learning_rate": 0.001994106112839954, "loss": 2.6886, "step": 2365 }, { "epoch": 0.06, "learning_rate": 0.0019940966730316355, "loss": 2.8097, "step": 2366 }, { "epoch": 0.06, "learning_rate": 0.0019940872256922187, "loss": 2.8801, "step": 2367 }, { "epoch": 0.06, "learning_rate": 0.001994077770821775, "loss": 2.4887, "step": 2368 }, { "epoch": 0.06, "learning_rate": 0.0019940683084203755, "loss": 2.7985, "step": 2369 }, { "epoch": 0.06, "learning_rate": 0.0019940588384880923, "loss": 2.9502, "step": 2370 }, { "epoch": 0.06, "learning_rate": 0.001994049361024997, "loss": 2.8831, "step": 2371 }, { "epoch": 0.06, "learning_rate": 0.0019940398760311616, "loss": 2.7342, "step": 2372 }, { "epoch": 0.06, "learning_rate": 0.001994030383506658, "loss": 3.0546, "step": 2373 }, { "epoch": 0.06, "learning_rate": 0.0019940208834515576, "loss": 2.4313, "step": 2374 }, { "epoch": 0.06, "learning_rate": 0.001994011375865933, "loss": 3.2785, "step": 2375 }, { "epoch": 0.06, "learning_rate": 0.001994001860749856, "loss": 2.6985, "step": 2376 }, { "epoch": 0.06, "learning_rate": 0.001993992338103398, "loss": 2.7633, "step": 2377 }, { "epoch": 0.06, "learning_rate": 0.0019939828079266323, "loss": 2.5883, "step": 2378 }, { "epoch": 0.06, "learning_rate": 0.00199397327021963, "loss": 3.1028, "step": 2379 }, { "epoch": 0.06, "learning_rate": 0.0019939637249824648, "loss": 2.7649, "step": 2380 }, { "epoch": 0.06, "learning_rate": 0.0019939541722152074, "loss": 3.0342, "step": 2381 }, { "epoch": 0.06, "learning_rate": 0.001993944611917931, "loss": 2.7817, "step": 2382 }, { "epoch": 0.06, "learning_rate": 0.001993935044090708, "loss": 2.8641, "step": 2383 }, { "epoch": 0.06, "learning_rate": 0.001993925468733611, "loss": 2.592, "step": 2384 }, { "epoch": 0.06, "learning_rate": 0.001993915885846712, "loss": 2.475, "step": 2385 }, { "epoch": 0.06, "learning_rate": 0.001993906295430084, "loss": 2.7446, "step": 2386 }, { "epoch": 0.06, "learning_rate": 0.0019938966974838, "loss": 2.5456, "step": 2387 }, { "epoch": 0.06, "learning_rate": 0.0019938870920079323, "loss": 2.6393, "step": 2388 }, { "epoch": 0.06, "learning_rate": 0.001993877479002553, "loss": 2.5593, "step": 2389 }, { "epoch": 0.06, "learning_rate": 0.0019938678584677364, "loss": 2.9374, "step": 2390 }, { "epoch": 0.06, "learning_rate": 0.001993858230403554, "loss": 3.2108, "step": 2391 }, { "epoch": 0.06, "learning_rate": 0.0019938485948100796, "loss": 2.8739, "step": 2392 }, { "epoch": 0.06, "learning_rate": 0.001993838951687386, "loss": 2.5835, "step": 2393 }, { "epoch": 0.06, "learning_rate": 0.0019938293010355462, "loss": 2.9042, "step": 2394 }, { "epoch": 0.06, "learning_rate": 0.0019938196428546328, "loss": 2.5934, "step": 2395 }, { "epoch": 0.06, "learning_rate": 0.00199380997714472, "loss": 2.7721, "step": 2396 }, { "epoch": 0.06, "learning_rate": 0.0019938003039058805, "loss": 2.4136, "step": 2397 }, { "epoch": 0.06, "learning_rate": 0.0019937906231381874, "loss": 2.43, "step": 2398 }, { "epoch": 0.06, "learning_rate": 0.001993780934841714, "loss": 2.8665, "step": 2399 }, { "epoch": 0.06, "learning_rate": 0.001993771239016534, "loss": 2.5444, "step": 2400 }, { "epoch": 0.06, "learning_rate": 0.001993761535662721, "loss": 3.1019, "step": 2401 }, { "epoch": 0.06, "learning_rate": 0.001993751824780348, "loss": 2.3979, "step": 2402 }, { "epoch": 0.06, "learning_rate": 0.0019937421063694893, "loss": 2.7469, "step": 2403 }, { "epoch": 0.06, "learning_rate": 0.0019937323804302175, "loss": 2.7391, "step": 2404 }, { "epoch": 0.06, "learning_rate": 0.001993722646962607, "loss": 2.9755, "step": 2405 }, { "epoch": 0.06, "learning_rate": 0.0019937129059667317, "loss": 2.9621, "step": 2406 }, { "epoch": 0.06, "learning_rate": 0.001993703157442665, "loss": 2.8541, "step": 2407 }, { "epoch": 0.06, "learning_rate": 0.0019936934013904807, "loss": 2.8933, "step": 2408 }, { "epoch": 0.06, "learning_rate": 0.001993683637810253, "loss": 3.2251, "step": 2409 }, { "epoch": 0.06, "learning_rate": 0.0019936738667020552, "loss": 2.8801, "step": 2410 }, { "epoch": 0.06, "learning_rate": 0.0019936640880659625, "loss": 2.8557, "step": 2411 }, { "epoch": 0.06, "learning_rate": 0.0019936543019020477, "loss": 2.9102, "step": 2412 }, { "epoch": 0.06, "learning_rate": 0.001993644508210386, "loss": 2.6884, "step": 2413 }, { "epoch": 0.06, "learning_rate": 0.0019936347069910514, "loss": 2.5442, "step": 2414 }, { "epoch": 0.06, "learning_rate": 0.0019936248982441174, "loss": 2.7378, "step": 2415 }, { "epoch": 0.06, "learning_rate": 0.0019936150819696587, "loss": 2.7544, "step": 2416 }, { "epoch": 0.06, "learning_rate": 0.00199360525816775, "loss": 2.7844, "step": 2417 }, { "epoch": 0.06, "learning_rate": 0.0019935954268384655, "loss": 2.6934, "step": 2418 }, { "epoch": 0.07, "learning_rate": 0.00199358558798188, "loss": 3.0668, "step": 2419 }, { "epoch": 0.07, "learning_rate": 0.0019935757415980673, "loss": 3.0355, "step": 2420 }, { "epoch": 0.07, "learning_rate": 0.0019935658876871027, "loss": 2.8136, "step": 2421 }, { "epoch": 0.07, "learning_rate": 0.0019935560262490603, "loss": 2.9974, "step": 2422 }, { "epoch": 0.07, "learning_rate": 0.0019935461572840154, "loss": 2.7086, "step": 2423 }, { "epoch": 0.07, "learning_rate": 0.001993536280792042, "loss": 2.4275, "step": 2424 }, { "epoch": 0.07, "learning_rate": 0.0019935263967732157, "loss": 2.5073, "step": 2425 }, { "epoch": 0.07, "learning_rate": 0.001993516505227611, "loss": 3.0993, "step": 2426 }, { "epoch": 0.07, "learning_rate": 0.001993506606155303, "loss": 3.0579, "step": 2427 }, { "epoch": 0.07, "learning_rate": 0.0019934966995563664, "loss": 2.7671, "step": 2428 }, { "epoch": 0.07, "learning_rate": 0.001993486785430876, "loss": 2.6587, "step": 2429 }, { "epoch": 0.07, "learning_rate": 0.0019934768637789083, "loss": 2.6316, "step": 2430 }, { "epoch": 0.07, "learning_rate": 0.001993466934600537, "loss": 2.797, "step": 2431 }, { "epoch": 0.07, "learning_rate": 0.001993456997895838, "loss": 2.4425, "step": 2432 }, { "epoch": 0.07, "learning_rate": 0.0019934470536648857, "loss": 2.5843, "step": 2433 }, { "epoch": 0.07, "learning_rate": 0.001993437101907757, "loss": 3.1862, "step": 2434 }, { "epoch": 0.07, "learning_rate": 0.0019934271426245258, "loss": 2.587, "step": 2435 }, { "epoch": 0.07, "learning_rate": 0.0019934171758152685, "loss": 2.6763, "step": 2436 }, { "epoch": 0.07, "learning_rate": 0.00199340720148006, "loss": 2.692, "step": 2437 }, { "epoch": 0.07, "learning_rate": 0.0019933972196189763, "loss": 2.606, "step": 2438 }, { "epoch": 0.07, "learning_rate": 0.001993387230232093, "loss": 3.0093, "step": 2439 }, { "epoch": 0.07, "learning_rate": 0.001993377233319486, "loss": 2.8723, "step": 2440 }, { "epoch": 0.07, "learning_rate": 0.0019933672288812297, "loss": 2.7812, "step": 2441 }, { "epoch": 0.07, "learning_rate": 0.0019933572169174014, "loss": 2.9584, "step": 2442 }, { "epoch": 0.07, "learning_rate": 0.0019933471974280764, "loss": 2.5906, "step": 2443 }, { "epoch": 0.07, "learning_rate": 0.001993337170413331, "loss": 2.4933, "step": 2444 }, { "epoch": 0.07, "learning_rate": 0.00199332713587324, "loss": 2.8439, "step": 2445 }, { "epoch": 0.07, "learning_rate": 0.0019933170938078813, "loss": 3.0751, "step": 2446 }, { "epoch": 0.07, "learning_rate": 0.001993307044217329, "loss": 2.6244, "step": 2447 }, { "epoch": 0.07, "learning_rate": 0.0019932969871016603, "loss": 2.6747, "step": 2448 }, { "epoch": 0.07, "learning_rate": 0.0019932869224609513, "loss": 2.9742, "step": 2449 }, { "epoch": 0.07, "learning_rate": 0.001993276850295278, "loss": 2.8693, "step": 2450 }, { "epoch": 0.07, "learning_rate": 0.0019932667706047172, "loss": 2.7718, "step": 2451 }, { "epoch": 0.07, "learning_rate": 0.001993256683389345, "loss": 2.7276, "step": 2452 }, { "epoch": 0.07, "learning_rate": 0.001993246588649237, "loss": 2.9141, "step": 2453 }, { "epoch": 0.07, "learning_rate": 0.001993236486384471, "loss": 3.1946, "step": 2454 }, { "epoch": 0.07, "learning_rate": 0.001993226376595123, "loss": 2.691, "step": 2455 }, { "epoch": 0.07, "learning_rate": 0.001993216259281269, "loss": 3.0515, "step": 2456 }, { "epoch": 0.07, "learning_rate": 0.0019932061344429867, "loss": 2.6828, "step": 2457 }, { "epoch": 0.07, "learning_rate": 0.001993196002080352, "loss": 2.493, "step": 2458 }, { "epoch": 0.07, "learning_rate": 0.0019931858621934423, "loss": 2.7178, "step": 2459 }, { "epoch": 0.07, "learning_rate": 0.001993175714782334, "loss": 2.8412, "step": 2460 }, { "epoch": 0.07, "learning_rate": 0.001993165559847104, "loss": 2.708, "step": 2461 }, { "epoch": 0.07, "learning_rate": 0.001993155397387829, "loss": 3.1554, "step": 2462 }, { "epoch": 0.07, "learning_rate": 0.001993145227404587, "loss": 2.6883, "step": 2463 }, { "epoch": 0.07, "learning_rate": 0.0019931350498974534, "loss": 2.9636, "step": 2464 }, { "epoch": 0.07, "learning_rate": 0.0019931248648665067, "loss": 2.887, "step": 2465 }, { "epoch": 0.07, "learning_rate": 0.0019931146723118232, "loss": 2.9072, "step": 2466 }, { "epoch": 0.07, "learning_rate": 0.001993104472233481, "loss": 3.1527, "step": 2467 }, { "epoch": 0.07, "learning_rate": 0.001993094264631557, "loss": 2.9665, "step": 2468 }, { "epoch": 0.07, "learning_rate": 0.001993084049506128, "loss": 2.8174, "step": 2469 }, { "epoch": 0.07, "learning_rate": 0.0019930738268572716, "loss": 2.791, "step": 2470 }, { "epoch": 0.07, "learning_rate": 0.0019930635966850657, "loss": 2.7914, "step": 2471 }, { "epoch": 0.07, "learning_rate": 0.0019930533589895875, "loss": 2.9277, "step": 2472 }, { "epoch": 0.07, "learning_rate": 0.0019930431137709145, "loss": 2.8527, "step": 2473 }, { "epoch": 0.07, "learning_rate": 0.001993032861029125, "loss": 3.0576, "step": 2474 }, { "epoch": 0.07, "learning_rate": 0.001993022600764295, "loss": 3.1522, "step": 2475 }, { "epoch": 0.07, "learning_rate": 0.0019930123329765046, "loss": 2.5422, "step": 2476 }, { "epoch": 0.07, "learning_rate": 0.0019930020576658294, "loss": 2.6494, "step": 2477 }, { "epoch": 0.07, "learning_rate": 0.0019929917748323484, "loss": 2.5819, "step": 2478 }, { "epoch": 0.07, "learning_rate": 0.0019929814844761393, "loss": 2.7911, "step": 2479 }, { "epoch": 0.07, "learning_rate": 0.00199297118659728, "loss": 3.0145, "step": 2480 }, { "epoch": 0.07, "learning_rate": 0.001992960881195848, "loss": 2.989, "step": 2481 }, { "epoch": 0.07, "learning_rate": 0.0019929505682719224, "loss": 2.9092, "step": 2482 }, { "epoch": 0.07, "learning_rate": 0.0019929402478255807, "loss": 2.6989, "step": 2483 }, { "epoch": 0.07, "learning_rate": 0.001992929919856901, "loss": 2.7724, "step": 2484 }, { "epoch": 0.07, "learning_rate": 0.0019929195843659624, "loss": 2.9915, "step": 2485 }, { "epoch": 0.07, "learning_rate": 0.001992909241352842, "loss": 3.4591, "step": 2486 }, { "epoch": 0.07, "learning_rate": 0.0019928988908176188, "loss": 2.7109, "step": 2487 }, { "epoch": 0.07, "learning_rate": 0.0019928885327603714, "loss": 2.9214, "step": 2488 }, { "epoch": 0.07, "learning_rate": 0.0019928781671811773, "loss": 2.7851, "step": 2489 }, { "epoch": 0.07, "learning_rate": 0.0019928677940801165, "loss": 2.7557, "step": 2490 }, { "epoch": 0.07, "learning_rate": 0.0019928574134572665, "loss": 3.2135, "step": 2491 }, { "epoch": 0.07, "learning_rate": 0.001992847025312706, "loss": 2.569, "step": 2492 }, { "epoch": 0.07, "learning_rate": 0.001992836629646514, "loss": 2.5653, "step": 2493 }, { "epoch": 0.07, "learning_rate": 0.0019928262264587693, "loss": 2.8768, "step": 2494 }, { "epoch": 0.07, "learning_rate": 0.001992815815749551, "loss": 2.6854, "step": 2495 }, { "epoch": 0.07, "learning_rate": 0.001992805397518937, "loss": 2.7239, "step": 2496 }, { "epoch": 0.07, "learning_rate": 0.001992794971767007, "loss": 2.4658, "step": 2497 }, { "epoch": 0.07, "learning_rate": 0.00199278453849384, "loss": 3.0718, "step": 2498 }, { "epoch": 0.07, "learning_rate": 0.0019927740976995144, "loss": 2.8535, "step": 2499 }, { "epoch": 0.07, "learning_rate": 0.00199276364938411, "loss": 2.635, "step": 2500 }, { "epoch": 0.07, "learning_rate": 0.0019927531935477055, "loss": 2.6792, "step": 2501 }, { "epoch": 0.07, "learning_rate": 0.001992742730190381, "loss": 3.0614, "step": 2502 }, { "epoch": 0.07, "learning_rate": 0.001992732259312214, "loss": 3.2386, "step": 2503 }, { "epoch": 0.07, "learning_rate": 0.0019927217809132857, "loss": 2.8313, "step": 2504 }, { "epoch": 0.07, "learning_rate": 0.0019927112949936743, "loss": 2.5509, "step": 2505 }, { "epoch": 0.07, "learning_rate": 0.0019927008015534595, "loss": 2.8103, "step": 2506 }, { "epoch": 0.07, "learning_rate": 0.001992690300592721, "loss": 2.7436, "step": 2507 }, { "epoch": 0.07, "learning_rate": 0.0019926797921115385, "loss": 2.8444, "step": 2508 }, { "epoch": 0.07, "learning_rate": 0.001992669276109991, "loss": 2.8511, "step": 2509 }, { "epoch": 0.07, "learning_rate": 0.001992658752588159, "loss": 2.3969, "step": 2510 }, { "epoch": 0.07, "learning_rate": 0.0019926482215461214, "loss": 2.9511, "step": 2511 }, { "epoch": 0.07, "learning_rate": 0.0019926376829839587, "loss": 2.6968, "step": 2512 }, { "epoch": 0.07, "learning_rate": 0.0019926271369017498, "loss": 3.023, "step": 2513 }, { "epoch": 0.07, "learning_rate": 0.0019926165832995757, "loss": 2.9363, "step": 2514 }, { "epoch": 0.07, "learning_rate": 0.0019926060221775155, "loss": 3.1102, "step": 2515 }, { "epoch": 0.07, "learning_rate": 0.00199259545353565, "loss": 2.7051, "step": 2516 }, { "epoch": 0.07, "learning_rate": 0.0019925848773740583, "loss": 3.076, "step": 2517 }, { "epoch": 0.07, "learning_rate": 0.001992574293692821, "loss": 2.8816, "step": 2518 }, { "epoch": 0.07, "learning_rate": 0.0019925637024920183, "loss": 2.8659, "step": 2519 }, { "epoch": 0.07, "learning_rate": 0.001992553103771731, "loss": 2.3819, "step": 2520 }, { "epoch": 0.07, "learning_rate": 0.0019925424975320385, "loss": 2.5158, "step": 2521 }, { "epoch": 0.07, "learning_rate": 0.0019925318837730214, "loss": 2.6453, "step": 2522 }, { "epoch": 0.07, "learning_rate": 0.00199252126249476, "loss": 2.9426, "step": 2523 }, { "epoch": 0.07, "learning_rate": 0.0019925106336973353, "loss": 2.8807, "step": 2524 }, { "epoch": 0.07, "learning_rate": 0.0019924999973808277, "loss": 2.5824, "step": 2525 }, { "epoch": 0.07, "learning_rate": 0.0019924893535453172, "loss": 2.5812, "step": 2526 }, { "epoch": 0.07, "learning_rate": 0.0019924787021908846, "loss": 2.6166, "step": 2527 }, { "epoch": 0.07, "learning_rate": 0.0019924680433176115, "loss": 2.6302, "step": 2528 }, { "epoch": 0.07, "learning_rate": 0.0019924573769255776, "loss": 2.9727, "step": 2529 }, { "epoch": 0.07, "learning_rate": 0.001992446703014864, "loss": 2.7052, "step": 2530 }, { "epoch": 0.07, "learning_rate": 0.0019924360215855513, "loss": 2.9646, "step": 2531 }, { "epoch": 0.07, "learning_rate": 0.0019924253326377207, "loss": 3.1051, "step": 2532 }, { "epoch": 0.07, "learning_rate": 0.0019924146361714537, "loss": 2.6161, "step": 2533 }, { "epoch": 0.07, "learning_rate": 0.001992403932186831, "loss": 2.7687, "step": 2534 }, { "epoch": 0.07, "learning_rate": 0.001992393220683933, "loss": 3.0883, "step": 2535 }, { "epoch": 0.07, "learning_rate": 0.0019923825016628415, "loss": 3.098, "step": 2536 }, { "epoch": 0.07, "learning_rate": 0.0019923717751236377, "loss": 2.9431, "step": 2537 }, { "epoch": 0.07, "learning_rate": 0.0019923610410664027, "loss": 3.1073, "step": 2538 }, { "epoch": 0.07, "learning_rate": 0.001992350299491218, "loss": 2.6689, "step": 2539 }, { "epoch": 0.07, "learning_rate": 0.0019923395503981646, "loss": 2.3566, "step": 2540 }, { "epoch": 0.07, "learning_rate": 0.0019923287937873243, "loss": 2.9927, "step": 2541 }, { "epoch": 0.07, "learning_rate": 0.0019923180296587788, "loss": 2.5999, "step": 2542 }, { "epoch": 0.07, "learning_rate": 0.0019923072580126087, "loss": 3.001, "step": 2543 }, { "epoch": 0.07, "learning_rate": 0.0019922964788488965, "loss": 3.0813, "step": 2544 }, { "epoch": 0.07, "learning_rate": 0.0019922856921677236, "loss": 2.8924, "step": 2545 }, { "epoch": 0.07, "learning_rate": 0.0019922748979691717, "loss": 2.6397, "step": 2546 }, { "epoch": 0.07, "learning_rate": 0.0019922640962533227, "loss": 2.8483, "step": 2547 }, { "epoch": 0.07, "learning_rate": 0.001992253287020258, "loss": 2.7674, "step": 2548 }, { "epoch": 0.07, "learning_rate": 0.00199224247027006, "loss": 2.6477, "step": 2549 }, { "epoch": 0.07, "learning_rate": 0.0019922316460028104, "loss": 2.8197, "step": 2550 }, { "epoch": 0.07, "learning_rate": 0.0019922208142185913, "loss": 3.256, "step": 2551 }, { "epoch": 0.07, "learning_rate": 0.001992209974917485, "loss": 2.6459, "step": 2552 }, { "epoch": 0.07, "learning_rate": 0.0019921991280995727, "loss": 3.1236, "step": 2553 }, { "epoch": 0.07, "learning_rate": 0.0019921882737649376, "loss": 2.8618, "step": 2554 }, { "epoch": 0.07, "learning_rate": 0.0019921774119136615, "loss": 2.7522, "step": 2555 }, { "epoch": 0.07, "learning_rate": 0.001992166542545826, "loss": 2.7293, "step": 2556 }, { "epoch": 0.07, "learning_rate": 0.0019921556656615153, "loss": 2.615, "step": 2557 }, { "epoch": 0.07, "learning_rate": 0.00199214478126081, "loss": 2.731, "step": 2558 }, { "epoch": 0.07, "learning_rate": 0.001992133889343793, "loss": 2.7911, "step": 2559 }, { "epoch": 0.07, "learning_rate": 0.0019921229899105474, "loss": 2.78, "step": 2560 }, { "epoch": 0.07, "learning_rate": 0.0019921120829611556, "loss": 2.6115, "step": 2561 }, { "epoch": 0.07, "learning_rate": 0.0019921011684957, "loss": 2.9494, "step": 2562 }, { "epoch": 0.07, "learning_rate": 0.001992090246514263, "loss": 2.448, "step": 2563 }, { "epoch": 0.07, "learning_rate": 0.001992079317016928, "loss": 2.7876, "step": 2564 }, { "epoch": 0.07, "learning_rate": 0.001992068380003777, "loss": 3.0187, "step": 2565 }, { "epoch": 0.07, "learning_rate": 0.0019920574354748933, "loss": 2.7881, "step": 2566 }, { "epoch": 0.07, "learning_rate": 0.0019920464834303603, "loss": 2.736, "step": 2567 }, { "epoch": 0.07, "learning_rate": 0.0019920355238702606, "loss": 2.3665, "step": 2568 }, { "epoch": 0.07, "learning_rate": 0.0019920245567946766, "loss": 2.818, "step": 2569 }, { "epoch": 0.07, "learning_rate": 0.0019920135822036923, "loss": 2.6465, "step": 2570 }, { "epoch": 0.07, "learning_rate": 0.0019920026000973903, "loss": 2.7163, "step": 2571 }, { "epoch": 0.07, "learning_rate": 0.001991991610475854, "loss": 2.9474, "step": 2572 }, { "epoch": 0.07, "learning_rate": 0.0019919806133391663, "loss": 2.8748, "step": 2573 }, { "epoch": 0.07, "learning_rate": 0.0019919696086874114, "loss": 2.9995, "step": 2574 }, { "epoch": 0.07, "learning_rate": 0.0019919585965206717, "loss": 2.914, "step": 2575 }, { "epoch": 0.07, "learning_rate": 0.001991947576839031, "loss": 3.1197, "step": 2576 }, { "epoch": 0.07, "learning_rate": 0.001991936549642573, "loss": 2.6784, "step": 2577 }, { "epoch": 0.07, "learning_rate": 0.001991925514931381, "loss": 2.4537, "step": 2578 }, { "epoch": 0.07, "learning_rate": 0.0019919144727055384, "loss": 2.7562, "step": 2579 }, { "epoch": 0.07, "learning_rate": 0.0019919034229651292, "loss": 2.8129, "step": 2580 }, { "epoch": 0.07, "learning_rate": 0.001991892365710237, "loss": 2.8738, "step": 2581 }, { "epoch": 0.07, "learning_rate": 0.001991881300940946, "loss": 2.5841, "step": 2582 }, { "epoch": 0.07, "learning_rate": 0.0019918702286573393, "loss": 2.816, "step": 2583 }, { "epoch": 0.07, "learning_rate": 0.001991859148859501, "loss": 2.7282, "step": 2584 }, { "epoch": 0.07, "learning_rate": 0.0019918480615475154, "loss": 3.2078, "step": 2585 }, { "epoch": 0.07, "learning_rate": 0.0019918369667214658, "loss": 2.6484, "step": 2586 }, { "epoch": 0.07, "learning_rate": 0.0019918258643814367, "loss": 2.4652, "step": 2587 }, { "epoch": 0.07, "learning_rate": 0.0019918147545275123, "loss": 2.8338, "step": 2588 }, { "epoch": 0.07, "learning_rate": 0.0019918036371597767, "loss": 2.5457, "step": 2589 }, { "epoch": 0.07, "learning_rate": 0.001991792512278314, "loss": 2.4149, "step": 2590 }, { "epoch": 0.07, "learning_rate": 0.0019917813798832084, "loss": 3.1486, "step": 2591 }, { "epoch": 0.07, "learning_rate": 0.0019917702399745445, "loss": 2.7672, "step": 2592 }, { "epoch": 0.07, "learning_rate": 0.0019917590925524068, "loss": 2.8902, "step": 2593 }, { "epoch": 0.07, "learning_rate": 0.0019917479376168794, "loss": 2.9203, "step": 2594 }, { "epoch": 0.07, "learning_rate": 0.0019917367751680465, "loss": 2.7929, "step": 2595 }, { "epoch": 0.07, "learning_rate": 0.0019917256052059936, "loss": 2.5847, "step": 2596 }, { "epoch": 0.07, "learning_rate": 0.0019917144277308047, "loss": 2.5744, "step": 2597 }, { "epoch": 0.07, "learning_rate": 0.0019917032427425644, "loss": 2.7406, "step": 2598 }, { "epoch": 0.07, "learning_rate": 0.0019916920502413577, "loss": 2.7455, "step": 2599 }, { "epoch": 0.07, "learning_rate": 0.0019916808502272697, "loss": 2.6485, "step": 2600 }, { "epoch": 0.07, "learning_rate": 0.0019916696427003844, "loss": 2.7694, "step": 2601 }, { "epoch": 0.07, "learning_rate": 0.0019916584276607873, "loss": 2.4612, "step": 2602 }, { "epoch": 0.07, "learning_rate": 0.0019916472051085634, "loss": 2.7142, "step": 2603 }, { "epoch": 0.07, "learning_rate": 0.0019916359750437977, "loss": 2.9143, "step": 2604 }, { "epoch": 0.07, "learning_rate": 0.001991624737466575, "loss": 2.7519, "step": 2605 }, { "epoch": 0.07, "learning_rate": 0.0019916134923769805, "loss": 2.8693, "step": 2606 }, { "epoch": 0.07, "learning_rate": 0.0019916022397750994, "loss": 2.934, "step": 2607 }, { "epoch": 0.07, "learning_rate": 0.001991590979661017, "loss": 2.7596, "step": 2608 }, { "epoch": 0.07, "learning_rate": 0.0019915797120348185, "loss": 2.9898, "step": 2609 }, { "epoch": 0.07, "learning_rate": 0.0019915684368965896, "loss": 2.5584, "step": 2610 }, { "epoch": 0.07, "learning_rate": 0.0019915571542464157, "loss": 2.3883, "step": 2611 }, { "epoch": 0.07, "learning_rate": 0.0019915458640843817, "loss": 2.9856, "step": 2612 }, { "epoch": 0.07, "learning_rate": 0.001991534566410574, "loss": 2.4278, "step": 2613 }, { "epoch": 0.07, "learning_rate": 0.001991523261225077, "loss": 2.5406, "step": 2614 }, { "epoch": 0.07, "learning_rate": 0.0019915119485279776, "loss": 2.6679, "step": 2615 }, { "epoch": 0.07, "learning_rate": 0.0019915006283193607, "loss": 2.8442, "step": 2616 }, { "epoch": 0.07, "learning_rate": 0.0019914893005993123, "loss": 2.7964, "step": 2617 }, { "epoch": 0.07, "learning_rate": 0.001991477965367918, "loss": 3.008, "step": 2618 }, { "epoch": 0.07, "learning_rate": 0.0019914666226252646, "loss": 2.8003, "step": 2619 }, { "epoch": 0.07, "learning_rate": 0.0019914552723714367, "loss": 2.7118, "step": 2620 }, { "epoch": 0.07, "learning_rate": 0.001991443914606521, "loss": 2.4274, "step": 2621 }, { "epoch": 0.07, "learning_rate": 0.0019914325493306036, "loss": 2.9233, "step": 2622 }, { "epoch": 0.07, "learning_rate": 0.0019914211765437702, "loss": 2.9713, "step": 2623 }, { "epoch": 0.07, "learning_rate": 0.0019914097962461077, "loss": 3.0045, "step": 2624 }, { "epoch": 0.07, "learning_rate": 0.0019913984084377013, "loss": 2.7362, "step": 2625 }, { "epoch": 0.07, "learning_rate": 0.0019913870131186384, "loss": 2.6147, "step": 2626 }, { "epoch": 0.07, "learning_rate": 0.0019913756102890043, "loss": 2.745, "step": 2627 }, { "epoch": 0.07, "learning_rate": 0.001991364199948886, "loss": 2.7602, "step": 2628 }, { "epoch": 0.07, "learning_rate": 0.0019913527820983696, "loss": 2.5302, "step": 2629 }, { "epoch": 0.07, "learning_rate": 0.0019913413567375416, "loss": 2.8341, "step": 2630 }, { "epoch": 0.07, "learning_rate": 0.001991329923866489, "loss": 2.7146, "step": 2631 }, { "epoch": 0.07, "learning_rate": 0.0019913184834852984, "loss": 2.8941, "step": 2632 }, { "epoch": 0.07, "learning_rate": 0.001991307035594056, "loss": 2.4553, "step": 2633 }, { "epoch": 0.07, "learning_rate": 0.001991295580192848, "loss": 2.5808, "step": 2634 }, { "epoch": 0.07, "learning_rate": 0.0019912841172817627, "loss": 3.0664, "step": 2635 }, { "epoch": 0.07, "learning_rate": 0.001991272646860886, "loss": 2.7943, "step": 2636 }, { "epoch": 0.07, "learning_rate": 0.001991261168930305, "loss": 2.7299, "step": 2637 }, { "epoch": 0.07, "learning_rate": 0.0019912496834901066, "loss": 2.7514, "step": 2638 }, { "epoch": 0.07, "learning_rate": 0.0019912381905403775, "loss": 2.7651, "step": 2639 }, { "epoch": 0.07, "learning_rate": 0.0019912266900812053, "loss": 2.7567, "step": 2640 }, { "epoch": 0.07, "learning_rate": 0.001991215182112677, "loss": 2.676, "step": 2641 }, { "epoch": 0.07, "learning_rate": 0.0019912036666348797, "loss": 2.9642, "step": 2642 }, { "epoch": 0.07, "learning_rate": 0.0019911921436479006, "loss": 3.0857, "step": 2643 }, { "epoch": 0.07, "learning_rate": 0.001991180613151827, "loss": 2.7349, "step": 2644 }, { "epoch": 0.07, "learning_rate": 0.001991169075146746, "loss": 2.7762, "step": 2645 }, { "epoch": 0.07, "learning_rate": 0.0019911575296327456, "loss": 2.7745, "step": 2646 }, { "epoch": 0.07, "learning_rate": 0.001991145976609913, "loss": 3.1318, "step": 2647 }, { "epoch": 0.07, "learning_rate": 0.0019911344160783357, "loss": 2.7563, "step": 2648 }, { "epoch": 0.07, "learning_rate": 0.001991122848038101, "loss": 2.8717, "step": 2649 }, { "epoch": 0.07, "learning_rate": 0.001991111272489297, "loss": 2.7705, "step": 2650 }, { "epoch": 0.07, "learning_rate": 0.001991099689432011, "loss": 2.8111, "step": 2651 }, { "epoch": 0.07, "learning_rate": 0.001991088098866331, "loss": 2.5842, "step": 2652 }, { "epoch": 0.07, "learning_rate": 0.001991076500792345, "loss": 3.1607, "step": 2653 }, { "epoch": 0.07, "learning_rate": 0.0019910648952101402, "loss": 2.9652, "step": 2654 }, { "epoch": 0.07, "learning_rate": 0.001991053282119806, "loss": 2.7928, "step": 2655 }, { "epoch": 0.07, "learning_rate": 0.001991041661521428, "loss": 3.0858, "step": 2656 }, { "epoch": 0.07, "learning_rate": 0.001991030033415096, "loss": 3.0674, "step": 2657 }, { "epoch": 0.07, "learning_rate": 0.001991018397800898, "loss": 2.8635, "step": 2658 }, { "epoch": 0.07, "learning_rate": 0.0019910067546789214, "loss": 2.7072, "step": 2659 }, { "epoch": 0.07, "learning_rate": 0.001990995104049255, "loss": 3.2277, "step": 2660 }, { "epoch": 0.07, "learning_rate": 0.001990983445911987, "loss": 2.6497, "step": 2661 }, { "epoch": 0.07, "learning_rate": 0.0019909717802672052, "loss": 2.6075, "step": 2662 }, { "epoch": 0.07, "learning_rate": 0.0019909601071149987, "loss": 2.8016, "step": 2663 }, { "epoch": 0.07, "learning_rate": 0.0019909484264554553, "loss": 2.6302, "step": 2664 }, { "epoch": 0.07, "learning_rate": 0.0019909367382886637, "loss": 2.9771, "step": 2665 }, { "epoch": 0.07, "learning_rate": 0.001990925042614713, "loss": 2.6305, "step": 2666 }, { "epoch": 0.07, "learning_rate": 0.0019909133394336908, "loss": 2.6068, "step": 2667 }, { "epoch": 0.07, "learning_rate": 0.001990901628745687, "loss": 2.8503, "step": 2668 }, { "epoch": 0.07, "learning_rate": 0.001990889910550789, "loss": 3.0324, "step": 2669 }, { "epoch": 0.07, "learning_rate": 0.0019908781848490863, "loss": 2.7818, "step": 2670 }, { "epoch": 0.07, "learning_rate": 0.001990866451640668, "loss": 3.1046, "step": 2671 }, { "epoch": 0.07, "learning_rate": 0.001990854710925622, "loss": 2.6267, "step": 2672 }, { "epoch": 0.07, "learning_rate": 0.0019908429627040385, "loss": 2.4503, "step": 2673 }, { "epoch": 0.07, "learning_rate": 0.001990831206976005, "loss": 2.8372, "step": 2674 }, { "epoch": 0.07, "learning_rate": 0.0019908194437416125, "loss": 3.056, "step": 2675 }, { "epoch": 0.07, "learning_rate": 0.001990807673000948, "loss": 2.7447, "step": 2676 }, { "epoch": 0.07, "learning_rate": 0.001990795894754103, "loss": 2.7429, "step": 2677 }, { "epoch": 0.07, "learning_rate": 0.001990784109001164, "loss": 2.4695, "step": 2678 }, { "epoch": 0.07, "learning_rate": 0.0019907723157422228, "loss": 2.5373, "step": 2679 }, { "epoch": 0.07, "learning_rate": 0.001990760514977367, "loss": 2.327, "step": 2680 }, { "epoch": 0.07, "learning_rate": 0.0019907487067066867, "loss": 2.802, "step": 2681 }, { "epoch": 0.07, "learning_rate": 0.0019907368909302717, "loss": 2.8831, "step": 2682 }, { "epoch": 0.07, "learning_rate": 0.0019907250676482113, "loss": 2.6398, "step": 2683 }, { "epoch": 0.07, "learning_rate": 0.0019907132368605944, "loss": 2.9355, "step": 2684 }, { "epoch": 0.07, "learning_rate": 0.0019907013985675116, "loss": 2.3031, "step": 2685 }, { "epoch": 0.07, "learning_rate": 0.001990689552769052, "loss": 2.9224, "step": 2686 }, { "epoch": 0.07, "learning_rate": 0.0019906776994653053, "loss": 2.88, "step": 2687 }, { "epoch": 0.07, "learning_rate": 0.0019906658386563613, "loss": 2.8376, "step": 2688 }, { "epoch": 0.07, "learning_rate": 0.00199065397034231, "loss": 2.3334, "step": 2689 }, { "epoch": 0.07, "learning_rate": 0.0019906420945232416, "loss": 2.5534, "step": 2690 }, { "epoch": 0.07, "learning_rate": 0.0019906302111992458, "loss": 2.349, "step": 2691 }, { "epoch": 0.07, "learning_rate": 0.0019906183203704125, "loss": 2.8906, "step": 2692 }, { "epoch": 0.07, "learning_rate": 0.001990606422036832, "loss": 2.8178, "step": 2693 }, { "epoch": 0.07, "learning_rate": 0.0019905945161985943, "loss": 2.6438, "step": 2694 }, { "epoch": 0.07, "learning_rate": 0.00199058260285579, "loss": 2.9439, "step": 2695 }, { "epoch": 0.07, "learning_rate": 0.0019905706820085084, "loss": 2.6975, "step": 2696 }, { "epoch": 0.07, "learning_rate": 0.001990558753656841, "loss": 2.9944, "step": 2697 }, { "epoch": 0.07, "learning_rate": 0.001990546817800877, "loss": 2.8544, "step": 2698 }, { "epoch": 0.07, "learning_rate": 0.0019905348744407077, "loss": 2.7803, "step": 2699 }, { "epoch": 0.07, "learning_rate": 0.0019905229235764235, "loss": 2.6094, "step": 2700 }, { "epoch": 0.07, "learning_rate": 0.0019905109652081144, "loss": 2.8605, "step": 2701 }, { "epoch": 0.07, "learning_rate": 0.0019904989993358717, "loss": 2.7115, "step": 2702 }, { "epoch": 0.07, "learning_rate": 0.001990487025959785, "loss": 2.8636, "step": 2703 }, { "epoch": 0.07, "learning_rate": 0.001990475045079946, "loss": 2.8947, "step": 2704 }, { "epoch": 0.07, "learning_rate": 0.0019904630566964453, "loss": 2.8428, "step": 2705 }, { "epoch": 0.07, "learning_rate": 0.0019904510608093734, "loss": 2.9336, "step": 2706 }, { "epoch": 0.07, "learning_rate": 0.0019904390574188215, "loss": 2.6324, "step": 2707 }, { "epoch": 0.07, "learning_rate": 0.00199042704652488, "loss": 2.9658, "step": 2708 }, { "epoch": 0.07, "learning_rate": 0.0019904150281276406, "loss": 2.6434, "step": 2709 }, { "epoch": 0.07, "learning_rate": 0.001990403002227194, "loss": 2.9749, "step": 2710 }, { "epoch": 0.07, "learning_rate": 0.0019903909688236314, "loss": 2.7144, "step": 2711 }, { "epoch": 0.07, "learning_rate": 0.0019903789279170437, "loss": 2.8632, "step": 2712 }, { "epoch": 0.07, "learning_rate": 0.0019903668795075223, "loss": 2.9181, "step": 2713 }, { "epoch": 0.07, "learning_rate": 0.0019903548235951584, "loss": 2.7677, "step": 2714 }, { "epoch": 0.07, "learning_rate": 0.001990342760180044, "loss": 2.963, "step": 2715 }, { "epoch": 0.07, "learning_rate": 0.0019903306892622694, "loss": 2.65, "step": 2716 }, { "epoch": 0.07, "learning_rate": 0.001990318610841926, "loss": 2.9127, "step": 2717 }, { "epoch": 0.07, "learning_rate": 0.0019903065249191067, "loss": 3.043, "step": 2718 }, { "epoch": 0.07, "learning_rate": 0.001990294431493902, "loss": 2.9323, "step": 2719 }, { "epoch": 0.07, "learning_rate": 0.0019902823305664036, "loss": 2.6107, "step": 2720 }, { "epoch": 0.07, "learning_rate": 0.0019902702221367037, "loss": 2.4008, "step": 2721 }, { "epoch": 0.07, "learning_rate": 0.0019902581062048934, "loss": 2.8955, "step": 2722 }, { "epoch": 0.07, "learning_rate": 0.0019902459827710645, "loss": 2.8542, "step": 2723 }, { "epoch": 0.07, "learning_rate": 0.0019902338518353094, "loss": 2.791, "step": 2724 }, { "epoch": 0.07, "learning_rate": 0.0019902217133977193, "loss": 2.8317, "step": 2725 }, { "epoch": 0.07, "learning_rate": 0.001990209567458387, "loss": 3.1046, "step": 2726 }, { "epoch": 0.07, "learning_rate": 0.0019901974140174037, "loss": 2.6767, "step": 2727 }, { "epoch": 0.07, "learning_rate": 0.001990185253074862, "loss": 3.0461, "step": 2728 }, { "epoch": 0.07, "learning_rate": 0.001990173084630854, "loss": 2.8271, "step": 2729 }, { "epoch": 0.07, "learning_rate": 0.0019901609086854714, "loss": 2.8203, "step": 2730 }, { "epoch": 0.07, "learning_rate": 0.0019901487252388067, "loss": 2.6145, "step": 2731 }, { "epoch": 0.07, "learning_rate": 0.0019901365342909526, "loss": 2.9784, "step": 2732 }, { "epoch": 0.07, "learning_rate": 0.001990124335842001, "loss": 2.7551, "step": 2733 }, { "epoch": 0.07, "learning_rate": 0.0019901121298920446, "loss": 2.8416, "step": 2734 }, { "epoch": 0.07, "learning_rate": 0.001990099916441176, "loss": 3.1254, "step": 2735 }, { "epoch": 0.07, "learning_rate": 0.0019900876954894865, "loss": 2.8599, "step": 2736 }, { "epoch": 0.07, "learning_rate": 0.0019900754670370705, "loss": 2.811, "step": 2737 }, { "epoch": 0.07, "learning_rate": 0.0019900632310840194, "loss": 2.3835, "step": 2738 }, { "epoch": 0.07, "learning_rate": 0.001990050987630426, "loss": 2.5744, "step": 2739 }, { "epoch": 0.07, "learning_rate": 0.0019900387366763835, "loss": 2.5863, "step": 2740 }, { "epoch": 0.07, "learning_rate": 0.0019900264782219852, "loss": 3.0878, "step": 2741 }, { "epoch": 0.07, "learning_rate": 0.0019900142122673227, "loss": 2.4896, "step": 2742 }, { "epoch": 0.07, "learning_rate": 0.0019900019388124895, "loss": 2.8594, "step": 2743 }, { "epoch": 0.07, "learning_rate": 0.0019899896578575785, "loss": 2.6905, "step": 2744 }, { "epoch": 0.07, "learning_rate": 0.0019899773694026833, "loss": 2.8655, "step": 2745 }, { "epoch": 0.07, "learning_rate": 0.0019899650734478964, "loss": 2.7039, "step": 2746 }, { "epoch": 0.07, "learning_rate": 0.001989952769993311, "loss": 2.8919, "step": 2747 }, { "epoch": 0.07, "learning_rate": 0.0019899404590390203, "loss": 2.9985, "step": 2748 }, { "epoch": 0.07, "learning_rate": 0.0019899281405851175, "loss": 2.7684, "step": 2749 }, { "epoch": 0.07, "learning_rate": 0.0019899158146316964, "loss": 2.7384, "step": 2750 }, { "epoch": 0.07, "learning_rate": 0.00198990348117885, "loss": 2.7265, "step": 2751 }, { "epoch": 0.07, "learning_rate": 0.001989891140226672, "loss": 2.6578, "step": 2752 }, { "epoch": 0.07, "learning_rate": 0.0019898787917752556, "loss": 2.7735, "step": 2753 }, { "epoch": 0.07, "learning_rate": 0.0019898664358246943, "loss": 2.5972, "step": 2754 }, { "epoch": 0.07, "learning_rate": 0.0019898540723750817, "loss": 2.7732, "step": 2755 }, { "epoch": 0.07, "learning_rate": 0.001989841701426512, "loss": 2.8651, "step": 2756 }, { "epoch": 0.07, "learning_rate": 0.0019898293229790786, "loss": 2.5913, "step": 2757 }, { "epoch": 0.07, "learning_rate": 0.0019898169370328746, "loss": 2.5754, "step": 2758 }, { "epoch": 0.07, "learning_rate": 0.001989804543587995, "loss": 2.8313, "step": 2759 }, { "epoch": 0.07, "learning_rate": 0.001989792142644533, "loss": 2.7387, "step": 2760 }, { "epoch": 0.07, "learning_rate": 0.0019897797342025825, "loss": 2.8184, "step": 2761 }, { "epoch": 0.07, "learning_rate": 0.001989767318262238, "loss": 2.8469, "step": 2762 }, { "epoch": 0.07, "learning_rate": 0.001989754894823593, "loss": 2.7536, "step": 2763 }, { "epoch": 0.07, "learning_rate": 0.001989742463886742, "loss": 2.7275, "step": 2764 }, { "epoch": 0.07, "learning_rate": 0.001989730025451779, "loss": 2.6503, "step": 2765 }, { "epoch": 0.07, "learning_rate": 0.001989717579518798, "loss": 2.4242, "step": 2766 }, { "epoch": 0.07, "learning_rate": 0.001989705126087894, "loss": 2.7292, "step": 2767 }, { "epoch": 0.07, "learning_rate": 0.0019896926651591608, "loss": 2.5088, "step": 2768 }, { "epoch": 0.07, "learning_rate": 0.001989680196732693, "loss": 2.6689, "step": 2769 }, { "epoch": 0.07, "learning_rate": 0.0019896677208085848, "loss": 2.9622, "step": 2770 }, { "epoch": 0.07, "learning_rate": 0.001989655237386931, "loss": 2.72, "step": 2771 }, { "epoch": 0.07, "learning_rate": 0.0019896427464678257, "loss": 2.942, "step": 2772 }, { "epoch": 0.07, "learning_rate": 0.001989630248051364, "loss": 2.8623, "step": 2773 }, { "epoch": 0.07, "learning_rate": 0.001989617742137641, "loss": 2.6909, "step": 2774 }, { "epoch": 0.07, "learning_rate": 0.0019896052287267504, "loss": 2.8876, "step": 2775 }, { "epoch": 0.07, "learning_rate": 0.0019895927078187876, "loss": 2.4981, "step": 2776 }, { "epoch": 0.07, "learning_rate": 0.0019895801794138474, "loss": 3.1517, "step": 2777 }, { "epoch": 0.07, "learning_rate": 0.0019895676435120247, "loss": 2.7657, "step": 2778 }, { "epoch": 0.07, "learning_rate": 0.0019895551001134146, "loss": 3.0194, "step": 2779 }, { "epoch": 0.07, "learning_rate": 0.001989542549218112, "loss": 2.7479, "step": 2780 }, { "epoch": 0.07, "learning_rate": 0.0019895299908262117, "loss": 3.0963, "step": 2781 }, { "epoch": 0.07, "learning_rate": 0.001989517424937809, "loss": 2.581, "step": 2782 }, { "epoch": 0.07, "learning_rate": 0.0019895048515529996, "loss": 2.978, "step": 2783 }, { "epoch": 0.07, "learning_rate": 0.001989492270671878, "loss": 2.8225, "step": 2784 }, { "epoch": 0.07, "learning_rate": 0.00198947968229454, "loss": 2.788, "step": 2785 }, { "epoch": 0.07, "learning_rate": 0.0019894670864210808, "loss": 2.7111, "step": 2786 }, { "epoch": 0.07, "learning_rate": 0.001989454483051596, "loss": 2.7948, "step": 2787 }, { "epoch": 0.07, "learning_rate": 0.0019894418721861807, "loss": 2.6424, "step": 2788 }, { "epoch": 0.07, "learning_rate": 0.0019894292538249307, "loss": 2.8414, "step": 2789 }, { "epoch": 0.07, "learning_rate": 0.001989416627967942, "loss": 2.4936, "step": 2790 }, { "epoch": 0.08, "learning_rate": 0.001989403994615309, "loss": 2.3924, "step": 2791 }, { "epoch": 0.08, "learning_rate": 0.001989391353767129, "loss": 2.6711, "step": 2792 }, { "epoch": 0.08, "learning_rate": 0.0019893787054234965, "loss": 2.9035, "step": 2793 }, { "epoch": 0.08, "learning_rate": 0.001989366049584508, "loss": 2.4674, "step": 2794 }, { "epoch": 0.08, "learning_rate": 0.0019893533862502593, "loss": 2.8609, "step": 2795 }, { "epoch": 0.08, "learning_rate": 0.001989340715420846, "loss": 2.7279, "step": 2796 }, { "epoch": 0.08, "learning_rate": 0.001989328037096365, "loss": 2.9319, "step": 2797 }, { "epoch": 0.08, "learning_rate": 0.0019893153512769105, "loss": 2.5231, "step": 2798 }, { "epoch": 0.08, "learning_rate": 0.0019893026579625808, "loss": 2.8411, "step": 2799 }, { "epoch": 0.08, "learning_rate": 0.00198928995715347, "loss": 2.8127, "step": 2800 }, { "epoch": 0.08, "learning_rate": 0.0019892772488496763, "loss": 3.246, "step": 2801 }, { "epoch": 0.08, "learning_rate": 0.0019892645330512946, "loss": 2.8751, "step": 2802 }, { "epoch": 0.08, "learning_rate": 0.001989251809758422, "loss": 2.7665, "step": 2803 }, { "epoch": 0.08, "learning_rate": 0.001989239078971154, "loss": 2.5315, "step": 2804 }, { "epoch": 0.08, "learning_rate": 0.0019892263406895883, "loss": 3.0494, "step": 2805 }, { "epoch": 0.08, "learning_rate": 0.00198921359491382, "loss": 2.775, "step": 2806 }, { "epoch": 0.08, "learning_rate": 0.001989200841643947, "loss": 2.1395, "step": 2807 }, { "epoch": 0.08, "learning_rate": 0.0019891880808800646, "loss": 2.8185, "step": 2808 }, { "epoch": 0.08, "learning_rate": 0.0019891753126222707, "loss": 2.798, "step": 2809 }, { "epoch": 0.08, "learning_rate": 0.0019891625368706613, "loss": 2.6214, "step": 2810 }, { "epoch": 0.08, "learning_rate": 0.001989149753625333, "loss": 3.5874, "step": 2811 }, { "epoch": 0.08, "learning_rate": 0.0019891369628863833, "loss": 2.5696, "step": 2812 }, { "epoch": 0.08, "learning_rate": 0.001989124164653909, "loss": 3.2755, "step": 2813 }, { "epoch": 0.08, "learning_rate": 0.0019891113589280067, "loss": 2.7363, "step": 2814 }, { "epoch": 0.08, "learning_rate": 0.0019890985457087737, "loss": 2.5827, "step": 2815 }, { "epoch": 0.08, "learning_rate": 0.0019890857249963067, "loss": 2.7889, "step": 2816 }, { "epoch": 0.08, "learning_rate": 0.001989072896790703, "loss": 2.7777, "step": 2817 }, { "epoch": 0.08, "learning_rate": 0.00198906006109206, "loss": 2.4255, "step": 2818 }, { "epoch": 0.08, "learning_rate": 0.0019890472179004753, "loss": 2.9073, "step": 2819 }, { "epoch": 0.08, "learning_rate": 0.0019890343672160455, "loss": 2.6014, "step": 2820 }, { "epoch": 0.08, "learning_rate": 0.0019890215090388676, "loss": 2.9305, "step": 2821 }, { "epoch": 0.08, "learning_rate": 0.00198900864336904, "loss": 2.7577, "step": 2822 }, { "epoch": 0.08, "learning_rate": 0.00198899577020666, "loss": 3.0702, "step": 2823 }, { "epoch": 0.08, "learning_rate": 0.0019889828895518244, "loss": 2.4536, "step": 2824 }, { "epoch": 0.08, "learning_rate": 0.0019889700014046312, "loss": 2.7966, "step": 2825 }, { "epoch": 0.08, "learning_rate": 0.0019889571057651783, "loss": 2.6012, "step": 2826 }, { "epoch": 0.08, "learning_rate": 0.001988944202633563, "loss": 2.2595, "step": 2827 }, { "epoch": 0.08, "learning_rate": 0.0019889312920098835, "loss": 2.9948, "step": 2828 }, { "epoch": 0.08, "learning_rate": 0.0019889183738942373, "loss": 2.6273, "step": 2829 }, { "epoch": 0.08, "learning_rate": 0.001988905448286722, "loss": 2.5316, "step": 2830 }, { "epoch": 0.08, "learning_rate": 0.001988892515187436, "loss": 3.2144, "step": 2831 }, { "epoch": 0.08, "learning_rate": 0.001988879574596477, "loss": 3.089, "step": 2832 }, { "epoch": 0.08, "learning_rate": 0.0019888666265139433, "loss": 2.8662, "step": 2833 }, { "epoch": 0.08, "learning_rate": 0.0019888536709399326, "loss": 2.6833, "step": 2834 }, { "epoch": 0.08, "learning_rate": 0.0019888407078745437, "loss": 2.3494, "step": 2835 }, { "epoch": 0.08, "learning_rate": 0.001988827737317874, "loss": 2.8778, "step": 2836 }, { "epoch": 0.08, "learning_rate": 0.0019888147592700225, "loss": 3.0749, "step": 2837 }, { "epoch": 0.08, "learning_rate": 0.0019888017737310867, "loss": 2.8441, "step": 2838 }, { "epoch": 0.08, "learning_rate": 0.001988788780701166, "loss": 2.6206, "step": 2839 }, { "epoch": 0.08, "learning_rate": 0.0019887757801803577, "loss": 2.6561, "step": 2840 }, { "epoch": 0.08, "learning_rate": 0.0019887627721687615, "loss": 2.7009, "step": 2841 }, { "epoch": 0.08, "learning_rate": 0.001988749756666475, "loss": 2.9904, "step": 2842 }, { "epoch": 0.08, "learning_rate": 0.0019887367336735968, "loss": 2.8457, "step": 2843 }, { "epoch": 0.08, "learning_rate": 0.0019887237031902265, "loss": 2.819, "step": 2844 }, { "epoch": 0.08, "learning_rate": 0.0019887106652164616, "loss": 2.6706, "step": 2845 }, { "epoch": 0.08, "learning_rate": 0.0019886976197524015, "loss": 3.099, "step": 2846 }, { "epoch": 0.08, "learning_rate": 0.0019886845667981454, "loss": 2.4947, "step": 2847 }, { "epoch": 0.08, "learning_rate": 0.0019886715063537914, "loss": 2.7562, "step": 2848 }, { "epoch": 0.08, "learning_rate": 0.001988658438419439, "loss": 2.6852, "step": 2849 }, { "epoch": 0.08, "learning_rate": 0.001988645362995187, "loss": 2.4696, "step": 2850 }, { "epoch": 0.08, "learning_rate": 0.0019886322800811347, "loss": 2.7842, "step": 2851 }, { "epoch": 0.08, "learning_rate": 0.001988619189677381, "loss": 2.8984, "step": 2852 }, { "epoch": 0.08, "learning_rate": 0.001988606091784025, "loss": 2.5783, "step": 2853 }, { "epoch": 0.08, "learning_rate": 0.0019885929864011656, "loss": 2.7337, "step": 2854 }, { "epoch": 0.08, "learning_rate": 0.0019885798735289027, "loss": 2.7302, "step": 2855 }, { "epoch": 0.08, "learning_rate": 0.0019885667531673356, "loss": 2.6883, "step": 2856 }, { "epoch": 0.08, "learning_rate": 0.0019885536253165634, "loss": 2.7787, "step": 2857 }, { "epoch": 0.08, "learning_rate": 0.0019885404899766855, "loss": 2.9072, "step": 2858 }, { "epoch": 0.08, "learning_rate": 0.0019885273471478017, "loss": 2.5685, "step": 2859 }, { "epoch": 0.08, "learning_rate": 0.0019885141968300117, "loss": 2.3788, "step": 2860 }, { "epoch": 0.08, "learning_rate": 0.0019885010390234144, "loss": 2.5705, "step": 2861 }, { "epoch": 0.08, "learning_rate": 0.0019884878737281104, "loss": 2.7068, "step": 2862 }, { "epoch": 0.08, "learning_rate": 0.001988474700944199, "loss": 2.4118, "step": 2863 }, { "epoch": 0.08, "learning_rate": 0.0019884615206717795, "loss": 2.8264, "step": 2864 }, { "epoch": 0.08, "learning_rate": 0.0019884483329109526, "loss": 2.5034, "step": 2865 }, { "epoch": 0.08, "learning_rate": 0.001988435137661818, "loss": 2.5058, "step": 2866 }, { "epoch": 0.08, "learning_rate": 0.001988421934924475, "loss": 2.7777, "step": 2867 }, { "epoch": 0.08, "learning_rate": 0.0019884087246990244, "loss": 2.6565, "step": 2868 }, { "epoch": 0.08, "learning_rate": 0.001988395506985566, "loss": 2.522, "step": 2869 }, { "epoch": 0.08, "learning_rate": 0.0019883822817842, "loss": 2.6565, "step": 2870 }, { "epoch": 0.08, "learning_rate": 0.001988369049095027, "loss": 2.9114, "step": 2871 }, { "epoch": 0.08, "learning_rate": 0.0019883558089181463, "loss": 2.5882, "step": 2872 }, { "epoch": 0.08, "learning_rate": 0.0019883425612536587, "loss": 2.6271, "step": 2873 }, { "epoch": 0.08, "learning_rate": 0.0019883293061016645, "loss": 2.5741, "step": 2874 }, { "epoch": 0.08, "learning_rate": 0.001988316043462264, "loss": 2.9017, "step": 2875 }, { "epoch": 0.08, "learning_rate": 0.0019883027733355583, "loss": 2.6242, "step": 2876 }, { "epoch": 0.08, "learning_rate": 0.001988289495721647, "loss": 2.7005, "step": 2877 }, { "epoch": 0.08, "learning_rate": 0.0019882762106206314, "loss": 3.0436, "step": 2878 }, { "epoch": 0.08, "learning_rate": 0.0019882629180326124, "loss": 2.6246, "step": 2879 }, { "epoch": 0.08, "learning_rate": 0.0019882496179576895, "loss": 2.9032, "step": 2880 }, { "epoch": 0.08, "learning_rate": 0.0019882363103959646, "loss": 2.5289, "step": 2881 }, { "epoch": 0.08, "learning_rate": 0.0019882229953475383, "loss": 2.5381, "step": 2882 }, { "epoch": 0.08, "learning_rate": 0.0019882096728125105, "loss": 3.0708, "step": 2883 }, { "epoch": 0.08, "learning_rate": 0.0019881963427909833, "loss": 2.6122, "step": 2884 }, { "epoch": 0.08, "learning_rate": 0.0019881830052830575, "loss": 2.7637, "step": 2885 }, { "epoch": 0.08, "learning_rate": 0.0019881696602888333, "loss": 2.7644, "step": 2886 }, { "epoch": 0.08, "learning_rate": 0.001988156307808413, "loss": 2.6078, "step": 2887 }, { "epoch": 0.08, "learning_rate": 0.0019881429478418975, "loss": 2.9701, "step": 2888 }, { "epoch": 0.08, "learning_rate": 0.0019881295803893867, "loss": 2.6238, "step": 2889 }, { "epoch": 0.08, "learning_rate": 0.0019881162054509838, "loss": 2.7699, "step": 2890 }, { "epoch": 0.08, "learning_rate": 0.0019881028230267885, "loss": 2.3926, "step": 2891 }, { "epoch": 0.08, "learning_rate": 0.001988089433116903, "loss": 2.7217, "step": 2892 }, { "epoch": 0.08, "learning_rate": 0.001988076035721429, "loss": 2.7389, "step": 2893 }, { "epoch": 0.08, "learning_rate": 0.001988062630840467, "loss": 3.0066, "step": 2894 }, { "epoch": 0.08, "learning_rate": 0.00198804921847412, "loss": 3.0485, "step": 2895 }, { "epoch": 0.08, "learning_rate": 0.001988035798622488, "loss": 2.8545, "step": 2896 }, { "epoch": 0.08, "learning_rate": 0.001988022371285674, "loss": 3.1423, "step": 2897 }, { "epoch": 0.08, "learning_rate": 0.0019880089364637784, "loss": 3.084, "step": 2898 }, { "epoch": 0.08, "learning_rate": 0.0019879954941569044, "loss": 2.9145, "step": 2899 }, { "epoch": 0.08, "learning_rate": 0.0019879820443651527, "loss": 2.8645, "step": 2900 }, { "epoch": 0.08, "learning_rate": 0.001987968587088626, "loss": 2.3823, "step": 2901 }, { "epoch": 0.08, "learning_rate": 0.001987955122327426, "loss": 2.9236, "step": 2902 }, { "epoch": 0.08, "learning_rate": 0.0019879416500816543, "loss": 2.6472, "step": 2903 }, { "epoch": 0.08, "learning_rate": 0.0019879281703514134, "loss": 3.1021, "step": 2904 }, { "epoch": 0.08, "learning_rate": 0.0019879146831368053, "loss": 2.8814, "step": 2905 }, { "epoch": 0.08, "learning_rate": 0.001987901188437932, "loss": 3.1223, "step": 2906 }, { "epoch": 0.08, "learning_rate": 0.0019878876862548965, "loss": 3.1306, "step": 2907 }, { "epoch": 0.08, "learning_rate": 0.0019878741765878, "loss": 3.1467, "step": 2908 }, { "epoch": 0.08, "learning_rate": 0.001987860659436746, "loss": 2.5052, "step": 2909 }, { "epoch": 0.08, "learning_rate": 0.0019878471348018355, "loss": 2.8436, "step": 2910 }, { "epoch": 0.08, "learning_rate": 0.001987833602683172, "loss": 2.8273, "step": 2911 }, { "epoch": 0.08, "learning_rate": 0.0019878200630808578, "loss": 2.7166, "step": 2912 }, { "epoch": 0.08, "learning_rate": 0.0019878065159949954, "loss": 2.7489, "step": 2913 }, { "epoch": 0.08, "learning_rate": 0.0019877929614256873, "loss": 2.5609, "step": 2914 }, { "epoch": 0.08, "learning_rate": 0.0019877793993730362, "loss": 2.8874, "step": 2915 }, { "epoch": 0.08, "learning_rate": 0.0019877658298371455, "loss": 2.7291, "step": 2916 }, { "epoch": 0.08, "learning_rate": 0.0019877522528181173, "loss": 3.0102, "step": 2917 }, { "epoch": 0.08, "learning_rate": 0.001987738668316054, "loss": 2.8946, "step": 2918 }, { "epoch": 0.08, "learning_rate": 0.00198772507633106, "loss": 2.7518, "step": 2919 }, { "epoch": 0.08, "learning_rate": 0.001987711476863237, "loss": 2.7228, "step": 2920 }, { "epoch": 0.08, "learning_rate": 0.0019876978699126884, "loss": 2.8611, "step": 2921 }, { "epoch": 0.08, "learning_rate": 0.0019876842554795173, "loss": 2.9719, "step": 2922 }, { "epoch": 0.08, "learning_rate": 0.001987670633563827, "loss": 2.727, "step": 2923 }, { "epoch": 0.08, "learning_rate": 0.00198765700416572, "loss": 2.9431, "step": 2924 }, { "epoch": 0.08, "learning_rate": 0.001987643367285301, "loss": 2.6952, "step": 2925 }, { "epoch": 0.08, "learning_rate": 0.001987629722922672, "loss": 2.7802, "step": 2926 }, { "epoch": 0.08, "learning_rate": 0.001987616071077937, "loss": 2.7658, "step": 2927 }, { "epoch": 0.08, "learning_rate": 0.001987602411751199, "loss": 2.6716, "step": 2928 }, { "epoch": 0.08, "learning_rate": 0.0019875887449425614, "loss": 2.9007, "step": 2929 }, { "epoch": 0.08, "learning_rate": 0.001987575070652129, "loss": 2.435, "step": 2930 }, { "epoch": 0.08, "learning_rate": 0.0019875613888800034, "loss": 3.0166, "step": 2931 }, { "epoch": 0.08, "learning_rate": 0.0019875476996262897, "loss": 2.7487, "step": 2932 }, { "epoch": 0.08, "learning_rate": 0.001987534002891091, "loss": 2.6346, "step": 2933 }, { "epoch": 0.08, "learning_rate": 0.0019875202986745113, "loss": 2.9987, "step": 2934 }, { "epoch": 0.08, "learning_rate": 0.0019875065869766548, "loss": 2.866, "step": 2935 }, { "epoch": 0.08, "learning_rate": 0.0019874928677976245, "loss": 2.6547, "step": 2936 }, { "epoch": 0.08, "learning_rate": 0.0019874791411375247, "loss": 3.0641, "step": 2937 }, { "epoch": 0.08, "learning_rate": 0.00198746540699646, "loss": 2.7397, "step": 2938 }, { "epoch": 0.08, "learning_rate": 0.0019874516653745336, "loss": 2.5184, "step": 2939 }, { "epoch": 0.08, "learning_rate": 0.00198743791627185, "loss": 3.2821, "step": 2940 }, { "epoch": 0.08, "learning_rate": 0.001987424159688513, "loss": 2.7914, "step": 2941 }, { "epoch": 0.08, "learning_rate": 0.001987410395624627, "loss": 2.6558, "step": 2942 }, { "epoch": 0.08, "learning_rate": 0.0019873966240802968, "loss": 2.6303, "step": 2943 }, { "epoch": 0.08, "learning_rate": 0.0019873828450556264, "loss": 3.1004, "step": 2944 }, { "epoch": 0.08, "learning_rate": 0.0019873690585507195, "loss": 2.6741, "step": 2945 }, { "epoch": 0.08, "learning_rate": 0.001987355264565682, "loss": 2.7321, "step": 2946 }, { "epoch": 0.08, "learning_rate": 0.001987341463100617, "loss": 2.6417, "step": 2947 }, { "epoch": 0.08, "learning_rate": 0.0019873276541556295, "loss": 2.6997, "step": 2948 }, { "epoch": 0.08, "learning_rate": 0.001987313837730824, "loss": 2.8752, "step": 2949 }, { "epoch": 0.08, "learning_rate": 0.001987300013826306, "loss": 2.7777, "step": 2950 }, { "epoch": 0.08, "learning_rate": 0.0019872861824421794, "loss": 2.661, "step": 2951 }, { "epoch": 0.08, "learning_rate": 0.0019872723435785493, "loss": 3.0702, "step": 2952 }, { "epoch": 0.08, "learning_rate": 0.00198725849723552, "loss": 2.5825, "step": 2953 }, { "epoch": 0.08, "learning_rate": 0.0019872446434131973, "loss": 3.0059, "step": 2954 }, { "epoch": 0.08, "learning_rate": 0.0019872307821116853, "loss": 3.0523, "step": 2955 }, { "epoch": 0.08, "learning_rate": 0.0019872169133310896, "loss": 2.902, "step": 2956 }, { "epoch": 0.08, "learning_rate": 0.001987203037071515, "loss": 2.499, "step": 2957 }, { "epoch": 0.08, "learning_rate": 0.0019871891533330666, "loss": 2.6254, "step": 2958 }, { "epoch": 0.08, "learning_rate": 0.00198717526211585, "loss": 2.6103, "step": 2959 }, { "epoch": 0.08, "learning_rate": 0.0019871613634199698, "loss": 2.4858, "step": 2960 }, { "epoch": 0.08, "learning_rate": 0.001987147457245532, "loss": 2.9162, "step": 2961 }, { "epoch": 0.08, "learning_rate": 0.001987133543592641, "loss": 2.7841, "step": 2962 }, { "epoch": 0.08, "learning_rate": 0.001987119622461403, "loss": 2.8705, "step": 2963 }, { "epoch": 0.08, "learning_rate": 0.0019871056938519233, "loss": 3.1863, "step": 2964 }, { "epoch": 0.08, "learning_rate": 0.0019870917577643073, "loss": 2.8813, "step": 2965 }, { "epoch": 0.08, "learning_rate": 0.0019870778141986606, "loss": 2.0838, "step": 2966 }, { "epoch": 0.08, "learning_rate": 0.001987063863155089, "loss": 2.6788, "step": 2967 }, { "epoch": 0.08, "learning_rate": 0.0019870499046336977, "loss": 2.9141, "step": 2968 }, { "epoch": 0.08, "learning_rate": 0.001987035938634593, "loss": 2.6134, "step": 2969 }, { "epoch": 0.08, "learning_rate": 0.00198702196515788, "loss": 2.9214, "step": 2970 }, { "epoch": 0.08, "learning_rate": 0.001987007984203666, "loss": 2.5786, "step": 2971 }, { "epoch": 0.08, "learning_rate": 0.0019869939957720554, "loss": 2.5522, "step": 2972 }, { "epoch": 0.08, "learning_rate": 0.0019869799998631548, "loss": 2.3629, "step": 2973 }, { "epoch": 0.08, "learning_rate": 0.0019869659964770704, "loss": 2.696, "step": 2974 }, { "epoch": 0.08, "learning_rate": 0.0019869519856139076, "loss": 2.5186, "step": 2975 }, { "epoch": 0.08, "learning_rate": 0.0019869379672737735, "loss": 2.635, "step": 2976 }, { "epoch": 0.08, "learning_rate": 0.0019869239414567735, "loss": 2.7861, "step": 2977 }, { "epoch": 0.08, "learning_rate": 0.0019869099081630142, "loss": 2.6495, "step": 2978 }, { "epoch": 0.08, "learning_rate": 0.001986895867392602, "loss": 2.6977, "step": 2979 }, { "epoch": 0.08, "learning_rate": 0.001986881819145643, "loss": 2.7166, "step": 2980 }, { "epoch": 0.08, "learning_rate": 0.001986867763422244, "loss": 2.5018, "step": 2981 }, { "epoch": 0.08, "learning_rate": 0.0019868537002225113, "loss": 2.8813, "step": 2982 }, { "epoch": 0.08, "learning_rate": 0.0019868396295465505, "loss": 2.989, "step": 2983 }, { "epoch": 0.08, "learning_rate": 0.0019868255513944702, "loss": 2.8364, "step": 2984 }, { "epoch": 0.08, "learning_rate": 0.0019868114657663758, "loss": 2.778, "step": 2985 }, { "epoch": 0.08, "learning_rate": 0.0019867973726623734, "loss": 2.7603, "step": 2986 }, { "epoch": 0.08, "learning_rate": 0.0019867832720825715, "loss": 2.9444, "step": 2987 }, { "epoch": 0.08, "learning_rate": 0.001986769164027075, "loss": 3.1911, "step": 2988 }, { "epoch": 0.08, "learning_rate": 0.0019867550484959926, "loss": 2.8971, "step": 2989 }, { "epoch": 0.08, "learning_rate": 0.00198674092548943, "loss": 2.6404, "step": 2990 }, { "epoch": 0.08, "learning_rate": 0.0019867267950074946, "loss": 2.8054, "step": 2991 }, { "epoch": 0.08, "learning_rate": 0.0019867126570502934, "loss": 3.0017, "step": 2992 }, { "epoch": 0.08, "learning_rate": 0.0019866985116179336, "loss": 2.516, "step": 2993 }, { "epoch": 0.08, "learning_rate": 0.001986684358710522, "loss": 2.9514, "step": 2994 }, { "epoch": 0.08, "learning_rate": 0.0019866701983281662, "loss": 3.245, "step": 2995 }, { "epoch": 0.08, "learning_rate": 0.0019866560304709737, "loss": 2.4613, "step": 2996 }, { "epoch": 0.08, "learning_rate": 0.001986641855139051, "loss": 2.7398, "step": 2997 }, { "epoch": 0.08, "learning_rate": 0.0019866276723325064, "loss": 3.3608, "step": 2998 }, { "epoch": 0.08, "learning_rate": 0.001986613482051447, "loss": 2.6496, "step": 2999 }, { "epoch": 0.08, "learning_rate": 0.00198659928429598, "loss": 2.4333, "step": 3000 }, { "epoch": 0.08, "learning_rate": 0.001986585079066213, "loss": 3.0385, "step": 3001 }, { "epoch": 0.08, "learning_rate": 0.0019865708663622545, "loss": 2.7408, "step": 3002 }, { "epoch": 0.08, "learning_rate": 0.0019865566461842107, "loss": 2.4736, "step": 3003 }, { "epoch": 0.08, "learning_rate": 0.0019865424185321907, "loss": 2.7467, "step": 3004 }, { "epoch": 0.08, "learning_rate": 0.0019865281834063014, "loss": 2.6145, "step": 3005 }, { "epoch": 0.08, "learning_rate": 0.0019865139408066514, "loss": 2.9192, "step": 3006 }, { "epoch": 0.08, "learning_rate": 0.0019864996907333478, "loss": 2.6739, "step": 3007 }, { "epoch": 0.08, "learning_rate": 0.001986485433186499, "loss": 2.3999, "step": 3008 }, { "epoch": 0.08, "learning_rate": 0.001986471168166213, "loss": 2.6195, "step": 3009 }, { "epoch": 0.08, "learning_rate": 0.0019864568956725974, "loss": 2.6811, "step": 3010 }, { "epoch": 0.08, "learning_rate": 0.001986442615705761, "loss": 2.4927, "step": 3011 }, { "epoch": 0.08, "learning_rate": 0.001986428328265812, "loss": 2.8333, "step": 3012 }, { "epoch": 0.08, "learning_rate": 0.001986414033352858, "loss": 2.5285, "step": 3013 }, { "epoch": 0.08, "learning_rate": 0.0019863997309670076, "loss": 3.0128, "step": 3014 }, { "epoch": 0.08, "learning_rate": 0.0019863854211083693, "loss": 2.727, "step": 3015 }, { "epoch": 0.08, "learning_rate": 0.001986371103777051, "loss": 2.9001, "step": 3016 }, { "epoch": 0.08, "learning_rate": 0.0019863567789731623, "loss": 2.9272, "step": 3017 }, { "epoch": 0.08, "learning_rate": 0.0019863424466968105, "loss": 2.8418, "step": 3018 }, { "epoch": 0.08, "learning_rate": 0.0019863281069481048, "loss": 2.7145, "step": 3019 }, { "epoch": 0.08, "learning_rate": 0.0019863137597271536, "loss": 2.7834, "step": 3020 }, { "epoch": 0.08, "learning_rate": 0.0019862994050340657, "loss": 2.7786, "step": 3021 }, { "epoch": 0.08, "learning_rate": 0.00198628504286895, "loss": 2.4697, "step": 3022 }, { "epoch": 0.08, "learning_rate": 0.001986270673231915, "loss": 3.0152, "step": 3023 }, { "epoch": 0.08, "learning_rate": 0.00198625629612307, "loss": 2.4417, "step": 3024 }, { "epoch": 0.08, "learning_rate": 0.0019862419115425235, "loss": 3.1568, "step": 3025 }, { "epoch": 0.08, "learning_rate": 0.0019862275194903844, "loss": 2.7748, "step": 3026 }, { "epoch": 0.08, "learning_rate": 0.001986213119966762, "loss": 2.7203, "step": 3027 }, { "epoch": 0.08, "learning_rate": 0.001986198712971765, "loss": 2.3845, "step": 3028 }, { "epoch": 0.08, "learning_rate": 0.0019861842985055035, "loss": 2.8839, "step": 3029 }, { "epoch": 0.08, "learning_rate": 0.001986169876568086, "loss": 2.5963, "step": 3030 }, { "epoch": 0.08, "learning_rate": 0.0019861554471596217, "loss": 2.4533, "step": 3031 }, { "epoch": 0.08, "learning_rate": 0.0019861410102802197, "loss": 2.9978, "step": 3032 }, { "epoch": 0.08, "learning_rate": 0.00198612656592999, "loss": 2.4822, "step": 3033 }, { "epoch": 0.08, "learning_rate": 0.0019861121141090416, "loss": 3.0459, "step": 3034 }, { "epoch": 0.08, "learning_rate": 0.0019860976548174846, "loss": 2.8561, "step": 3035 }, { "epoch": 0.08, "learning_rate": 0.0019860831880554276, "loss": 2.7049, "step": 3036 }, { "epoch": 0.08, "learning_rate": 0.001986068713822981, "loss": 2.6777, "step": 3037 }, { "epoch": 0.08, "learning_rate": 0.0019860542321202537, "loss": 2.9288, "step": 3038 }, { "epoch": 0.08, "learning_rate": 0.001986039742947356, "loss": 2.8626, "step": 3039 }, { "epoch": 0.08, "learning_rate": 0.0019860252463043977, "loss": 2.9323, "step": 3040 }, { "epoch": 0.08, "learning_rate": 0.0019860107421914882, "loss": 2.9443, "step": 3041 }, { "epoch": 0.08, "learning_rate": 0.0019859962306087373, "loss": 2.5958, "step": 3042 }, { "epoch": 0.08, "learning_rate": 0.0019859817115562557, "loss": 2.8108, "step": 3043 }, { "epoch": 0.08, "learning_rate": 0.001985967185034153, "loss": 3.182, "step": 3044 }, { "epoch": 0.08, "learning_rate": 0.001985952651042539, "loss": 2.6583, "step": 3045 }, { "epoch": 0.08, "learning_rate": 0.0019859381095815236, "loss": 2.752, "step": 3046 }, { "epoch": 0.08, "learning_rate": 0.001985923560651218, "loss": 3.127, "step": 3047 }, { "epoch": 0.08, "learning_rate": 0.0019859090042517315, "loss": 2.8359, "step": 3048 }, { "epoch": 0.08, "learning_rate": 0.0019858944403831746, "loss": 2.6486, "step": 3049 }, { "epoch": 0.08, "learning_rate": 0.0019858798690456573, "loss": 2.8271, "step": 3050 }, { "epoch": 0.08, "learning_rate": 0.001985865290239291, "loss": 2.5726, "step": 3051 }, { "epoch": 0.08, "learning_rate": 0.0019858507039641855, "loss": 2.6701, "step": 3052 }, { "epoch": 0.08, "learning_rate": 0.0019858361102204508, "loss": 2.5829, "step": 3053 }, { "epoch": 0.08, "learning_rate": 0.0019858215090081985, "loss": 2.8996, "step": 3054 }, { "epoch": 0.08, "learning_rate": 0.0019858069003275383, "loss": 2.6448, "step": 3055 }, { "epoch": 0.08, "learning_rate": 0.0019857922841785814, "loss": 2.5868, "step": 3056 }, { "epoch": 0.08, "learning_rate": 0.0019857776605614386, "loss": 2.5264, "step": 3057 }, { "epoch": 0.08, "learning_rate": 0.0019857630294762207, "loss": 2.4436, "step": 3058 }, { "epoch": 0.08, "learning_rate": 0.0019857483909230377, "loss": 2.7612, "step": 3059 }, { "epoch": 0.08, "learning_rate": 0.0019857337449020016, "loss": 3.0535, "step": 3060 }, { "epoch": 0.08, "learning_rate": 0.0019857190914132224, "loss": 2.6105, "step": 3061 }, { "epoch": 0.08, "learning_rate": 0.0019857044304568117, "loss": 2.6145, "step": 3062 }, { "epoch": 0.08, "learning_rate": 0.001985689762032881, "loss": 2.6153, "step": 3063 }, { "epoch": 0.08, "learning_rate": 0.0019856750861415406, "loss": 2.713, "step": 3064 }, { "epoch": 0.08, "learning_rate": 0.001985660402782902, "loss": 2.8504, "step": 3065 }, { "epoch": 0.08, "learning_rate": 0.001985645711957076, "loss": 2.6703, "step": 3066 }, { "epoch": 0.08, "learning_rate": 0.0019856310136641747, "loss": 2.6576, "step": 3067 }, { "epoch": 0.08, "learning_rate": 0.001985616307904309, "loss": 2.8902, "step": 3068 }, { "epoch": 0.08, "learning_rate": 0.00198560159467759, "loss": 2.671, "step": 3069 }, { "epoch": 0.08, "learning_rate": 0.00198558687398413, "loss": 2.7404, "step": 3070 }, { "epoch": 0.08, "learning_rate": 0.00198557214582404, "loss": 2.9236, "step": 3071 }, { "epoch": 0.08, "learning_rate": 0.001985557410197432, "loss": 2.3142, "step": 3072 }, { "epoch": 0.08, "learning_rate": 0.0019855426671044163, "loss": 2.8029, "step": 3073 }, { "epoch": 0.08, "learning_rate": 0.001985527916545106, "loss": 2.7918, "step": 3074 }, { "epoch": 0.08, "learning_rate": 0.0019855131585196123, "loss": 2.6981, "step": 3075 }, { "epoch": 0.08, "learning_rate": 0.0019854983930280476, "loss": 2.6374, "step": 3076 }, { "epoch": 0.08, "learning_rate": 0.001985483620070523, "loss": 2.7632, "step": 3077 }, { "epoch": 0.08, "learning_rate": 0.00198546883964715, "loss": 2.8038, "step": 3078 }, { "epoch": 0.08, "learning_rate": 0.001985454051758042, "loss": 3.0232, "step": 3079 }, { "epoch": 0.08, "learning_rate": 0.0019854392564033103, "loss": 2.7785, "step": 3080 }, { "epoch": 0.08, "learning_rate": 0.001985424453583067, "loss": 2.9041, "step": 3081 }, { "epoch": 0.08, "learning_rate": 0.0019854096432974236, "loss": 2.8702, "step": 3082 }, { "epoch": 0.08, "learning_rate": 0.0019853948255464937, "loss": 2.5608, "step": 3083 }, { "epoch": 0.08, "learning_rate": 0.001985380000330388, "loss": 2.8913, "step": 3084 }, { "epoch": 0.08, "learning_rate": 0.0019853651676492202, "loss": 2.8713, "step": 3085 }, { "epoch": 0.08, "learning_rate": 0.0019853503275031018, "loss": 2.5468, "step": 3086 }, { "epoch": 0.08, "learning_rate": 0.0019853354798921455, "loss": 2.6766, "step": 3087 }, { "epoch": 0.08, "learning_rate": 0.0019853206248164642, "loss": 2.9138, "step": 3088 }, { "epoch": 0.08, "learning_rate": 0.0019853057622761694, "loss": 2.975, "step": 3089 }, { "epoch": 0.08, "learning_rate": 0.0019852908922713746, "loss": 2.2874, "step": 3090 }, { "epoch": 0.08, "learning_rate": 0.001985276014802192, "loss": 2.4607, "step": 3091 }, { "epoch": 0.08, "learning_rate": 0.0019852611298687346, "loss": 3.1234, "step": 3092 }, { "epoch": 0.08, "learning_rate": 0.001985246237471115, "loss": 3.1766, "step": 3093 }, { "epoch": 0.08, "learning_rate": 0.001985231337609446, "loss": 2.4478, "step": 3094 }, { "epoch": 0.08, "learning_rate": 0.0019852164302838404, "loss": 3.147, "step": 3095 }, { "epoch": 0.08, "learning_rate": 0.0019852015154944117, "loss": 2.9804, "step": 3096 }, { "epoch": 0.08, "learning_rate": 0.001985186593241272, "loss": 2.5984, "step": 3097 }, { "epoch": 0.08, "learning_rate": 0.0019851716635245348, "loss": 2.8714, "step": 3098 }, { "epoch": 0.08, "learning_rate": 0.0019851567263443138, "loss": 2.5363, "step": 3099 }, { "epoch": 0.08, "learning_rate": 0.001985141781700721, "loss": 2.6408, "step": 3100 }, { "epoch": 0.08, "learning_rate": 0.0019851268295938704, "loss": 2.924, "step": 3101 }, { "epoch": 0.08, "learning_rate": 0.0019851118700238745, "loss": 2.9496, "step": 3102 }, { "epoch": 0.08, "learning_rate": 0.001985096902990848, "loss": 2.4336, "step": 3103 }, { "epoch": 0.08, "learning_rate": 0.001985081928494903, "loss": 3.064, "step": 3104 }, { "epoch": 0.08, "learning_rate": 0.001985066946536154, "loss": 2.5395, "step": 3105 }, { "epoch": 0.08, "learning_rate": 0.0019850519571147133, "loss": 3.0396, "step": 3106 }, { "epoch": 0.08, "learning_rate": 0.0019850369602306952, "loss": 2.9911, "step": 3107 }, { "epoch": 0.08, "learning_rate": 0.0019850219558842134, "loss": 2.8015, "step": 3108 }, { "epoch": 0.08, "learning_rate": 0.0019850069440753813, "loss": 2.3981, "step": 3109 }, { "epoch": 0.08, "learning_rate": 0.0019849919248043127, "loss": 2.9378, "step": 3110 }, { "epoch": 0.08, "learning_rate": 0.001984976898071121, "loss": 2.4132, "step": 3111 }, { "epoch": 0.08, "learning_rate": 0.0019849618638759212, "loss": 2.6146, "step": 3112 }, { "epoch": 0.08, "learning_rate": 0.001984946822218826, "loss": 3.1055, "step": 3113 }, { "epoch": 0.08, "learning_rate": 0.0019849317730999496, "loss": 2.7197, "step": 3114 }, { "epoch": 0.08, "learning_rate": 0.001984916716519406, "loss": 2.7076, "step": 3115 }, { "epoch": 0.08, "learning_rate": 0.00198490165247731, "loss": 2.5344, "step": 3116 }, { "epoch": 0.08, "learning_rate": 0.0019848865809737747, "loss": 2.7596, "step": 3117 }, { "epoch": 0.08, "learning_rate": 0.0019848715020089154, "loss": 2.9072, "step": 3118 }, { "epoch": 0.08, "learning_rate": 0.001984856415582845, "loss": 2.4471, "step": 3119 }, { "epoch": 0.08, "learning_rate": 0.001984841321695679, "loss": 2.7582, "step": 3120 }, { "epoch": 0.08, "learning_rate": 0.001984826220347531, "loss": 2.7769, "step": 3121 }, { "epoch": 0.08, "learning_rate": 0.0019848111115385154, "loss": 2.5729, "step": 3122 }, { "epoch": 0.08, "learning_rate": 0.001984795995268747, "loss": 2.8856, "step": 3123 }, { "epoch": 0.08, "learning_rate": 0.0019847808715383404, "loss": 2.5816, "step": 3124 }, { "epoch": 0.08, "learning_rate": 0.0019847657403474096, "loss": 2.7493, "step": 3125 }, { "epoch": 0.08, "learning_rate": 0.00198475060169607, "loss": 2.3946, "step": 3126 }, { "epoch": 0.08, "learning_rate": 0.0019847354555844357, "loss": 2.9251, "step": 3127 }, { "epoch": 0.08, "learning_rate": 0.0019847203020126217, "loss": 3.2267, "step": 3128 }, { "epoch": 0.08, "learning_rate": 0.0019847051409807425, "loss": 2.8226, "step": 3129 }, { "epoch": 0.08, "learning_rate": 0.0019846899724889136, "loss": 3.0373, "step": 3130 }, { "epoch": 0.08, "learning_rate": 0.0019846747965372494, "loss": 2.7633, "step": 3131 }, { "epoch": 0.08, "learning_rate": 0.001984659613125865, "loss": 2.7837, "step": 3132 }, { "epoch": 0.08, "learning_rate": 0.0019846444222548754, "loss": 3.1627, "step": 3133 }, { "epoch": 0.08, "learning_rate": 0.0019846292239243954, "loss": 2.8388, "step": 3134 }, { "epoch": 0.08, "learning_rate": 0.0019846140181345407, "loss": 2.8732, "step": 3135 }, { "epoch": 0.08, "learning_rate": 0.0019845988048854263, "loss": 2.6709, "step": 3136 }, { "epoch": 0.08, "learning_rate": 0.0019845835841771674, "loss": 2.7057, "step": 3137 }, { "epoch": 0.08, "learning_rate": 0.001984568356009879, "loss": 2.9987, "step": 3138 }, { "epoch": 0.08, "learning_rate": 0.001984553120383677, "loss": 2.5342, "step": 3139 }, { "epoch": 0.08, "learning_rate": 0.0019845378772986766, "loss": 2.4241, "step": 3140 }, { "epoch": 0.08, "learning_rate": 0.0019845226267549932, "loss": 2.4224, "step": 3141 }, { "epoch": 0.08, "learning_rate": 0.0019845073687527423, "loss": 2.6524, "step": 3142 }, { "epoch": 0.08, "learning_rate": 0.00198449210329204, "loss": 2.9251, "step": 3143 }, { "epoch": 0.08, "learning_rate": 0.001984476830373001, "loss": 2.7229, "step": 3144 }, { "epoch": 0.08, "learning_rate": 0.0019844615499957415, "loss": 2.7887, "step": 3145 }, { "epoch": 0.08, "learning_rate": 0.0019844462621603776, "loss": 2.5365, "step": 3146 }, { "epoch": 0.08, "learning_rate": 0.001984430966867025, "loss": 3.0048, "step": 3147 }, { "epoch": 0.08, "learning_rate": 0.001984415664115799, "loss": 2.3495, "step": 3148 }, { "epoch": 0.08, "learning_rate": 0.0019844003539068165, "loss": 2.9836, "step": 3149 }, { "epoch": 0.08, "learning_rate": 0.0019843850362401922, "loss": 2.5123, "step": 3150 }, { "epoch": 0.08, "learning_rate": 0.001984369711116043, "loss": 3.1922, "step": 3151 }, { "epoch": 0.08, "learning_rate": 0.0019843543785344852, "loss": 2.9745, "step": 3152 }, { "epoch": 0.08, "learning_rate": 0.0019843390384956345, "loss": 2.4245, "step": 3153 }, { "epoch": 0.08, "learning_rate": 0.001984323690999607, "loss": 2.4516, "step": 3154 }, { "epoch": 0.08, "learning_rate": 0.0019843083360465193, "loss": 2.8242, "step": 3155 }, { "epoch": 0.08, "learning_rate": 0.0019842929736364878, "loss": 2.7154, "step": 3156 }, { "epoch": 0.08, "learning_rate": 0.0019842776037696285, "loss": 3.111, "step": 3157 }, { "epoch": 0.08, "learning_rate": 0.001984262226446058, "loss": 2.5312, "step": 3158 }, { "epoch": 0.08, "learning_rate": 0.001984246841665893, "loss": 2.7269, "step": 3159 }, { "epoch": 0.08, "learning_rate": 0.0019842314494292503, "loss": 2.3548, "step": 3160 }, { "epoch": 0.08, "learning_rate": 0.0019842160497362455, "loss": 2.2298, "step": 3161 }, { "epoch": 0.08, "learning_rate": 0.001984200642586996, "loss": 2.3866, "step": 3162 }, { "epoch": 0.09, "learning_rate": 0.0019841852279816182, "loss": 3.0402, "step": 3163 }, { "epoch": 0.09, "learning_rate": 0.0019841698059202295, "loss": 2.909, "step": 3164 }, { "epoch": 0.09, "learning_rate": 0.001984154376402946, "loss": 2.8352, "step": 3165 }, { "epoch": 0.09, "learning_rate": 0.0019841389394298853, "loss": 2.7048, "step": 3166 }, { "epoch": 0.09, "learning_rate": 0.0019841234950011637, "loss": 2.3479, "step": 3167 }, { "epoch": 0.09, "learning_rate": 0.001984108043116898, "loss": 2.8509, "step": 3168 }, { "epoch": 0.09, "learning_rate": 0.001984092583777206, "loss": 3.0361, "step": 3169 }, { "epoch": 0.09, "learning_rate": 0.001984077116982205, "loss": 2.9621, "step": 3170 }, { "epoch": 0.09, "learning_rate": 0.0019840616427320113, "loss": 2.8804, "step": 3171 }, { "epoch": 0.09, "learning_rate": 0.0019840461610267424, "loss": 2.9393, "step": 3172 }, { "epoch": 0.09, "learning_rate": 0.001984030671866516, "loss": 2.5113, "step": 3173 }, { "epoch": 0.09, "learning_rate": 0.0019840151752514488, "loss": 2.5524, "step": 3174 }, { "epoch": 0.09, "learning_rate": 0.0019839996711816586, "loss": 2.2235, "step": 3175 }, { "epoch": 0.09, "learning_rate": 0.0019839841596572634, "loss": 2.7051, "step": 3176 }, { "epoch": 0.09, "learning_rate": 0.0019839686406783797, "loss": 2.5355, "step": 3177 }, { "epoch": 0.09, "learning_rate": 0.0019839531142451256, "loss": 2.525, "step": 3178 }, { "epoch": 0.09, "learning_rate": 0.001983937580357618, "loss": 2.6574, "step": 3179 }, { "epoch": 0.09, "learning_rate": 0.001983922039015976, "loss": 2.9399, "step": 3180 }, { "epoch": 0.09, "learning_rate": 0.0019839064902203163, "loss": 2.9693, "step": 3181 }, { "epoch": 0.09, "learning_rate": 0.001983890933970757, "loss": 2.9121, "step": 3182 }, { "epoch": 0.09, "learning_rate": 0.0019838753702674156, "loss": 2.7643, "step": 3183 }, { "epoch": 0.09, "learning_rate": 0.001983859799110411, "loss": 2.6685, "step": 3184 }, { "epoch": 0.09, "learning_rate": 0.0019838442204998595, "loss": 3.1738, "step": 3185 }, { "epoch": 0.09, "learning_rate": 0.0019838286344358805, "loss": 2.8256, "step": 3186 }, { "epoch": 0.09, "learning_rate": 0.0019838130409185915, "loss": 3.0464, "step": 3187 }, { "epoch": 0.09, "learning_rate": 0.001983797439948111, "loss": 2.7212, "step": 3188 }, { "epoch": 0.09, "learning_rate": 0.001983781831524557, "loss": 2.5597, "step": 3189 }, { "epoch": 0.09, "learning_rate": 0.001983766215648048, "loss": 3.3273, "step": 3190 }, { "epoch": 0.09, "learning_rate": 0.0019837505923187017, "loss": 3.0856, "step": 3191 }, { "epoch": 0.09, "learning_rate": 0.001983734961536637, "loss": 2.4911, "step": 3192 }, { "epoch": 0.09, "learning_rate": 0.0019837193233019717, "loss": 2.6949, "step": 3193 }, { "epoch": 0.09, "learning_rate": 0.001983703677614825, "loss": 2.6124, "step": 3194 }, { "epoch": 0.09, "learning_rate": 0.001983688024475315, "loss": 2.7491, "step": 3195 }, { "epoch": 0.09, "learning_rate": 0.00198367236388356, "loss": 2.675, "step": 3196 }, { "epoch": 0.09, "learning_rate": 0.0019836566958396796, "loss": 2.5752, "step": 3197 }, { "epoch": 0.09, "learning_rate": 0.001983641020343792, "loss": 2.4887, "step": 3198 }, { "epoch": 0.09, "learning_rate": 0.001983625337396016, "loss": 2.6742, "step": 3199 }, { "epoch": 0.09, "learning_rate": 0.0019836096469964697, "loss": 2.8457, "step": 3200 }, { "epoch": 0.09, "learning_rate": 0.0019835939491452724, "loss": 2.7456, "step": 3201 }, { "epoch": 0.09, "learning_rate": 0.001983578243842544, "loss": 2.757, "step": 3202 }, { "epoch": 0.09, "learning_rate": 0.0019835625310884023, "loss": 2.8483, "step": 3203 }, { "epoch": 0.09, "learning_rate": 0.0019835468108829668, "loss": 2.8057, "step": 3204 }, { "epoch": 0.09, "learning_rate": 0.001983531083226356, "loss": 2.4898, "step": 3205 }, { "epoch": 0.09, "learning_rate": 0.00198351534811869, "loss": 2.3579, "step": 3206 }, { "epoch": 0.09, "learning_rate": 0.0019834996055600874, "loss": 2.4222, "step": 3207 }, { "epoch": 0.09, "learning_rate": 0.001983483855550668, "loss": 2.8257, "step": 3208 }, { "epoch": 0.09, "learning_rate": 0.001983468098090551, "loss": 2.5827, "step": 3209 }, { "epoch": 0.09, "learning_rate": 0.0019834523331798545, "loss": 2.684, "step": 3210 }, { "epoch": 0.09, "learning_rate": 0.0019834365608186995, "loss": 2.5388, "step": 3211 }, { "epoch": 0.09, "learning_rate": 0.0019834207810072047, "loss": 2.5823, "step": 3212 }, { "epoch": 0.09, "learning_rate": 0.0019834049937454902, "loss": 2.6577, "step": 3213 }, { "epoch": 0.09, "learning_rate": 0.0019833891990336753, "loss": 2.4932, "step": 3214 }, { "epoch": 0.09, "learning_rate": 0.001983373396871879, "loss": 3.1635, "step": 3215 }, { "epoch": 0.09, "learning_rate": 0.0019833575872602225, "loss": 2.5628, "step": 3216 }, { "epoch": 0.09, "learning_rate": 0.0019833417701988244, "loss": 2.3764, "step": 3217 }, { "epoch": 0.09, "learning_rate": 0.0019833259456878047, "loss": 2.4986, "step": 3218 }, { "epoch": 0.09, "learning_rate": 0.0019833101137272835, "loss": 3.2759, "step": 3219 }, { "epoch": 0.09, "learning_rate": 0.001983294274317381, "loss": 2.4197, "step": 3220 }, { "epoch": 0.09, "learning_rate": 0.0019832784274582166, "loss": 2.6535, "step": 3221 }, { "epoch": 0.09, "learning_rate": 0.0019832625731499107, "loss": 2.8083, "step": 3222 }, { "epoch": 0.09, "learning_rate": 0.001983246711392583, "loss": 3.1389, "step": 3223 }, { "epoch": 0.09, "learning_rate": 0.0019832308421863544, "loss": 2.8146, "step": 3224 }, { "epoch": 0.09, "learning_rate": 0.0019832149655313446, "loss": 2.4175, "step": 3225 }, { "epoch": 0.09, "learning_rate": 0.001983199081427674, "loss": 2.7662, "step": 3226 }, { "epoch": 0.09, "learning_rate": 0.001983183189875463, "loss": 2.9258, "step": 3227 }, { "epoch": 0.09, "learning_rate": 0.0019831672908748317, "loss": 2.6847, "step": 3228 }, { "epoch": 0.09, "learning_rate": 0.001983151384425901, "loss": 2.8387, "step": 3229 }, { "epoch": 0.09, "learning_rate": 0.0019831354705287913, "loss": 2.4937, "step": 3230 }, { "epoch": 0.09, "learning_rate": 0.001983119549183623, "loss": 2.842, "step": 3231 }, { "epoch": 0.09, "learning_rate": 0.0019831036203905167, "loss": 2.7525, "step": 3232 }, { "epoch": 0.09, "learning_rate": 0.001983087684149593, "loss": 2.7739, "step": 3233 }, { "epoch": 0.09, "learning_rate": 0.001983071740460973, "loss": 2.6772, "step": 3234 }, { "epoch": 0.09, "learning_rate": 0.001983055789324777, "loss": 2.7599, "step": 3235 }, { "epoch": 0.09, "learning_rate": 0.001983039830741126, "loss": 3.0429, "step": 3236 }, { "epoch": 0.09, "learning_rate": 0.001983023864710141, "loss": 2.8746, "step": 3237 }, { "epoch": 0.09, "learning_rate": 0.001983007891231943, "loss": 2.7889, "step": 3238 }, { "epoch": 0.09, "learning_rate": 0.0019829919103066533, "loss": 2.6967, "step": 3239 }, { "epoch": 0.09, "learning_rate": 0.0019829759219343926, "loss": 3.0539, "step": 3240 }, { "epoch": 0.09, "learning_rate": 0.001982959926115282, "loss": 3.0869, "step": 3241 }, { "epoch": 0.09, "learning_rate": 0.0019829439228494423, "loss": 2.8999, "step": 3242 }, { "epoch": 0.09, "learning_rate": 0.0019829279121369955, "loss": 2.4848, "step": 3243 }, { "epoch": 0.09, "learning_rate": 0.0019829118939780625, "loss": 2.8246, "step": 3244 }, { "epoch": 0.09, "learning_rate": 0.001982895868372765, "loss": 2.7593, "step": 3245 }, { "epoch": 0.09, "learning_rate": 0.001982879835321224, "loss": 2.8724, "step": 3246 }, { "epoch": 0.09, "learning_rate": 0.0019828637948235608, "loss": 2.6888, "step": 3247 }, { "epoch": 0.09, "learning_rate": 0.001982847746879897, "loss": 3.2011, "step": 3248 }, { "epoch": 0.09, "learning_rate": 0.0019828316914903554, "loss": 2.9653, "step": 3249 }, { "epoch": 0.09, "learning_rate": 0.0019828156286550557, "loss": 2.9491, "step": 3250 }, { "epoch": 0.09, "learning_rate": 0.0019827995583741207, "loss": 2.9505, "step": 3251 }, { "epoch": 0.09, "learning_rate": 0.0019827834806476724, "loss": 2.4531, "step": 3252 }, { "epoch": 0.09, "learning_rate": 0.0019827673954758316, "loss": 2.6723, "step": 3253 }, { "epoch": 0.09, "learning_rate": 0.001982751302858721, "loss": 2.9306, "step": 3254 }, { "epoch": 0.09, "learning_rate": 0.001982735202796462, "loss": 2.7007, "step": 3255 }, { "epoch": 0.09, "learning_rate": 0.001982719095289177, "loss": 2.2714, "step": 3256 }, { "epoch": 0.09, "learning_rate": 0.0019827029803369876, "loss": 3.0146, "step": 3257 }, { "epoch": 0.09, "learning_rate": 0.0019826868579400168, "loss": 3.0711, "step": 3258 }, { "epoch": 0.09, "learning_rate": 0.001982670728098385, "loss": 2.8841, "step": 3259 }, { "epoch": 0.09, "learning_rate": 0.0019826545908122164, "loss": 2.9064, "step": 3260 }, { "epoch": 0.09, "learning_rate": 0.001982638446081632, "loss": 2.7641, "step": 3261 }, { "epoch": 0.09, "learning_rate": 0.0019826222939067543, "loss": 2.9979, "step": 3262 }, { "epoch": 0.09, "learning_rate": 0.0019826061342877056, "loss": 2.7216, "step": 3263 }, { "epoch": 0.09, "learning_rate": 0.001982589967224609, "loss": 2.7892, "step": 3264 }, { "epoch": 0.09, "learning_rate": 0.001982573792717586, "loss": 2.6405, "step": 3265 }, { "epoch": 0.09, "learning_rate": 0.00198255761076676, "loss": 2.4285, "step": 3266 }, { "epoch": 0.09, "learning_rate": 0.0019825414213722526, "loss": 2.6683, "step": 3267 }, { "epoch": 0.09, "learning_rate": 0.0019825252245341874, "loss": 2.4673, "step": 3268 }, { "epoch": 0.09, "learning_rate": 0.001982509020252687, "loss": 2.7101, "step": 3269 }, { "epoch": 0.09, "learning_rate": 0.0019824928085278738, "loss": 2.5893, "step": 3270 }, { "epoch": 0.09, "learning_rate": 0.0019824765893598707, "loss": 2.7796, "step": 3271 }, { "epoch": 0.09, "learning_rate": 0.0019824603627488003, "loss": 2.859, "step": 3272 }, { "epoch": 0.09, "learning_rate": 0.0019824441286947865, "loss": 2.6769, "step": 3273 }, { "epoch": 0.09, "learning_rate": 0.001982427887197951, "loss": 2.841, "step": 3274 }, { "epoch": 0.09, "learning_rate": 0.001982411638258418, "loss": 2.7941, "step": 3275 }, { "epoch": 0.09, "learning_rate": 0.0019823953818763097, "loss": 2.5291, "step": 3276 }, { "epoch": 0.09, "learning_rate": 0.0019823791180517496, "loss": 2.763, "step": 3277 }, { "epoch": 0.09, "learning_rate": 0.001982362846784861, "loss": 3.094, "step": 3278 }, { "epoch": 0.09, "learning_rate": 0.0019823465680757673, "loss": 2.9527, "step": 3279 }, { "epoch": 0.09, "learning_rate": 0.0019823302819245913, "loss": 2.529, "step": 3280 }, { "epoch": 0.09, "learning_rate": 0.001982313988331457, "loss": 3.1583, "step": 3281 }, { "epoch": 0.09, "learning_rate": 0.001982297687296487, "loss": 2.3654, "step": 3282 }, { "epoch": 0.09, "learning_rate": 0.001982281378819806, "loss": 2.7226, "step": 3283 }, { "epoch": 0.09, "learning_rate": 0.001982265062901537, "loss": 2.6362, "step": 3284 }, { "epoch": 0.09, "learning_rate": 0.0019822487395418026, "loss": 2.6429, "step": 3285 }, { "epoch": 0.09, "learning_rate": 0.0019822324087407283, "loss": 2.7752, "step": 3286 }, { "epoch": 0.09, "learning_rate": 0.0019822160704984363, "loss": 2.6511, "step": 3287 }, { "epoch": 0.09, "learning_rate": 0.0019821997248150513, "loss": 2.789, "step": 3288 }, { "epoch": 0.09, "learning_rate": 0.0019821833716906967, "loss": 2.9804, "step": 3289 }, { "epoch": 0.09, "learning_rate": 0.0019821670111254963, "loss": 2.6513, "step": 3290 }, { "epoch": 0.09, "learning_rate": 0.0019821506431195743, "loss": 2.7683, "step": 3291 }, { "epoch": 0.09, "learning_rate": 0.0019821342676730547, "loss": 2.7262, "step": 3292 }, { "epoch": 0.09, "learning_rate": 0.001982117884786061, "loss": 2.6071, "step": 3293 }, { "epoch": 0.09, "learning_rate": 0.0019821014944587188, "loss": 3.23, "step": 3294 }, { "epoch": 0.09, "learning_rate": 0.0019820850966911505, "loss": 2.4432, "step": 3295 }, { "epoch": 0.09, "learning_rate": 0.001982068691483481, "loss": 2.5384, "step": 3296 }, { "epoch": 0.09, "learning_rate": 0.001982052278835835, "loss": 2.9122, "step": 3297 }, { "epoch": 0.09, "learning_rate": 0.0019820358587483364, "loss": 3.2067, "step": 3298 }, { "epoch": 0.09, "learning_rate": 0.00198201943122111, "loss": 3.0006, "step": 3299 }, { "epoch": 0.09, "learning_rate": 0.0019820029962542792, "loss": 2.2553, "step": 3300 }, { "epoch": 0.09, "learning_rate": 0.00198198655384797, "loss": 2.6609, "step": 3301 }, { "epoch": 0.09, "learning_rate": 0.001981970104002306, "loss": 2.5786, "step": 3302 }, { "epoch": 0.09, "learning_rate": 0.001981953646717412, "loss": 2.842, "step": 3303 }, { "epoch": 0.09, "learning_rate": 0.0019819371819934125, "loss": 2.7723, "step": 3304 }, { "epoch": 0.09, "learning_rate": 0.001981920709830433, "loss": 2.5559, "step": 3305 }, { "epoch": 0.09, "learning_rate": 0.0019819042302285975, "loss": 2.6345, "step": 3306 }, { "epoch": 0.09, "learning_rate": 0.001981887743188031, "loss": 2.8565, "step": 3307 }, { "epoch": 0.09, "learning_rate": 0.0019818712487088587, "loss": 2.4963, "step": 3308 }, { "epoch": 0.09, "learning_rate": 0.001981854746791205, "loss": 3.1063, "step": 3309 }, { "epoch": 0.09, "learning_rate": 0.0019818382374351957, "loss": 2.6644, "step": 3310 }, { "epoch": 0.09, "learning_rate": 0.0019818217206409553, "loss": 2.5376, "step": 3311 }, { "epoch": 0.09, "learning_rate": 0.001981805196408609, "loss": 3.0969, "step": 3312 }, { "epoch": 0.09, "learning_rate": 0.001981788664738282, "loss": 3.0711, "step": 3313 }, { "epoch": 0.09, "learning_rate": 0.0019817721256301, "loss": 2.4319, "step": 3314 }, { "epoch": 0.09, "learning_rate": 0.0019817555790841873, "loss": 3.2019, "step": 3315 }, { "epoch": 0.09, "learning_rate": 0.0019817390251006704, "loss": 2.6582, "step": 3316 }, { "epoch": 0.09, "learning_rate": 0.001981722463679674, "loss": 2.5445, "step": 3317 }, { "epoch": 0.09, "learning_rate": 0.0019817058948213236, "loss": 2.9686, "step": 3318 }, { "epoch": 0.09, "learning_rate": 0.001981689318525745, "loss": 2.7946, "step": 3319 }, { "epoch": 0.09, "learning_rate": 0.0019816727347930635, "loss": 2.4557, "step": 3320 }, { "epoch": 0.09, "learning_rate": 0.001981656143623405, "loss": 3.3837, "step": 3321 }, { "epoch": 0.09, "learning_rate": 0.0019816395450168948, "loss": 2.4665, "step": 3322 }, { "epoch": 0.09, "learning_rate": 0.001981622938973659, "loss": 2.3923, "step": 3323 }, { "epoch": 0.09, "learning_rate": 0.0019816063254938236, "loss": 2.4467, "step": 3324 }, { "epoch": 0.09, "learning_rate": 0.001981589704577514, "loss": 2.9157, "step": 3325 }, { "epoch": 0.09, "learning_rate": 0.001981573076224856, "loss": 2.7872, "step": 3326 }, { "epoch": 0.09, "learning_rate": 0.0019815564404359765, "loss": 2.3823, "step": 3327 }, { "epoch": 0.09, "learning_rate": 0.0019815397972110004, "loss": 2.8302, "step": 3328 }, { "epoch": 0.09, "learning_rate": 0.0019815231465500544, "loss": 2.8971, "step": 3329 }, { "epoch": 0.09, "learning_rate": 0.0019815064884532644, "loss": 2.9941, "step": 3330 }, { "epoch": 0.09, "learning_rate": 0.001981489822920757, "loss": 2.5286, "step": 3331 }, { "epoch": 0.09, "learning_rate": 0.001981473149952658, "loss": 2.3413, "step": 3332 }, { "epoch": 0.09, "learning_rate": 0.001981456469549094, "loss": 2.4469, "step": 3333 }, { "epoch": 0.09, "learning_rate": 0.001981439781710191, "loss": 2.9261, "step": 3334 }, { "epoch": 0.09, "learning_rate": 0.001981423086436076, "loss": 2.8467, "step": 3335 }, { "epoch": 0.09, "learning_rate": 0.001981406383726875, "loss": 2.6503, "step": 3336 }, { "epoch": 0.09, "learning_rate": 0.0019813896735827144, "loss": 2.6445, "step": 3337 }, { "epoch": 0.09, "learning_rate": 0.0019813729560037214, "loss": 2.8774, "step": 3338 }, { "epoch": 0.09, "learning_rate": 0.0019813562309900228, "loss": 2.9622, "step": 3339 }, { "epoch": 0.09, "learning_rate": 0.0019813394985417443, "loss": 2.5683, "step": 3340 }, { "epoch": 0.09, "learning_rate": 0.001981322758659013, "loss": 2.7971, "step": 3341 }, { "epoch": 0.09, "learning_rate": 0.0019813060113419564, "loss": 2.9248, "step": 3342 }, { "epoch": 0.09, "learning_rate": 0.0019812892565907007, "loss": 2.9738, "step": 3343 }, { "epoch": 0.09, "learning_rate": 0.0019812724944053726, "loss": 2.6313, "step": 3344 }, { "epoch": 0.09, "learning_rate": 0.0019812557247861004, "loss": 2.5391, "step": 3345 }, { "epoch": 0.09, "learning_rate": 0.00198123894773301, "loss": 2.5068, "step": 3346 }, { "epoch": 0.09, "learning_rate": 0.001981222163246228, "loss": 2.772, "step": 3347 }, { "epoch": 0.09, "learning_rate": 0.001981205371325883, "loss": 2.9014, "step": 3348 }, { "epoch": 0.09, "learning_rate": 0.0019811885719721017, "loss": 2.5466, "step": 3349 }, { "epoch": 0.09, "learning_rate": 0.0019811717651850107, "loss": 2.971, "step": 3350 }, { "epoch": 0.09, "learning_rate": 0.001981154950964738, "loss": 2.8679, "step": 3351 }, { "epoch": 0.09, "learning_rate": 0.001981138129311411, "loss": 2.8976, "step": 3352 }, { "epoch": 0.09, "learning_rate": 0.0019811213002251566, "loss": 3.3554, "step": 3353 }, { "epoch": 0.09, "learning_rate": 0.001981104463706103, "loss": 2.784, "step": 3354 }, { "epoch": 0.09, "learning_rate": 0.001981087619754377, "loss": 2.9484, "step": 3355 }, { "epoch": 0.09, "learning_rate": 0.001981070768370107, "loss": 2.8311, "step": 3356 }, { "epoch": 0.09, "learning_rate": 0.00198105390955342, "loss": 2.556, "step": 3357 }, { "epoch": 0.09, "learning_rate": 0.001981037043304444, "loss": 2.6089, "step": 3358 }, { "epoch": 0.09, "learning_rate": 0.0019810201696233067, "loss": 2.8244, "step": 3359 }, { "epoch": 0.09, "learning_rate": 0.001981003288510136, "loss": 2.6568, "step": 3360 }, { "epoch": 0.09, "learning_rate": 0.00198098639996506, "loss": 2.1334, "step": 3361 }, { "epoch": 0.09, "learning_rate": 0.001980969503988206, "loss": 2.8811, "step": 3362 }, { "epoch": 0.09, "learning_rate": 0.001980952600579703, "loss": 2.9294, "step": 3363 }, { "epoch": 0.09, "learning_rate": 0.001980935689739678, "loss": 2.507, "step": 3364 }, { "epoch": 0.09, "learning_rate": 0.00198091877146826, "loss": 2.8871, "step": 3365 }, { "epoch": 0.09, "learning_rate": 0.0019809018457655767, "loss": 2.6676, "step": 3366 }, { "epoch": 0.09, "learning_rate": 0.0019808849126317562, "loss": 2.8347, "step": 3367 }, { "epoch": 0.09, "learning_rate": 0.001980867972066927, "loss": 3.0314, "step": 3368 }, { "epoch": 0.09, "learning_rate": 0.001980851024071217, "loss": 2.6953, "step": 3369 }, { "epoch": 0.09, "learning_rate": 0.0019808340686447556, "loss": 3.2387, "step": 3370 }, { "epoch": 0.09, "learning_rate": 0.0019808171057876705, "loss": 2.5482, "step": 3371 }, { "epoch": 0.09, "learning_rate": 0.0019808001355000903, "loss": 2.8727, "step": 3372 }, { "epoch": 0.09, "learning_rate": 0.0019807831577821435, "loss": 2.651, "step": 3373 }, { "epoch": 0.09, "learning_rate": 0.001980766172633959, "loss": 2.7363, "step": 3374 }, { "epoch": 0.09, "learning_rate": 0.001980749180055665, "loss": 3.1775, "step": 3375 }, { "epoch": 0.09, "learning_rate": 0.001980732180047391, "loss": 2.7112, "step": 3376 }, { "epoch": 0.09, "learning_rate": 0.001980715172609265, "loss": 2.7033, "step": 3377 }, { "epoch": 0.09, "learning_rate": 0.0019806981577414166, "loss": 2.4071, "step": 3378 }, { "epoch": 0.09, "learning_rate": 0.001980681135443974, "loss": 2.7591, "step": 3379 }, { "epoch": 0.09, "learning_rate": 0.0019806641057170666, "loss": 2.7413, "step": 3380 }, { "epoch": 0.09, "learning_rate": 0.001980647068560823, "loss": 2.769, "step": 3381 }, { "epoch": 0.09, "learning_rate": 0.0019806300239753726, "loss": 2.6942, "step": 3382 }, { "epoch": 0.09, "learning_rate": 0.0019806129719608444, "loss": 2.5832, "step": 3383 }, { "epoch": 0.09, "learning_rate": 0.001980595912517368, "loss": 2.9195, "step": 3384 }, { "epoch": 0.09, "learning_rate": 0.0019805788456450724, "loss": 2.9511, "step": 3385 }, { "epoch": 0.09, "learning_rate": 0.0019805617713440863, "loss": 2.7595, "step": 3386 }, { "epoch": 0.09, "learning_rate": 0.0019805446896145394, "loss": 2.9858, "step": 3387 }, { "epoch": 0.09, "learning_rate": 0.001980527600456562, "loss": 3.2281, "step": 3388 }, { "epoch": 0.09, "learning_rate": 0.001980510503870282, "loss": 2.7782, "step": 3389 }, { "epoch": 0.09, "learning_rate": 0.0019804933998558297, "loss": 2.53, "step": 3390 }, { "epoch": 0.09, "learning_rate": 0.0019804762884133354, "loss": 2.9631, "step": 3391 }, { "epoch": 0.09, "learning_rate": 0.0019804591695429274, "loss": 2.3983, "step": 3392 }, { "epoch": 0.09, "learning_rate": 0.001980442043244736, "loss": 2.6994, "step": 3393 }, { "epoch": 0.09, "learning_rate": 0.0019804249095188914, "loss": 2.9531, "step": 3394 }, { "epoch": 0.09, "learning_rate": 0.001980407768365523, "loss": 2.7216, "step": 3395 }, { "epoch": 0.09, "learning_rate": 0.0019803906197847607, "loss": 2.6952, "step": 3396 }, { "epoch": 0.09, "learning_rate": 0.001980373463776734, "loss": 2.6565, "step": 3397 }, { "epoch": 0.09, "learning_rate": 0.001980356300341573, "loss": 2.653, "step": 3398 }, { "epoch": 0.09, "learning_rate": 0.0019803391294794083, "loss": 2.7597, "step": 3399 }, { "epoch": 0.09, "learning_rate": 0.0019803219511903697, "loss": 3.0052, "step": 3400 }, { "epoch": 0.09, "learning_rate": 0.0019803047654745874, "loss": 2.5311, "step": 3401 }, { "epoch": 0.09, "learning_rate": 0.001980287572332191, "loss": 2.6749, "step": 3402 }, { "epoch": 0.09, "learning_rate": 0.0019802703717633112, "loss": 2.6981, "step": 3403 }, { "epoch": 0.09, "learning_rate": 0.001980253163768079, "loss": 3.1055, "step": 3404 }, { "epoch": 0.09, "learning_rate": 0.0019802359483466233, "loss": 2.4092, "step": 3405 }, { "epoch": 0.09, "learning_rate": 0.001980218725499076, "loss": 2.6718, "step": 3406 }, { "epoch": 0.09, "learning_rate": 0.001980201495225566, "loss": 2.6116, "step": 3407 }, { "epoch": 0.09, "learning_rate": 0.001980184257526225, "loss": 2.7411, "step": 3408 }, { "epoch": 0.09, "learning_rate": 0.001980167012401184, "loss": 2.5743, "step": 3409 }, { "epoch": 0.09, "learning_rate": 0.0019801497598505723, "loss": 3.2525, "step": 3410 }, { "epoch": 0.09, "learning_rate": 0.0019801324998745214, "loss": 2.7446, "step": 3411 }, { "epoch": 0.09, "learning_rate": 0.001980115232473162, "loss": 2.7501, "step": 3412 }, { "epoch": 0.09, "learning_rate": 0.001980097957646625, "loss": 3.3941, "step": 3413 }, { "epoch": 0.09, "learning_rate": 0.0019800806753950406, "loss": 2.7349, "step": 3414 }, { "epoch": 0.09, "learning_rate": 0.0019800633857185402, "loss": 2.602, "step": 3415 }, { "epoch": 0.09, "learning_rate": 0.0019800460886172555, "loss": 2.6749, "step": 3416 }, { "epoch": 0.09, "learning_rate": 0.001980028784091316, "loss": 2.8132, "step": 3417 }, { "epoch": 0.09, "learning_rate": 0.001980011472140854, "loss": 2.6975, "step": 3418 }, { "epoch": 0.09, "learning_rate": 0.001979994152766001, "loss": 2.6946, "step": 3419 }, { "epoch": 0.09, "learning_rate": 0.0019799768259668865, "loss": 3.2015, "step": 3420 }, { "epoch": 0.09, "learning_rate": 0.001979959491743643, "loss": 3.08, "step": 3421 }, { "epoch": 0.09, "learning_rate": 0.001979942150096402, "loss": 2.5758, "step": 3422 }, { "epoch": 0.09, "learning_rate": 0.0019799248010252944, "loss": 2.7754, "step": 3423 }, { "epoch": 0.09, "learning_rate": 0.0019799074445304514, "loss": 2.7862, "step": 3424 }, { "epoch": 0.09, "learning_rate": 0.0019798900806120047, "loss": 2.769, "step": 3425 }, { "epoch": 0.09, "learning_rate": 0.001979872709270086, "loss": 2.7362, "step": 3426 }, { "epoch": 0.09, "learning_rate": 0.001979855330504827, "loss": 2.6583, "step": 3427 }, { "epoch": 0.09, "learning_rate": 0.0019798379443163594, "loss": 2.9053, "step": 3428 }, { "epoch": 0.09, "learning_rate": 0.0019798205507048144, "loss": 2.3877, "step": 3429 }, { "epoch": 0.09, "learning_rate": 0.0019798031496703243, "loss": 2.7261, "step": 3430 }, { "epoch": 0.09, "learning_rate": 0.0019797857412130206, "loss": 2.724, "step": 3431 }, { "epoch": 0.09, "learning_rate": 0.001979768325333035, "loss": 2.601, "step": 3432 }, { "epoch": 0.09, "learning_rate": 0.0019797509020305004, "loss": 2.6512, "step": 3433 }, { "epoch": 0.09, "learning_rate": 0.0019797334713055476, "loss": 2.5884, "step": 3434 }, { "epoch": 0.09, "learning_rate": 0.0019797160331583093, "loss": 2.4512, "step": 3435 }, { "epoch": 0.09, "learning_rate": 0.0019796985875889174, "loss": 2.7002, "step": 3436 }, { "epoch": 0.09, "learning_rate": 0.0019796811345975046, "loss": 2.7708, "step": 3437 }, { "epoch": 0.09, "learning_rate": 0.0019796636741842024, "loss": 2.8431, "step": 3438 }, { "epoch": 0.09, "learning_rate": 0.001979646206349143, "loss": 2.8038, "step": 3439 }, { "epoch": 0.09, "learning_rate": 0.0019796287310924593, "loss": 2.7431, "step": 3440 }, { "epoch": 0.09, "learning_rate": 0.0019796112484142835, "loss": 2.8092, "step": 3441 }, { "epoch": 0.09, "learning_rate": 0.001979593758314748, "loss": 2.6309, "step": 3442 }, { "epoch": 0.09, "learning_rate": 0.0019795762607939856, "loss": 2.3092, "step": 3443 }, { "epoch": 0.09, "learning_rate": 0.0019795587558521285, "loss": 3.1407, "step": 3444 }, { "epoch": 0.09, "learning_rate": 0.001979541243489309, "loss": 2.7727, "step": 3445 }, { "epoch": 0.09, "learning_rate": 0.001979523723705661, "loss": 2.9924, "step": 3446 }, { "epoch": 0.09, "learning_rate": 0.0019795061965013155, "loss": 3.2411, "step": 3447 }, { "epoch": 0.09, "learning_rate": 0.0019794886618764067, "loss": 2.9518, "step": 3448 }, { "epoch": 0.09, "learning_rate": 0.0019794711198310665, "loss": 2.2759, "step": 3449 }, { "epoch": 0.09, "learning_rate": 0.0019794535703654284, "loss": 2.5744, "step": 3450 }, { "epoch": 0.09, "learning_rate": 0.001979436013479625, "loss": 2.5733, "step": 3451 }, { "epoch": 0.09, "learning_rate": 0.00197941844917379, "loss": 2.5517, "step": 3452 }, { "epoch": 0.09, "learning_rate": 0.0019794008774480553, "loss": 2.7446, "step": 3453 }, { "epoch": 0.09, "learning_rate": 0.001979383298302555, "loss": 2.7903, "step": 3454 }, { "epoch": 0.09, "learning_rate": 0.001979365711737422, "loss": 2.7418, "step": 3455 }, { "epoch": 0.09, "learning_rate": 0.0019793481177527894, "loss": 2.6363, "step": 3456 }, { "epoch": 0.09, "learning_rate": 0.0019793305163487906, "loss": 2.8233, "step": 3457 }, { "epoch": 0.09, "learning_rate": 0.0019793129075255586, "loss": 3.117, "step": 3458 }, { "epoch": 0.09, "learning_rate": 0.001979295291283227, "loss": 2.6166, "step": 3459 }, { "epoch": 0.09, "learning_rate": 0.00197927766762193, "loss": 2.5742, "step": 3460 }, { "epoch": 0.09, "learning_rate": 0.0019792600365418, "loss": 3.266, "step": 3461 }, { "epoch": 0.09, "learning_rate": 0.001979242398042971, "loss": 2.97, "step": 3462 }, { "epoch": 0.09, "learning_rate": 0.001979224752125577, "loss": 2.8879, "step": 3463 }, { "epoch": 0.09, "learning_rate": 0.001979207098789751, "loss": 2.4799, "step": 3464 }, { "epoch": 0.09, "learning_rate": 0.0019791894380356274, "loss": 2.7582, "step": 3465 }, { "epoch": 0.09, "learning_rate": 0.0019791717698633394, "loss": 3.0741, "step": 3466 }, { "epoch": 0.09, "learning_rate": 0.001979154094273021, "loss": 2.3654, "step": 3467 }, { "epoch": 0.09, "learning_rate": 0.0019791364112648068, "loss": 2.8589, "step": 3468 }, { "epoch": 0.09, "learning_rate": 0.00197911872083883, "loss": 2.2117, "step": 3469 }, { "epoch": 0.09, "learning_rate": 0.0019791010229952243, "loss": 2.8935, "step": 3470 }, { "epoch": 0.09, "learning_rate": 0.001979083317734125, "loss": 2.9323, "step": 3471 }, { "epoch": 0.09, "learning_rate": 0.001979065605055665, "loss": 2.7969, "step": 3472 }, { "epoch": 0.09, "learning_rate": 0.0019790478849599793, "loss": 2.8403, "step": 3473 }, { "epoch": 0.09, "learning_rate": 0.0019790301574472017, "loss": 2.8751, "step": 3474 }, { "epoch": 0.09, "learning_rate": 0.001979012422517467, "loss": 2.9912, "step": 3475 }, { "epoch": 0.09, "learning_rate": 0.0019789946801709087, "loss": 2.3135, "step": 3476 }, { "epoch": 0.09, "learning_rate": 0.0019789769304076623, "loss": 2.5153, "step": 3477 }, { "epoch": 0.09, "learning_rate": 0.0019789591732278615, "loss": 2.7848, "step": 3478 }, { "epoch": 0.09, "learning_rate": 0.001978941408631641, "loss": 2.5848, "step": 3479 }, { "epoch": 0.09, "learning_rate": 0.001978923636619135, "loss": 2.7015, "step": 3480 }, { "epoch": 0.09, "learning_rate": 0.001978905857190479, "loss": 2.7986, "step": 3481 }, { "epoch": 0.09, "learning_rate": 0.001978888070345807, "loss": 2.7669, "step": 3482 }, { "epoch": 0.09, "learning_rate": 0.0019788702760852542, "loss": 2.9202, "step": 3483 }, { "epoch": 0.09, "learning_rate": 0.001978852474408955, "loss": 2.6937, "step": 3484 }, { "epoch": 0.09, "learning_rate": 0.001978834665317045, "loss": 3.3084, "step": 3485 }, { "epoch": 0.09, "learning_rate": 0.001978816848809658, "loss": 2.3061, "step": 3486 }, { "epoch": 0.09, "learning_rate": 0.0019787990248869296, "loss": 2.9795, "step": 3487 }, { "epoch": 0.09, "learning_rate": 0.0019787811935489947, "loss": 2.7607, "step": 3488 }, { "epoch": 0.09, "learning_rate": 0.0019787633547959887, "loss": 2.4076, "step": 3489 }, { "epoch": 0.09, "learning_rate": 0.0019787455086280464, "loss": 2.536, "step": 3490 }, { "epoch": 0.09, "learning_rate": 0.0019787276550453036, "loss": 2.9467, "step": 3491 }, { "epoch": 0.09, "learning_rate": 0.001978709794047894, "loss": 2.9433, "step": 3492 }, { "epoch": 0.09, "learning_rate": 0.001978691925635955, "loss": 2.6789, "step": 3493 }, { "epoch": 0.09, "learning_rate": 0.0019786740498096205, "loss": 2.9565, "step": 3494 }, { "epoch": 0.09, "learning_rate": 0.0019786561665690264, "loss": 2.9058, "step": 3495 }, { "epoch": 0.09, "learning_rate": 0.0019786382759143083, "loss": 2.8355, "step": 3496 }, { "epoch": 0.09, "learning_rate": 0.0019786203778456015, "loss": 2.6837, "step": 3497 }, { "epoch": 0.09, "learning_rate": 0.001978602472363042, "loss": 2.8434, "step": 3498 }, { "epoch": 0.09, "learning_rate": 0.0019785845594667644, "loss": 2.6721, "step": 3499 }, { "epoch": 0.09, "learning_rate": 0.0019785666391569055, "loss": 2.4599, "step": 3500 }, { "epoch": 0.09, "learning_rate": 0.0019785487114336005, "loss": 2.8604, "step": 3501 }, { "epoch": 0.09, "learning_rate": 0.0019785307762969855, "loss": 3.017, "step": 3502 }, { "epoch": 0.09, "learning_rate": 0.0019785128337471967, "loss": 2.5882, "step": 3503 }, { "epoch": 0.09, "learning_rate": 0.0019784948837843694, "loss": 2.9521, "step": 3504 }, { "epoch": 0.09, "learning_rate": 0.0019784769264086393, "loss": 2.9118, "step": 3505 }, { "epoch": 0.09, "learning_rate": 0.0019784589616201435, "loss": 3.2907, "step": 3506 }, { "epoch": 0.09, "learning_rate": 0.0019784409894190173, "loss": 3.3854, "step": 3507 }, { "epoch": 0.09, "learning_rate": 0.0019784230098053974, "loss": 2.6194, "step": 3508 }, { "epoch": 0.09, "learning_rate": 0.0019784050227794193, "loss": 2.8595, "step": 3509 }, { "epoch": 0.09, "learning_rate": 0.00197838702834122, "loss": 2.3367, "step": 3510 }, { "epoch": 0.09, "learning_rate": 0.001978369026490935, "loss": 2.5822, "step": 3511 }, { "epoch": 0.09, "learning_rate": 0.0019783510172287017, "loss": 2.5988, "step": 3512 }, { "epoch": 0.09, "learning_rate": 0.001978333000554656, "loss": 3.0922, "step": 3513 }, { "epoch": 0.09, "learning_rate": 0.001978314976468934, "loss": 3.0957, "step": 3514 }, { "epoch": 0.09, "learning_rate": 0.0019782969449716726, "loss": 2.8515, "step": 3515 }, { "epoch": 0.09, "learning_rate": 0.001978278906063009, "loss": 2.5282, "step": 3516 }, { "epoch": 0.09, "learning_rate": 0.0019782608597430787, "loss": 2.773, "step": 3517 }, { "epoch": 0.09, "learning_rate": 0.0019782428060120196, "loss": 2.7762, "step": 3518 }, { "epoch": 0.09, "learning_rate": 0.0019782247448699676, "loss": 2.8749, "step": 3519 }, { "epoch": 0.09, "learning_rate": 0.00197820667631706, "loss": 2.8693, "step": 3520 }, { "epoch": 0.09, "learning_rate": 0.0019781886003534333, "loss": 2.9019, "step": 3521 }, { "epoch": 0.09, "learning_rate": 0.001978170516979224, "loss": 2.3963, "step": 3522 }, { "epoch": 0.09, "learning_rate": 0.001978152426194571, "loss": 2.84, "step": 3523 }, { "epoch": 0.09, "learning_rate": 0.0019781343279996096, "loss": 2.5563, "step": 3524 }, { "epoch": 0.09, "learning_rate": 0.001978116222394477, "loss": 3.0171, "step": 3525 }, { "epoch": 0.09, "learning_rate": 0.0019780981093793113, "loss": 2.9028, "step": 3526 }, { "epoch": 0.09, "learning_rate": 0.001978079988954249, "loss": 2.6342, "step": 3527 }, { "epoch": 0.09, "learning_rate": 0.0019780618611194276, "loss": 2.8839, "step": 3528 }, { "epoch": 0.09, "learning_rate": 0.0019780437258749843, "loss": 2.3928, "step": 3529 }, { "epoch": 0.09, "learning_rate": 0.001978025583221057, "loss": 2.7676, "step": 3530 }, { "epoch": 0.09, "learning_rate": 0.001978007433157782, "loss": 2.4645, "step": 3531 }, { "epoch": 0.09, "learning_rate": 0.0019779892756852983, "loss": 2.8638, "step": 3532 }, { "epoch": 0.09, "learning_rate": 0.0019779711108037423, "loss": 2.8438, "step": 3533 }, { "epoch": 0.09, "learning_rate": 0.0019779529385132518, "loss": 2.3577, "step": 3534 }, { "epoch": 0.09, "learning_rate": 0.001977934758813965, "loss": 2.787, "step": 3535 }, { "epoch": 0.1, "learning_rate": 0.001977916571706019, "loss": 2.9261, "step": 3536 }, { "epoch": 0.1, "learning_rate": 0.0019778983771895522, "loss": 2.5902, "step": 3537 }, { "epoch": 0.1, "learning_rate": 0.001977880175264702, "loss": 2.7232, "step": 3538 }, { "epoch": 0.1, "learning_rate": 0.0019778619659316064, "loss": 2.5369, "step": 3539 }, { "epoch": 0.1, "learning_rate": 0.0019778437491904037, "loss": 2.5904, "step": 3540 }, { "epoch": 0.1, "learning_rate": 0.0019778255250412313, "loss": 2.8583, "step": 3541 }, { "epoch": 0.1, "learning_rate": 0.0019778072934842276, "loss": 2.7902, "step": 3542 }, { "epoch": 0.1, "learning_rate": 0.0019777890545195306, "loss": 2.4501, "step": 3543 }, { "epoch": 0.1, "learning_rate": 0.0019777708081472785, "loss": 3.1198, "step": 3544 }, { "epoch": 0.1, "learning_rate": 0.0019777525543676097, "loss": 2.7514, "step": 3545 }, { "epoch": 0.1, "learning_rate": 0.001977734293180662, "loss": 3.1513, "step": 3546 }, { "epoch": 0.1, "learning_rate": 0.0019777160245865746, "loss": 2.5072, "step": 3547 }, { "epoch": 0.1, "learning_rate": 0.0019776977485854853, "loss": 2.449, "step": 3548 }, { "epoch": 0.1, "learning_rate": 0.0019776794651775323, "loss": 2.6353, "step": 3549 }, { "epoch": 0.1, "learning_rate": 0.001977661174362855, "loss": 2.362, "step": 3550 }, { "epoch": 0.1, "learning_rate": 0.0019776428761415906, "loss": 2.9743, "step": 3551 }, { "epoch": 0.1, "learning_rate": 0.0019776245705138795, "loss": 2.4601, "step": 3552 }, { "epoch": 0.1, "learning_rate": 0.001977606257479859, "loss": 2.7019, "step": 3553 }, { "epoch": 0.1, "learning_rate": 0.0019775879370396683, "loss": 2.9194, "step": 3554 }, { "epoch": 0.1, "learning_rate": 0.001977569609193446, "loss": 2.3696, "step": 3555 }, { "epoch": 0.1, "learning_rate": 0.001977551273941331, "loss": 2.6381, "step": 3556 }, { "epoch": 0.1, "learning_rate": 0.001977532931283463, "loss": 2.8772, "step": 3557 }, { "epoch": 0.1, "learning_rate": 0.00197751458121998, "loss": 2.6726, "step": 3558 }, { "epoch": 0.1, "learning_rate": 0.0019774962237510208, "loss": 2.2656, "step": 3559 }, { "epoch": 0.1, "learning_rate": 0.0019774778588767254, "loss": 3.1785, "step": 3560 }, { "epoch": 0.1, "learning_rate": 0.0019774594865972325, "loss": 2.8868, "step": 3561 }, { "epoch": 0.1, "learning_rate": 0.0019774411069126813, "loss": 2.5027, "step": 3562 }, { "epoch": 0.1, "learning_rate": 0.0019774227198232105, "loss": 2.6848, "step": 3563 }, { "epoch": 0.1, "learning_rate": 0.0019774043253289607, "loss": 2.8195, "step": 3564 }, { "epoch": 0.1, "learning_rate": 0.00197738592343007, "loss": 2.4702, "step": 3565 }, { "epoch": 0.1, "learning_rate": 0.0019773675141266786, "loss": 2.729, "step": 3566 }, { "epoch": 0.1, "learning_rate": 0.001977349097418925, "loss": 2.6878, "step": 3567 }, { "epoch": 0.1, "learning_rate": 0.00197733067330695, "loss": 2.6146, "step": 3568 }, { "epoch": 0.1, "learning_rate": 0.0019773122417908926, "loss": 2.8847, "step": 3569 }, { "epoch": 0.1, "learning_rate": 0.001977293802870892, "loss": 2.936, "step": 3570 }, { "epoch": 0.1, "learning_rate": 0.0019772753565470884, "loss": 2.8457, "step": 3571 }, { "epoch": 0.1, "learning_rate": 0.0019772569028196213, "loss": 2.7025, "step": 3572 }, { "epoch": 0.1, "learning_rate": 0.001977238441688631, "loss": 3.1462, "step": 3573 }, { "epoch": 0.1, "learning_rate": 0.001977219973154257, "loss": 2.9364, "step": 3574 }, { "epoch": 0.1, "learning_rate": 0.0019772014972166386, "loss": 2.7508, "step": 3575 }, { "epoch": 0.1, "learning_rate": 0.001977183013875917, "loss": 2.6881, "step": 3576 }, { "epoch": 0.1, "learning_rate": 0.001977164523132231, "loss": 2.7074, "step": 3577 }, { "epoch": 0.1, "learning_rate": 0.0019771460249857218, "loss": 2.7381, "step": 3578 }, { "epoch": 0.1, "learning_rate": 0.001977127519436529, "loss": 2.5855, "step": 3579 }, { "epoch": 0.1, "learning_rate": 0.001977109006484792, "loss": 2.5133, "step": 3580 }, { "epoch": 0.1, "learning_rate": 0.0019770904861306526, "loss": 2.8828, "step": 3581 }, { "epoch": 0.1, "learning_rate": 0.0019770719583742506, "loss": 2.8897, "step": 3582 }, { "epoch": 0.1, "learning_rate": 0.0019770534232157254, "loss": 2.9749, "step": 3583 }, { "epoch": 0.1, "learning_rate": 0.001977034880655219, "loss": 2.5814, "step": 3584 }, { "epoch": 0.1, "learning_rate": 0.0019770163306928705, "loss": 2.6404, "step": 3585 }, { "epoch": 0.1, "learning_rate": 0.0019769977733288206, "loss": 2.9066, "step": 3586 }, { "epoch": 0.1, "learning_rate": 0.0019769792085632108, "loss": 2.7001, "step": 3587 }, { "epoch": 0.1, "learning_rate": 0.001976960636396181, "loss": 2.9074, "step": 3588 }, { "epoch": 0.1, "learning_rate": 0.001976942056827872, "loss": 2.514, "step": 3589 }, { "epoch": 0.1, "learning_rate": 0.0019769234698584245, "loss": 2.9533, "step": 3590 }, { "epoch": 0.1, "learning_rate": 0.0019769048754879797, "loss": 2.9488, "step": 3591 }, { "epoch": 0.1, "learning_rate": 0.001976886273716678, "loss": 2.7084, "step": 3592 }, { "epoch": 0.1, "learning_rate": 0.0019768676645446613, "loss": 3.0749, "step": 3593 }, { "epoch": 0.1, "learning_rate": 0.001976849047972069, "loss": 2.7813, "step": 3594 }, { "epoch": 0.1, "learning_rate": 0.001976830423999043, "loss": 2.4511, "step": 3595 }, { "epoch": 0.1, "learning_rate": 0.001976811792625725, "loss": 2.5198, "step": 3596 }, { "epoch": 0.1, "learning_rate": 0.001976793153852255, "loss": 2.8911, "step": 3597 }, { "epoch": 0.1, "learning_rate": 0.0019767745076787746, "loss": 2.4112, "step": 3598 }, { "epoch": 0.1, "learning_rate": 0.0019767558541054255, "loss": 2.6425, "step": 3599 }, { "epoch": 0.1, "learning_rate": 0.0019767371931323483, "loss": 3.0078, "step": 3600 }, { "epoch": 0.1, "learning_rate": 0.0019767185247596846, "loss": 2.5978, "step": 3601 }, { "epoch": 0.1, "learning_rate": 0.0019766998489875766, "loss": 3.5931, "step": 3602 }, { "epoch": 0.1, "learning_rate": 0.0019766811658161647, "loss": 2.9508, "step": 3603 }, { "epoch": 0.1, "learning_rate": 0.0019766624752455913, "loss": 2.5803, "step": 3604 }, { "epoch": 0.1, "learning_rate": 0.001976643777275997, "loss": 2.6017, "step": 3605 }, { "epoch": 0.1, "learning_rate": 0.0019766250719075247, "loss": 2.4445, "step": 3606 }, { "epoch": 0.1, "learning_rate": 0.0019766063591403153, "loss": 2.4332, "step": 3607 }, { "epoch": 0.1, "learning_rate": 0.0019765876389745106, "loss": 2.5539, "step": 3608 }, { "epoch": 0.1, "learning_rate": 0.0019765689114102526, "loss": 3.0759, "step": 3609 }, { "epoch": 0.1, "learning_rate": 0.001976550176447683, "loss": 2.8006, "step": 3610 }, { "epoch": 0.1, "learning_rate": 0.0019765314340869436, "loss": 2.781, "step": 3611 }, { "epoch": 0.1, "learning_rate": 0.001976512684328177, "loss": 2.7465, "step": 3612 }, { "epoch": 0.1, "learning_rate": 0.001976493927171525, "loss": 2.698, "step": 3613 }, { "epoch": 0.1, "learning_rate": 0.0019764751626171295, "loss": 2.9508, "step": 3614 }, { "epoch": 0.1, "learning_rate": 0.0019764563906651323, "loss": 2.6645, "step": 3615 }, { "epoch": 0.1, "learning_rate": 0.0019764376113156766, "loss": 2.4694, "step": 3616 }, { "epoch": 0.1, "learning_rate": 0.0019764188245689042, "loss": 2.5769, "step": 3617 }, { "epoch": 0.1, "learning_rate": 0.0019764000304249574, "loss": 2.7145, "step": 3618 }, { "epoch": 0.1, "learning_rate": 0.001976381228883978, "loss": 2.5909, "step": 3619 }, { "epoch": 0.1, "learning_rate": 0.0019763624199461093, "loss": 2.3942, "step": 3620 }, { "epoch": 0.1, "learning_rate": 0.0019763436036114935, "loss": 2.708, "step": 3621 }, { "epoch": 0.1, "learning_rate": 0.001976324779880273, "loss": 3.1858, "step": 3622 }, { "epoch": 0.1, "learning_rate": 0.00197630594875259, "loss": 2.2701, "step": 3623 }, { "epoch": 0.1, "learning_rate": 0.0019762871102285886, "loss": 2.9621, "step": 3624 }, { "epoch": 0.1, "learning_rate": 0.00197626826430841, "loss": 2.9468, "step": 3625 }, { "epoch": 0.1, "learning_rate": 0.001976249410992198, "loss": 2.4936, "step": 3626 }, { "epoch": 0.1, "learning_rate": 0.0019762305502800948, "loss": 2.9836, "step": 3627 }, { "epoch": 0.1, "learning_rate": 0.0019762116821722435, "loss": 2.8869, "step": 3628 }, { "epoch": 0.1, "learning_rate": 0.0019761928066687868, "loss": 2.8657, "step": 3629 }, { "epoch": 0.1, "learning_rate": 0.0019761739237698682, "loss": 2.4982, "step": 3630 }, { "epoch": 0.1, "learning_rate": 0.00197615503347563, "loss": 2.6818, "step": 3631 }, { "epoch": 0.1, "learning_rate": 0.0019761361357862163, "loss": 2.99, "step": 3632 }, { "epoch": 0.1, "learning_rate": 0.0019761172307017696, "loss": 2.2075, "step": 3633 }, { "epoch": 0.1, "learning_rate": 0.0019760983182224336, "loss": 2.7286, "step": 3634 }, { "epoch": 0.1, "learning_rate": 0.0019760793983483508, "loss": 2.6464, "step": 3635 }, { "epoch": 0.1, "learning_rate": 0.0019760604710796653, "loss": 3.1387, "step": 3636 }, { "epoch": 0.1, "learning_rate": 0.00197604153641652, "loss": 2.5905, "step": 3637 }, { "epoch": 0.1, "learning_rate": 0.0019760225943590585, "loss": 2.3063, "step": 3638 }, { "epoch": 0.1, "learning_rate": 0.0019760036449074244, "loss": 3.0638, "step": 3639 }, { "epoch": 0.1, "learning_rate": 0.001975984688061761, "loss": 2.9607, "step": 3640 }, { "epoch": 0.1, "learning_rate": 0.0019759657238222123, "loss": 2.3171, "step": 3641 }, { "epoch": 0.1, "learning_rate": 0.0019759467521889215, "loss": 2.7726, "step": 3642 }, { "epoch": 0.1, "learning_rate": 0.001975927773162033, "loss": 2.6101, "step": 3643 }, { "epoch": 0.1, "learning_rate": 0.0019759087867416898, "loss": 2.9241, "step": 3644 }, { "epoch": 0.1, "learning_rate": 0.0019758897929280364, "loss": 2.5598, "step": 3645 }, { "epoch": 0.1, "learning_rate": 0.001975870791721216, "loss": 2.6701, "step": 3646 }, { "epoch": 0.1, "learning_rate": 0.0019758517831213736, "loss": 2.7605, "step": 3647 }, { "epoch": 0.1, "learning_rate": 0.0019758327671286517, "loss": 3.0268, "step": 3648 }, { "epoch": 0.1, "learning_rate": 0.001975813743743196, "loss": 2.6514, "step": 3649 }, { "epoch": 0.1, "learning_rate": 0.0019757947129651495, "loss": 2.5053, "step": 3650 }, { "epoch": 0.1, "learning_rate": 0.0019757756747946567, "loss": 2.6421, "step": 3651 }, { "epoch": 0.1, "learning_rate": 0.001975756629231862, "loss": 3.0917, "step": 3652 }, { "epoch": 0.1, "learning_rate": 0.001975737576276909, "loss": 2.8671, "step": 3653 }, { "epoch": 0.1, "learning_rate": 0.0019757185159299433, "loss": 2.5904, "step": 3654 }, { "epoch": 0.1, "learning_rate": 0.001975699448191108, "loss": 2.8127, "step": 3655 }, { "epoch": 0.1, "learning_rate": 0.0019756803730605482, "loss": 2.9404, "step": 3656 }, { "epoch": 0.1, "learning_rate": 0.0019756612905384085, "loss": 2.5342, "step": 3657 }, { "epoch": 0.1, "learning_rate": 0.0019756422006248333, "loss": 2.7193, "step": 3658 }, { "epoch": 0.1, "learning_rate": 0.0019756231033199673, "loss": 2.8394, "step": 3659 }, { "epoch": 0.1, "learning_rate": 0.001975603998623955, "loss": 2.7313, "step": 3660 }, { "epoch": 0.1, "learning_rate": 0.0019755848865369414, "loss": 2.8116, "step": 3661 }, { "epoch": 0.1, "learning_rate": 0.0019755657670590706, "loss": 2.8185, "step": 3662 }, { "epoch": 0.1, "learning_rate": 0.0019755466401904886, "loss": 2.4834, "step": 3663 }, { "epoch": 0.1, "learning_rate": 0.0019755275059313393, "loss": 2.861, "step": 3664 }, { "epoch": 0.1, "learning_rate": 0.001975508364281768, "loss": 2.5338, "step": 3665 }, { "epoch": 0.1, "learning_rate": 0.0019754892152419198, "loss": 2.705, "step": 3666 }, { "epoch": 0.1, "learning_rate": 0.0019754700588119397, "loss": 2.7323, "step": 3667 }, { "epoch": 0.1, "learning_rate": 0.001975450894991973, "loss": 2.7773, "step": 3668 }, { "epoch": 0.1, "learning_rate": 0.0019754317237821646, "loss": 2.7456, "step": 3669 }, { "epoch": 0.1, "learning_rate": 0.0019754125451826596, "loss": 2.8215, "step": 3670 }, { "epoch": 0.1, "learning_rate": 0.001975393359193604, "loss": 2.7138, "step": 3671 }, { "epoch": 0.1, "learning_rate": 0.0019753741658151422, "loss": 2.8301, "step": 3672 }, { "epoch": 0.1, "learning_rate": 0.0019753549650474204, "loss": 2.9584, "step": 3673 }, { "epoch": 0.1, "learning_rate": 0.001975335756890584, "loss": 2.6578, "step": 3674 }, { "epoch": 0.1, "learning_rate": 0.001975316541344778, "loss": 2.7991, "step": 3675 }, { "epoch": 0.1, "learning_rate": 0.001975297318410148, "loss": 3.276, "step": 3676 }, { "epoch": 0.1, "learning_rate": 0.00197527808808684, "loss": 2.3837, "step": 3677 }, { "epoch": 0.1, "learning_rate": 0.001975258850375, "loss": 2.8862, "step": 3678 }, { "epoch": 0.1, "learning_rate": 0.0019752396052747727, "loss": 2.8785, "step": 3679 }, { "epoch": 0.1, "learning_rate": 0.0019752203527863047, "loss": 2.8197, "step": 3680 }, { "epoch": 0.1, "learning_rate": 0.0019752010929097417, "loss": 2.2434, "step": 3681 }, { "epoch": 0.1, "learning_rate": 0.00197518182564523, "loss": 2.5587, "step": 3682 }, { "epoch": 0.1, "learning_rate": 0.001975162550992915, "loss": 2.5698, "step": 3683 }, { "epoch": 0.1, "learning_rate": 0.0019751432689529423, "loss": 2.5447, "step": 3684 }, { "epoch": 0.1, "learning_rate": 0.001975123979525459, "loss": 2.6383, "step": 3685 }, { "epoch": 0.1, "learning_rate": 0.001975104682710611, "loss": 2.5469, "step": 3686 }, { "epoch": 0.1, "learning_rate": 0.0019750853785085436, "loss": 2.3899, "step": 3687 }, { "epoch": 0.1, "learning_rate": 0.0019750660669194038, "loss": 2.5553, "step": 3688 }, { "epoch": 0.1, "learning_rate": 0.001975046747943338, "loss": 2.8113, "step": 3689 }, { "epoch": 0.1, "learning_rate": 0.0019750274215804926, "loss": 2.7739, "step": 3690 }, { "epoch": 0.1, "learning_rate": 0.0019750080878310136, "loss": 2.9762, "step": 3691 }, { "epoch": 0.1, "learning_rate": 0.0019749887466950474, "loss": 2.7168, "step": 3692 }, { "epoch": 0.1, "learning_rate": 0.001974969398172741, "loss": 2.7086, "step": 3693 }, { "epoch": 0.1, "learning_rate": 0.0019749500422642408, "loss": 3.1187, "step": 3694 }, { "epoch": 0.1, "learning_rate": 0.001974930678969693, "loss": 2.4843, "step": 3695 }, { "epoch": 0.1, "learning_rate": 0.001974911308289245, "loss": 2.7054, "step": 3696 }, { "epoch": 0.1, "learning_rate": 0.0019748919302230434, "loss": 2.7085, "step": 3697 }, { "epoch": 0.1, "learning_rate": 0.0019748725447712345, "loss": 2.579, "step": 3698 }, { "epoch": 0.1, "learning_rate": 0.0019748531519339653, "loss": 2.4522, "step": 3699 }, { "epoch": 0.1, "learning_rate": 0.0019748337517113833, "loss": 2.5051, "step": 3700 }, { "epoch": 0.1, "learning_rate": 0.0019748143441036354, "loss": 2.5345, "step": 3701 }, { "epoch": 0.1, "learning_rate": 0.0019747949291108674, "loss": 2.7051, "step": 3702 }, { "epoch": 0.1, "learning_rate": 0.001974775506733228, "loss": 2.7832, "step": 3703 }, { "epoch": 0.1, "learning_rate": 0.0019747560769708635, "loss": 3.1032, "step": 3704 }, { "epoch": 0.1, "learning_rate": 0.001974736639823921, "loss": 2.56, "step": 3705 }, { "epoch": 0.1, "learning_rate": 0.001974717195292548, "loss": 2.55, "step": 3706 }, { "epoch": 0.1, "learning_rate": 0.001974697743376892, "loss": 2.4353, "step": 3707 }, { "epoch": 0.1, "learning_rate": 0.0019746782840771, "loss": 2.6697, "step": 3708 }, { "epoch": 0.1, "learning_rate": 0.00197465881739332, "loss": 2.6396, "step": 3709 }, { "epoch": 0.1, "learning_rate": 0.0019746393433256984, "loss": 2.604, "step": 3710 }, { "epoch": 0.1, "learning_rate": 0.001974619861874384, "loss": 2.6403, "step": 3711 }, { "epoch": 0.1, "learning_rate": 0.0019746003730395233, "loss": 2.5211, "step": 3712 }, { "epoch": 0.1, "learning_rate": 0.0019745808768212646, "loss": 2.9048, "step": 3713 }, { "epoch": 0.1, "learning_rate": 0.0019745613732197556, "loss": 2.283, "step": 3714 }, { "epoch": 0.1, "learning_rate": 0.0019745418622351438, "loss": 2.435, "step": 3715 }, { "epoch": 0.1, "learning_rate": 0.0019745223438675766, "loss": 2.937, "step": 3716 }, { "epoch": 0.1, "learning_rate": 0.001974502818117203, "loss": 2.5875, "step": 3717 }, { "epoch": 0.1, "learning_rate": 0.00197448328498417, "loss": 3.1378, "step": 3718 }, { "epoch": 0.1, "learning_rate": 0.0019744637444686257, "loss": 2.3728, "step": 3719 }, { "epoch": 0.1, "learning_rate": 0.0019744441965707186, "loss": 2.6097, "step": 3720 }, { "epoch": 0.1, "learning_rate": 0.0019744246412905964, "loss": 2.6972, "step": 3721 }, { "epoch": 0.1, "learning_rate": 0.001974405078628407, "loss": 2.7003, "step": 3722 }, { "epoch": 0.1, "learning_rate": 0.001974385508584299, "loss": 2.5566, "step": 3723 }, { "epoch": 0.1, "learning_rate": 0.001974365931158421, "loss": 2.6897, "step": 3724 }, { "epoch": 0.1, "learning_rate": 0.0019743463463509207, "loss": 2.3781, "step": 3725 }, { "epoch": 0.1, "learning_rate": 0.0019743267541619466, "loss": 2.8132, "step": 3726 }, { "epoch": 0.1, "learning_rate": 0.001974307154591647, "loss": 2.7189, "step": 3727 }, { "epoch": 0.1, "learning_rate": 0.001974287547640171, "loss": 3.0036, "step": 3728 }, { "epoch": 0.1, "learning_rate": 0.0019742679333076664, "loss": 2.675, "step": 3729 }, { "epoch": 0.1, "learning_rate": 0.0019742483115942826, "loss": 2.6532, "step": 3730 }, { "epoch": 0.1, "learning_rate": 0.0019742286825001672, "loss": 2.7968, "step": 3731 }, { "epoch": 0.1, "learning_rate": 0.0019742090460254697, "loss": 2.918, "step": 3732 }, { "epoch": 0.1, "learning_rate": 0.001974189402170339, "loss": 2.5983, "step": 3733 }, { "epoch": 0.1, "learning_rate": 0.001974169750934923, "loss": 2.7061, "step": 3734 }, { "epoch": 0.1, "learning_rate": 0.0019741500923193714, "loss": 2.7047, "step": 3735 }, { "epoch": 0.1, "learning_rate": 0.0019741304263238327, "loss": 2.5053, "step": 3736 }, { "epoch": 0.1, "learning_rate": 0.0019741107529484565, "loss": 3.228, "step": 3737 }, { "epoch": 0.1, "learning_rate": 0.001974091072193391, "loss": 3.0013, "step": 3738 }, { "epoch": 0.1, "learning_rate": 0.0019740713840587856, "loss": 2.8119, "step": 3739 }, { "epoch": 0.1, "learning_rate": 0.00197405168854479, "loss": 2.5979, "step": 3740 }, { "epoch": 0.1, "learning_rate": 0.0019740319856515524, "loss": 2.9975, "step": 3741 }, { "epoch": 0.1, "learning_rate": 0.0019740122753792227, "loss": 2.8437, "step": 3742 }, { "epoch": 0.1, "learning_rate": 0.0019739925577279506, "loss": 2.7891, "step": 3743 }, { "epoch": 0.1, "learning_rate": 0.0019739728326978847, "loss": 2.9642, "step": 3744 }, { "epoch": 0.1, "learning_rate": 0.0019739531002891746, "loss": 2.7991, "step": 3745 }, { "epoch": 0.1, "learning_rate": 0.00197393336050197, "loss": 2.5063, "step": 3746 }, { "epoch": 0.1, "learning_rate": 0.0019739136133364206, "loss": 2.4838, "step": 3747 }, { "epoch": 0.1, "learning_rate": 0.0019738938587926754, "loss": 2.423, "step": 3748 }, { "epoch": 0.1, "learning_rate": 0.001973874096870885, "loss": 2.2922, "step": 3749 }, { "epoch": 0.1, "learning_rate": 0.001973854327571198, "loss": 2.5371, "step": 3750 }, { "epoch": 0.1, "learning_rate": 0.0019738345508937653, "loss": 2.5933, "step": 3751 }, { "epoch": 0.1, "learning_rate": 0.0019738147668387357, "loss": 2.8771, "step": 3752 }, { "epoch": 0.1, "learning_rate": 0.0019737949754062597, "loss": 2.6363, "step": 3753 }, { "epoch": 0.1, "learning_rate": 0.001973775176596487, "loss": 2.7027, "step": 3754 }, { "epoch": 0.1, "learning_rate": 0.001973755370409568, "loss": 2.681, "step": 3755 }, { "epoch": 0.1, "learning_rate": 0.001973735556845652, "loss": 2.7704, "step": 3756 }, { "epoch": 0.1, "learning_rate": 0.0019737157359048896, "loss": 2.5669, "step": 3757 }, { "epoch": 0.1, "learning_rate": 0.0019736959075874307, "loss": 2.6242, "step": 3758 }, { "epoch": 0.1, "learning_rate": 0.001973676071893426, "loss": 2.8497, "step": 3759 }, { "epoch": 0.1, "learning_rate": 0.001973656228823025, "loss": 2.7095, "step": 3760 }, { "epoch": 0.1, "learning_rate": 0.001973636378376379, "loss": 2.7096, "step": 3761 }, { "epoch": 0.1, "learning_rate": 0.0019736165205536376, "loss": 2.7929, "step": 3762 }, { "epoch": 0.1, "learning_rate": 0.0019735966553549515, "loss": 2.4498, "step": 3763 }, { "epoch": 0.1, "learning_rate": 0.0019735767827804714, "loss": 2.2574, "step": 3764 }, { "epoch": 0.1, "learning_rate": 0.0019735569028303474, "loss": 2.8402, "step": 3765 }, { "epoch": 0.1, "learning_rate": 0.0019735370155047303, "loss": 2.7802, "step": 3766 }, { "epoch": 0.1, "learning_rate": 0.0019735171208037712, "loss": 2.5589, "step": 3767 }, { "epoch": 0.1, "learning_rate": 0.0019734972187276205, "loss": 2.8727, "step": 3768 }, { "epoch": 0.1, "learning_rate": 0.0019734773092764286, "loss": 2.5441, "step": 3769 }, { "epoch": 0.1, "learning_rate": 0.0019734573924503466, "loss": 2.7023, "step": 3770 }, { "epoch": 0.1, "learning_rate": 0.0019734374682495257, "loss": 2.4078, "step": 3771 }, { "epoch": 0.1, "learning_rate": 0.0019734175366741165, "loss": 2.5407, "step": 3772 }, { "epoch": 0.1, "learning_rate": 0.00197339759772427, "loss": 2.6635, "step": 3773 }, { "epoch": 0.1, "learning_rate": 0.001973377651400137, "loss": 3.07, "step": 3774 }, { "epoch": 0.1, "learning_rate": 0.001973357697701869, "loss": 3.046, "step": 3775 }, { "epoch": 0.1, "learning_rate": 0.001973337736629618, "loss": 2.5863, "step": 3776 }, { "epoch": 0.1, "learning_rate": 0.0019733177681835333, "loss": 3.0306, "step": 3777 }, { "epoch": 0.1, "learning_rate": 0.0019732977923637676, "loss": 2.8504, "step": 3778 }, { "epoch": 0.1, "learning_rate": 0.001973277809170472, "loss": 3.1917, "step": 3779 }, { "epoch": 0.1, "learning_rate": 0.0019732578186037976, "loss": 2.9354, "step": 3780 }, { "epoch": 0.1, "learning_rate": 0.001973237820663896, "loss": 2.9629, "step": 3781 }, { "epoch": 0.1, "learning_rate": 0.0019732178153509185, "loss": 2.4689, "step": 3782 }, { "epoch": 0.1, "learning_rate": 0.0019731978026650164, "loss": 2.773, "step": 3783 }, { "epoch": 0.1, "learning_rate": 0.0019731777826063426, "loss": 3.0704, "step": 3784 }, { "epoch": 0.1, "learning_rate": 0.0019731577551750476, "loss": 2.6557, "step": 3785 }, { "epoch": 0.1, "learning_rate": 0.0019731377203712833, "loss": 3.0488, "step": 3786 }, { "epoch": 0.1, "learning_rate": 0.0019731176781952017, "loss": 2.6429, "step": 3787 }, { "epoch": 0.1, "learning_rate": 0.0019730976286469544, "loss": 2.5124, "step": 3788 }, { "epoch": 0.1, "learning_rate": 0.0019730775717266935, "loss": 3.0608, "step": 3789 }, { "epoch": 0.1, "learning_rate": 0.001973057507434571, "loss": 2.8139, "step": 3790 }, { "epoch": 0.1, "learning_rate": 0.001973037435770739, "loss": 2.6874, "step": 3791 }, { "epoch": 0.1, "learning_rate": 0.001973017356735349, "loss": 2.7301, "step": 3792 }, { "epoch": 0.1, "learning_rate": 0.0019729972703285536, "loss": 2.9444, "step": 3793 }, { "epoch": 0.1, "learning_rate": 0.0019729771765505046, "loss": 2.5938, "step": 3794 }, { "epoch": 0.1, "learning_rate": 0.0019729570754013544, "loss": 2.6871, "step": 3795 }, { "epoch": 0.1, "learning_rate": 0.001972936966881256, "loss": 2.9573, "step": 3796 }, { "epoch": 0.1, "learning_rate": 0.0019729168509903606, "loss": 2.609, "step": 3797 }, { "epoch": 0.1, "learning_rate": 0.0019728967277288212, "loss": 3.0289, "step": 3798 }, { "epoch": 0.1, "learning_rate": 0.00197287659709679, "loss": 2.7866, "step": 3799 }, { "epoch": 0.1, "learning_rate": 0.00197285645909442, "loss": 2.6575, "step": 3800 }, { "epoch": 0.1, "learning_rate": 0.001972836313721863, "loss": 2.8467, "step": 3801 }, { "epoch": 0.1, "learning_rate": 0.001972816160979272, "loss": 2.564, "step": 3802 }, { "epoch": 0.1, "learning_rate": 0.0019727960008668, "loss": 2.8832, "step": 3803 }, { "epoch": 0.1, "learning_rate": 0.001972775833384599, "loss": 2.5141, "step": 3804 }, { "epoch": 0.1, "learning_rate": 0.001972755658532823, "loss": 3.011, "step": 3805 }, { "epoch": 0.1, "learning_rate": 0.001972735476311623, "loss": 2.8623, "step": 3806 }, { "epoch": 0.1, "learning_rate": 0.0019727152867211536, "loss": 2.514, "step": 3807 }, { "epoch": 0.1, "learning_rate": 0.001972695089761567, "loss": 2.9469, "step": 3808 }, { "epoch": 0.1, "learning_rate": 0.001972674885433016, "loss": 2.6253, "step": 3809 }, { "epoch": 0.1, "learning_rate": 0.0019726546737356544, "loss": 3.0176, "step": 3810 }, { "epoch": 0.1, "learning_rate": 0.001972634454669635, "loss": 2.4761, "step": 3811 }, { "epoch": 0.1, "learning_rate": 0.00197261422823511, "loss": 2.7074, "step": 3812 }, { "epoch": 0.1, "learning_rate": 0.0019725939944322344, "loss": 2.9192, "step": 3813 }, { "epoch": 0.1, "learning_rate": 0.00197257375326116, "loss": 3.1217, "step": 3814 }, { "epoch": 0.1, "learning_rate": 0.0019725535047220412, "loss": 2.9312, "step": 3815 }, { "epoch": 0.1, "learning_rate": 0.0019725332488150305, "loss": 2.66, "step": 3816 }, { "epoch": 0.1, "learning_rate": 0.001972512985540282, "loss": 3.098, "step": 3817 }, { "epoch": 0.1, "learning_rate": 0.0019724927148979487, "loss": 2.6286, "step": 3818 }, { "epoch": 0.1, "learning_rate": 0.0019724724368881848, "loss": 2.6719, "step": 3819 }, { "epoch": 0.1, "learning_rate": 0.0019724521515111434, "loss": 2.7526, "step": 3820 }, { "epoch": 0.1, "learning_rate": 0.0019724318587669787, "loss": 2.5664, "step": 3821 }, { "epoch": 0.1, "learning_rate": 0.0019724115586558437, "loss": 2.7999, "step": 3822 }, { "epoch": 0.1, "learning_rate": 0.0019723912511778927, "loss": 2.5216, "step": 3823 }, { "epoch": 0.1, "learning_rate": 0.0019723709363332798, "loss": 2.5929, "step": 3824 }, { "epoch": 0.1, "learning_rate": 0.0019723506141221575, "loss": 2.2088, "step": 3825 }, { "epoch": 0.1, "learning_rate": 0.0019723302845446817, "loss": 2.5433, "step": 3826 }, { "epoch": 0.1, "learning_rate": 0.0019723099476010053, "loss": 2.8892, "step": 3827 }, { "epoch": 0.1, "learning_rate": 0.0019722896032912823, "loss": 2.6668, "step": 3828 }, { "epoch": 0.1, "learning_rate": 0.0019722692516156676, "loss": 2.638, "step": 3829 }, { "epoch": 0.1, "learning_rate": 0.0019722488925743146, "loss": 2.7673, "step": 3830 }, { "epoch": 0.1, "learning_rate": 0.001972228526167378, "loss": 2.839, "step": 3831 }, { "epoch": 0.1, "learning_rate": 0.0019722081523950116, "loss": 2.3761, "step": 3832 }, { "epoch": 0.1, "learning_rate": 0.00197218777125737, "loss": 2.729, "step": 3833 }, { "epoch": 0.1, "learning_rate": 0.001972167382754608, "loss": 2.9008, "step": 3834 }, { "epoch": 0.1, "learning_rate": 0.0019721469868868792, "loss": 2.7321, "step": 3835 }, { "epoch": 0.1, "learning_rate": 0.001972126583654339, "loss": 2.962, "step": 3836 }, { "epoch": 0.1, "learning_rate": 0.0019721061730571415, "loss": 2.7155, "step": 3837 }, { "epoch": 0.1, "learning_rate": 0.0019720857550954416, "loss": 3.0108, "step": 3838 }, { "epoch": 0.1, "learning_rate": 0.001972065329769394, "loss": 2.7363, "step": 3839 }, { "epoch": 0.1, "learning_rate": 0.0019720448970791528, "loss": 2.7022, "step": 3840 }, { "epoch": 0.1, "learning_rate": 0.0019720244570248734, "loss": 2.6459, "step": 3841 }, { "epoch": 0.1, "learning_rate": 0.0019720040096067107, "loss": 2.7754, "step": 3842 }, { "epoch": 0.1, "learning_rate": 0.001971983554824819, "loss": 3.3519, "step": 3843 }, { "epoch": 0.1, "learning_rate": 0.001971963092679354, "loss": 2.242, "step": 3844 }, { "epoch": 0.1, "learning_rate": 0.00197194262317047, "loss": 2.5123, "step": 3845 }, { "epoch": 0.1, "learning_rate": 0.001971922146298323, "loss": 2.7886, "step": 3846 }, { "epoch": 0.1, "learning_rate": 0.001971901662063067, "loss": 2.606, "step": 3847 }, { "epoch": 0.1, "learning_rate": 0.001971881170464858, "loss": 2.7318, "step": 3848 }, { "epoch": 0.1, "learning_rate": 0.001971860671503851, "loss": 2.8758, "step": 3849 }, { "epoch": 0.1, "learning_rate": 0.0019718401651802014, "loss": 2.3118, "step": 3850 }, { "epoch": 0.1, "learning_rate": 0.0019718196514940645, "loss": 2.4613, "step": 3851 }, { "epoch": 0.1, "learning_rate": 0.0019717991304455955, "loss": 2.7744, "step": 3852 }, { "epoch": 0.1, "learning_rate": 0.0019717786020349505, "loss": 2.6368, "step": 3853 }, { "epoch": 0.1, "learning_rate": 0.001971758066262284, "loss": 3.0287, "step": 3854 }, { "epoch": 0.1, "learning_rate": 0.0019717375231277524, "loss": 2.7712, "step": 3855 }, { "epoch": 0.1, "learning_rate": 0.0019717169726315106, "loss": 2.8508, "step": 3856 }, { "epoch": 0.1, "learning_rate": 0.001971696414773715, "loss": 2.5043, "step": 3857 }, { "epoch": 0.1, "learning_rate": 0.0019716758495545213, "loss": 2.8228, "step": 3858 }, { "epoch": 0.1, "learning_rate": 0.0019716552769740853, "loss": 3.1688, "step": 3859 }, { "epoch": 0.1, "learning_rate": 0.001971634697032562, "loss": 2.7173, "step": 3860 }, { "epoch": 0.1, "learning_rate": 0.0019716141097301083, "loss": 3.0184, "step": 3861 }, { "epoch": 0.1, "learning_rate": 0.00197159351506688, "loss": 2.7895, "step": 3862 }, { "epoch": 0.1, "learning_rate": 0.0019715729130430322, "loss": 2.9741, "step": 3863 }, { "epoch": 0.1, "learning_rate": 0.0019715523036587224, "loss": 2.7146, "step": 3864 }, { "epoch": 0.1, "learning_rate": 0.0019715316869141058, "loss": 2.7196, "step": 3865 }, { "epoch": 0.1, "learning_rate": 0.001971511062809339, "loss": 2.6929, "step": 3866 }, { "epoch": 0.1, "learning_rate": 0.001971490431344578, "loss": 2.7525, "step": 3867 }, { "epoch": 0.1, "learning_rate": 0.001971469792519979, "loss": 2.565, "step": 3868 }, { "epoch": 0.1, "learning_rate": 0.001971449146335699, "loss": 2.5747, "step": 3869 }, { "epoch": 0.1, "learning_rate": 0.0019714284927918936, "loss": 3.188, "step": 3870 }, { "epoch": 0.1, "learning_rate": 0.0019714078318887195, "loss": 2.5226, "step": 3871 }, { "epoch": 0.1, "learning_rate": 0.0019713871636263336, "loss": 2.9131, "step": 3872 }, { "epoch": 0.1, "learning_rate": 0.0019713664880048917, "loss": 3.0823, "step": 3873 }, { "epoch": 0.1, "learning_rate": 0.0019713458050245516, "loss": 2.4563, "step": 3874 }, { "epoch": 0.1, "learning_rate": 0.001971325114685469, "loss": 2.5388, "step": 3875 }, { "epoch": 0.1, "learning_rate": 0.0019713044169878007, "loss": 2.8673, "step": 3876 }, { "epoch": 0.1, "learning_rate": 0.0019712837119317045, "loss": 2.7757, "step": 3877 }, { "epoch": 0.1, "learning_rate": 0.001971262999517336, "loss": 2.8708, "step": 3878 }, { "epoch": 0.1, "learning_rate": 0.001971242279744853, "loss": 2.6878, "step": 3879 }, { "epoch": 0.1, "learning_rate": 0.001971221552614412, "loss": 2.5372, "step": 3880 }, { "epoch": 0.1, "learning_rate": 0.00197120081812617, "loss": 2.5212, "step": 3881 }, { "epoch": 0.1, "learning_rate": 0.0019711800762802845, "loss": 2.3367, "step": 3882 }, { "epoch": 0.1, "learning_rate": 0.0019711593270769125, "loss": 2.7207, "step": 3883 }, { "epoch": 0.1, "learning_rate": 0.0019711385705162105, "loss": 2.6275, "step": 3884 }, { "epoch": 0.1, "learning_rate": 0.001971117806598337, "loss": 2.5372, "step": 3885 }, { "epoch": 0.1, "learning_rate": 0.001971097035323448, "loss": 2.9552, "step": 3886 }, { "epoch": 0.1, "learning_rate": 0.0019710762566917017, "loss": 2.4136, "step": 3887 }, { "epoch": 0.1, "learning_rate": 0.0019710554707032552, "loss": 2.9792, "step": 3888 }, { "epoch": 0.1, "learning_rate": 0.0019710346773582662, "loss": 2.7148, "step": 3889 }, { "epoch": 0.1, "learning_rate": 0.0019710138766568922, "loss": 2.9957, "step": 3890 }, { "epoch": 0.1, "learning_rate": 0.0019709930685992906, "loss": 2.7243, "step": 3891 }, { "epoch": 0.1, "learning_rate": 0.001970972253185619, "loss": 2.6497, "step": 3892 }, { "epoch": 0.1, "learning_rate": 0.001970951430416035, "loss": 2.6108, "step": 3893 }, { "epoch": 0.1, "learning_rate": 0.001970930600290697, "loss": 2.7509, "step": 3894 }, { "epoch": 0.1, "learning_rate": 0.0019709097628097623, "loss": 2.5713, "step": 3895 }, { "epoch": 0.1, "learning_rate": 0.0019708889179733883, "loss": 2.8088, "step": 3896 }, { "epoch": 0.1, "learning_rate": 0.001970868065781734, "loss": 2.6517, "step": 3897 }, { "epoch": 0.1, "learning_rate": 0.0019708472062349566, "loss": 2.4484, "step": 3898 }, { "epoch": 0.1, "learning_rate": 0.0019708263393332145, "loss": 2.5359, "step": 3899 }, { "epoch": 0.1, "learning_rate": 0.0019708054650766655, "loss": 2.3877, "step": 3900 }, { "epoch": 0.1, "learning_rate": 0.001970784583465468, "loss": 2.9918, "step": 3901 }, { "epoch": 0.1, "learning_rate": 0.0019707636944997797, "loss": 2.8554, "step": 3902 }, { "epoch": 0.1, "learning_rate": 0.0019707427981797594, "loss": 2.5433, "step": 3903 }, { "epoch": 0.1, "learning_rate": 0.0019707218945055655, "loss": 2.782, "step": 3904 }, { "epoch": 0.1, "learning_rate": 0.0019707009834773557, "loss": 2.6606, "step": 3905 }, { "epoch": 0.1, "learning_rate": 0.001970680065095289, "loss": 2.5514, "step": 3906 }, { "epoch": 0.1, "learning_rate": 0.001970659139359523, "loss": 2.7811, "step": 3907 }, { "epoch": 0.11, "learning_rate": 0.0019706382062702177, "loss": 2.9513, "step": 3908 }, { "epoch": 0.11, "learning_rate": 0.0019706172658275306, "loss": 2.3522, "step": 3909 }, { "epoch": 0.11, "learning_rate": 0.001970596318031621, "loss": 3.1914, "step": 3910 }, { "epoch": 0.11, "learning_rate": 0.0019705753628826467, "loss": 2.5546, "step": 3911 }, { "epoch": 0.11, "learning_rate": 0.001970554400380767, "loss": 2.672, "step": 3912 }, { "epoch": 0.11, "learning_rate": 0.0019705334305261412, "loss": 2.5872, "step": 3913 }, { "epoch": 0.11, "learning_rate": 0.0019705124533189273, "loss": 2.8501, "step": 3914 }, { "epoch": 0.11, "learning_rate": 0.0019704914687592844, "loss": 2.6689, "step": 3915 }, { "epoch": 0.11, "learning_rate": 0.0019704704768473717, "loss": 2.7835, "step": 3916 }, { "epoch": 0.11, "learning_rate": 0.0019704494775833483, "loss": 2.5735, "step": 3917 }, { "epoch": 0.11, "learning_rate": 0.0019704284709673734, "loss": 2.4801, "step": 3918 }, { "epoch": 0.11, "learning_rate": 0.0019704074569996052, "loss": 2.5879, "step": 3919 }, { "epoch": 0.11, "learning_rate": 0.0019703864356802043, "loss": 2.6092, "step": 3920 }, { "epoch": 0.11, "learning_rate": 0.0019703654070093285, "loss": 2.4858, "step": 3921 }, { "epoch": 0.11, "learning_rate": 0.0019703443709871388, "loss": 2.4977, "step": 3922 }, { "epoch": 0.11, "learning_rate": 0.0019703233276137933, "loss": 2.3978, "step": 3923 }, { "epoch": 0.11, "learning_rate": 0.001970302276889451, "loss": 2.7489, "step": 3924 }, { "epoch": 0.11, "learning_rate": 0.001970281218814273, "loss": 2.8111, "step": 3925 }, { "epoch": 0.11, "learning_rate": 0.0019702601533884176, "loss": 3.1057, "step": 3926 }, { "epoch": 0.11, "learning_rate": 0.0019702390806120447, "loss": 2.7114, "step": 3927 }, { "epoch": 0.11, "learning_rate": 0.001970218000485314, "loss": 2.8235, "step": 3928 }, { "epoch": 0.11, "learning_rate": 0.0019701969130083855, "loss": 2.6274, "step": 3929 }, { "epoch": 0.11, "learning_rate": 0.0019701758181814182, "loss": 2.7155, "step": 3930 }, { "epoch": 0.11, "learning_rate": 0.001970154716004573, "loss": 2.8755, "step": 3931 }, { "epoch": 0.11, "learning_rate": 0.001970133606478009, "loss": 2.795, "step": 3932 }, { "epoch": 0.11, "learning_rate": 0.0019701124896018855, "loss": 2.6538, "step": 3933 }, { "epoch": 0.11, "learning_rate": 0.001970091365376364, "loss": 2.9054, "step": 3934 }, { "epoch": 0.11, "learning_rate": 0.001970070233801603, "loss": 2.8375, "step": 3935 }, { "epoch": 0.11, "learning_rate": 0.0019700490948777643, "loss": 2.6882, "step": 3936 }, { "epoch": 0.11, "learning_rate": 0.0019700279486050062, "loss": 2.9148, "step": 3937 }, { "epoch": 0.11, "learning_rate": 0.0019700067949834903, "loss": 2.5444, "step": 3938 }, { "epoch": 0.11, "learning_rate": 0.001969985634013376, "loss": 2.6947, "step": 3939 }, { "epoch": 0.11, "learning_rate": 0.0019699644656948245, "loss": 2.575, "step": 3940 }, { "epoch": 0.11, "learning_rate": 0.001969943290027995, "loss": 2.7916, "step": 3941 }, { "epoch": 0.11, "learning_rate": 0.001969922107013049, "loss": 3.2148, "step": 3942 }, { "epoch": 0.11, "learning_rate": 0.001969900916650146, "loss": 2.4603, "step": 3943 }, { "epoch": 0.11, "learning_rate": 0.001969879718939448, "loss": 2.583, "step": 3944 }, { "epoch": 0.11, "learning_rate": 0.0019698585138811136, "loss": 2.6785, "step": 3945 }, { "epoch": 0.11, "learning_rate": 0.0019698373014753047, "loss": 2.737, "step": 3946 }, { "epoch": 0.11, "learning_rate": 0.001969816081722182, "loss": 2.3571, "step": 3947 }, { "epoch": 0.11, "learning_rate": 0.0019697948546219066, "loss": 2.8586, "step": 3948 }, { "epoch": 0.11, "learning_rate": 0.001969773620174638, "loss": 2.7753, "step": 3949 }, { "epoch": 0.11, "learning_rate": 0.0019697523783805382, "loss": 2.7667, "step": 3950 }, { "epoch": 0.11, "learning_rate": 0.0019697311292397675, "loss": 2.7592, "step": 3951 }, { "epoch": 0.11, "learning_rate": 0.001969709872752487, "loss": 2.6289, "step": 3952 }, { "epoch": 0.11, "learning_rate": 0.0019696886089188587, "loss": 2.4753, "step": 3953 }, { "epoch": 0.11, "learning_rate": 0.001969667337739042, "loss": 2.7792, "step": 3954 }, { "epoch": 0.11, "learning_rate": 0.0019696460592131993, "loss": 2.7146, "step": 3955 }, { "epoch": 0.11, "learning_rate": 0.0019696247733414912, "loss": 2.3826, "step": 3956 }, { "epoch": 0.11, "learning_rate": 0.0019696034801240793, "loss": 2.6464, "step": 3957 }, { "epoch": 0.11, "learning_rate": 0.0019695821795611248, "loss": 2.5569, "step": 3958 }, { "epoch": 0.11, "learning_rate": 0.001969560871652789, "loss": 2.8666, "step": 3959 }, { "epoch": 0.11, "learning_rate": 0.0019695395563992337, "loss": 2.7972, "step": 3960 }, { "epoch": 0.11, "learning_rate": 0.00196951823380062, "loss": 2.3853, "step": 3961 }, { "epoch": 0.11, "learning_rate": 0.001969496903857109, "loss": 3.128, "step": 3962 }, { "epoch": 0.11, "learning_rate": 0.001969475566568863, "loss": 2.7446, "step": 3963 }, { "epoch": 0.11, "learning_rate": 0.001969454221936043, "loss": 2.6005, "step": 3964 }, { "epoch": 0.11, "learning_rate": 0.001969432869958812, "loss": 2.5167, "step": 3965 }, { "epoch": 0.11, "learning_rate": 0.0019694115106373305, "loss": 2.5858, "step": 3966 }, { "epoch": 0.11, "learning_rate": 0.0019693901439717604, "loss": 2.8855, "step": 3967 }, { "epoch": 0.11, "learning_rate": 0.0019693687699622645, "loss": 2.5559, "step": 3968 }, { "epoch": 0.11, "learning_rate": 0.0019693473886090037, "loss": 3.0925, "step": 3969 }, { "epoch": 0.11, "learning_rate": 0.0019693259999121406, "loss": 2.7439, "step": 3970 }, { "epoch": 0.11, "learning_rate": 0.001969304603871837, "loss": 2.8309, "step": 3971 }, { "epoch": 0.11, "learning_rate": 0.001969283200488255, "loss": 2.4401, "step": 3972 }, { "epoch": 0.11, "learning_rate": 0.0019692617897615564, "loss": 2.5142, "step": 3973 }, { "epoch": 0.11, "learning_rate": 0.001969240371691904, "loss": 2.5091, "step": 3974 }, { "epoch": 0.11, "learning_rate": 0.00196921894627946, "loss": 2.9595, "step": 3975 }, { "epoch": 0.11, "learning_rate": 0.0019691975135243864, "loss": 2.4279, "step": 3976 }, { "epoch": 0.11, "learning_rate": 0.001969176073426846, "loss": 3.036, "step": 3977 }, { "epoch": 0.11, "learning_rate": 0.0019691546259870004, "loss": 2.6307, "step": 3978 }, { "epoch": 0.11, "learning_rate": 0.001969133171205013, "loss": 2.5996, "step": 3979 }, { "epoch": 0.11, "learning_rate": 0.001969111709081046, "loss": 2.8679, "step": 3980 }, { "epoch": 0.11, "learning_rate": 0.001969090239615262, "loss": 2.7869, "step": 3981 }, { "epoch": 0.11, "learning_rate": 0.001969068762807823, "loss": 2.7044, "step": 3982 }, { "epoch": 0.11, "learning_rate": 0.001969047278658893, "loss": 3.0272, "step": 3983 }, { "epoch": 0.11, "learning_rate": 0.0019690257871686338, "loss": 2.9025, "step": 3984 }, { "epoch": 0.11, "learning_rate": 0.001969004288337208, "loss": 2.8075, "step": 3985 }, { "epoch": 0.11, "learning_rate": 0.0019689827821647798, "loss": 2.9685, "step": 3986 }, { "epoch": 0.11, "learning_rate": 0.001968961268651511, "loss": 2.6924, "step": 3987 }, { "epoch": 0.11, "learning_rate": 0.0019689397477975646, "loss": 1.9863, "step": 3988 }, { "epoch": 0.11, "learning_rate": 0.001968918219603104, "loss": 2.6697, "step": 3989 }, { "epoch": 0.11, "learning_rate": 0.0019688966840682924, "loss": 2.5699, "step": 3990 }, { "epoch": 0.11, "learning_rate": 0.001968875141193293, "loss": 2.6645, "step": 3991 }, { "epoch": 0.11, "learning_rate": 0.001968853590978268, "loss": 2.8566, "step": 3992 }, { "epoch": 0.11, "learning_rate": 0.001968832033423382, "loss": 3.151, "step": 3993 }, { "epoch": 0.11, "learning_rate": 0.0019688104685287974, "loss": 2.931, "step": 3994 }, { "epoch": 0.11, "learning_rate": 0.001968788896294678, "loss": 2.3712, "step": 3995 }, { "epoch": 0.11, "learning_rate": 0.001968767316721187, "loss": 2.4833, "step": 3996 }, { "epoch": 0.11, "learning_rate": 0.001968745729808488, "loss": 2.4919, "step": 3997 }, { "epoch": 0.11, "learning_rate": 0.001968724135556745, "loss": 3.255, "step": 3998 }, { "epoch": 0.11, "learning_rate": 0.0019687025339661206, "loss": 2.7293, "step": 3999 }, { "epoch": 0.11, "learning_rate": 0.0019686809250367794, "loss": 2.8429, "step": 4000 }, { "epoch": 0.11, "learning_rate": 0.0019686593087688844, "loss": 2.361, "step": 4001 }, { "epoch": 0.11, "learning_rate": 0.0019686376851626, "loss": 2.7921, "step": 4002 }, { "epoch": 0.11, "learning_rate": 0.001968616054218089, "loss": 2.5492, "step": 4003 }, { "epoch": 0.11, "learning_rate": 0.0019685944159355167, "loss": 3.3509, "step": 4004 }, { "epoch": 0.11, "learning_rate": 0.001968572770315046, "loss": 2.5153, "step": 4005 }, { "epoch": 0.11, "learning_rate": 0.001968551117356841, "loss": 2.3114, "step": 4006 }, { "epoch": 0.11, "learning_rate": 0.001968529457061066, "loss": 2.4921, "step": 4007 }, { "epoch": 0.11, "learning_rate": 0.001968507789427885, "loss": 2.4667, "step": 4008 }, { "epoch": 0.11, "learning_rate": 0.0019684861144574624, "loss": 2.69, "step": 4009 }, { "epoch": 0.11, "learning_rate": 0.0019684644321499617, "loss": 2.8867, "step": 4010 }, { "epoch": 0.11, "learning_rate": 0.001968442742505548, "loss": 2.647, "step": 4011 }, { "epoch": 0.11, "learning_rate": 0.0019684210455243848, "loss": 2.7358, "step": 4012 }, { "epoch": 0.11, "learning_rate": 0.001968399341206637, "loss": 2.5823, "step": 4013 }, { "epoch": 0.11, "learning_rate": 0.001968377629552469, "loss": 2.8143, "step": 4014 }, { "epoch": 0.11, "learning_rate": 0.0019683559105620452, "loss": 2.9369, "step": 4015 }, { "epoch": 0.11, "learning_rate": 0.0019683341842355304, "loss": 2.8109, "step": 4016 }, { "epoch": 0.11, "learning_rate": 0.0019683124505730887, "loss": 2.5744, "step": 4017 }, { "epoch": 0.11, "learning_rate": 0.001968290709574885, "loss": 2.8999, "step": 4018 }, { "epoch": 0.11, "learning_rate": 0.001968268961241084, "loss": 2.5693, "step": 4019 }, { "epoch": 0.11, "learning_rate": 0.0019682472055718506, "loss": 2.7202, "step": 4020 }, { "epoch": 0.11, "learning_rate": 0.001968225442567349, "loss": 2.7522, "step": 4021 }, { "epoch": 0.11, "learning_rate": 0.0019682036722277452, "loss": 2.7295, "step": 4022 }, { "epoch": 0.11, "learning_rate": 0.001968181894553203, "loss": 2.7754, "step": 4023 }, { "epoch": 0.11, "learning_rate": 0.0019681601095438883, "loss": 2.3015, "step": 4024 }, { "epoch": 0.11, "learning_rate": 0.0019681383171999654, "loss": 3.3355, "step": 4025 }, { "epoch": 0.11, "learning_rate": 0.0019681165175215996, "loss": 2.8813, "step": 4026 }, { "epoch": 0.11, "learning_rate": 0.0019680947105089565, "loss": 2.6149, "step": 4027 }, { "epoch": 0.11, "learning_rate": 0.001968072896162201, "loss": 2.9465, "step": 4028 }, { "epoch": 0.11, "learning_rate": 0.001968051074481498, "loss": 2.6616, "step": 4029 }, { "epoch": 0.11, "learning_rate": 0.001968029245467013, "loss": 2.6283, "step": 4030 }, { "epoch": 0.11, "learning_rate": 0.001968007409118912, "loss": 2.5381, "step": 4031 }, { "epoch": 0.11, "learning_rate": 0.0019679855654373595, "loss": 2.8944, "step": 4032 }, { "epoch": 0.11, "learning_rate": 0.0019679637144225212, "loss": 2.7909, "step": 4033 }, { "epoch": 0.11, "learning_rate": 0.0019679418560745636, "loss": 2.67, "step": 4034 }, { "epoch": 0.11, "learning_rate": 0.001967919990393651, "loss": 2.8545, "step": 4035 }, { "epoch": 0.11, "learning_rate": 0.0019678981173799496, "loss": 3.0758, "step": 4036 }, { "epoch": 0.11, "learning_rate": 0.0019678762370336253, "loss": 3.0375, "step": 4037 }, { "epoch": 0.11, "learning_rate": 0.0019678543493548434, "loss": 2.6884, "step": 4038 }, { "epoch": 0.11, "learning_rate": 0.00196783245434377, "loss": 2.631, "step": 4039 }, { "epoch": 0.11, "learning_rate": 0.0019678105520005715, "loss": 2.06, "step": 4040 }, { "epoch": 0.11, "learning_rate": 0.001967788642325413, "loss": 2.3051, "step": 4041 }, { "epoch": 0.11, "learning_rate": 0.0019677667253184604, "loss": 2.8968, "step": 4042 }, { "epoch": 0.11, "learning_rate": 0.001967744800979881, "loss": 2.7402, "step": 4043 }, { "epoch": 0.11, "learning_rate": 0.0019677228693098393, "loss": 2.848, "step": 4044 }, { "epoch": 0.11, "learning_rate": 0.001967700930308502, "loss": 2.3838, "step": 4045 }, { "epoch": 0.11, "learning_rate": 0.001967678983976036, "loss": 3.0523, "step": 4046 }, { "epoch": 0.11, "learning_rate": 0.001967657030312607, "loss": 2.3007, "step": 4047 }, { "epoch": 0.11, "learning_rate": 0.001967635069318381, "loss": 2.8105, "step": 4048 }, { "epoch": 0.11, "learning_rate": 0.0019676131009935247, "loss": 2.6836, "step": 4049 }, { "epoch": 0.11, "learning_rate": 0.0019675911253382045, "loss": 2.6105, "step": 4050 }, { "epoch": 0.11, "learning_rate": 0.0019675691423525874, "loss": 2.6811, "step": 4051 }, { "epoch": 0.11, "learning_rate": 0.001967547152036839, "loss": 2.8277, "step": 4052 }, { "epoch": 0.11, "learning_rate": 0.0019675251543911265, "loss": 2.8404, "step": 4053 }, { "epoch": 0.11, "learning_rate": 0.0019675031494156164, "loss": 2.8386, "step": 4054 }, { "epoch": 0.11, "learning_rate": 0.0019674811371104754, "loss": 2.4026, "step": 4055 }, { "epoch": 0.11, "learning_rate": 0.00196745911747587, "loss": 2.7566, "step": 4056 }, { "epoch": 0.11, "learning_rate": 0.001967437090511968, "loss": 2.8881, "step": 4057 }, { "epoch": 0.11, "learning_rate": 0.001967415056218935, "loss": 2.9748, "step": 4058 }, { "epoch": 0.11, "learning_rate": 0.0019673930145969387, "loss": 3.0874, "step": 4059 }, { "epoch": 0.11, "learning_rate": 0.001967370965646146, "loss": 2.8055, "step": 4060 }, { "epoch": 0.11, "learning_rate": 0.0019673489093667237, "loss": 3.0702, "step": 4061 }, { "epoch": 0.11, "learning_rate": 0.001967326845758839, "loss": 2.7706, "step": 4062 }, { "epoch": 0.11, "learning_rate": 0.0019673047748226587, "loss": 2.9282, "step": 4063 }, { "epoch": 0.11, "learning_rate": 0.001967282696558351, "loss": 2.6312, "step": 4064 }, { "epoch": 0.11, "learning_rate": 0.001967260610966082, "loss": 2.5707, "step": 4065 }, { "epoch": 0.11, "learning_rate": 0.0019672385180460198, "loss": 2.882, "step": 4066 }, { "epoch": 0.11, "learning_rate": 0.0019672164177983315, "loss": 2.8277, "step": 4067 }, { "epoch": 0.11, "learning_rate": 0.001967194310223184, "loss": 2.5269, "step": 4068 }, { "epoch": 0.11, "learning_rate": 0.0019671721953207462, "loss": 2.9593, "step": 4069 }, { "epoch": 0.11, "learning_rate": 0.0019671500730911846, "loss": 2.8855, "step": 4070 }, { "epoch": 0.11, "learning_rate": 0.0019671279435346666, "loss": 2.8521, "step": 4071 }, { "epoch": 0.11, "learning_rate": 0.00196710580665136, "loss": 2.6078, "step": 4072 }, { "epoch": 0.11, "learning_rate": 0.0019670836624414334, "loss": 2.6982, "step": 4073 }, { "epoch": 0.11, "learning_rate": 0.0019670615109050535, "loss": 2.9498, "step": 4074 }, { "epoch": 0.11, "learning_rate": 0.0019670393520423886, "loss": 2.6894, "step": 4075 }, { "epoch": 0.11, "learning_rate": 0.001967017185853606, "loss": 2.664, "step": 4076 }, { "epoch": 0.11, "learning_rate": 0.0019669950123388747, "loss": 2.8176, "step": 4077 }, { "epoch": 0.11, "learning_rate": 0.001966972831498362, "loss": 2.4582, "step": 4078 }, { "epoch": 0.11, "learning_rate": 0.001966950643332236, "loss": 2.9981, "step": 4079 }, { "epoch": 0.11, "learning_rate": 0.0019669284478406645, "loss": 2.5615, "step": 4080 }, { "epoch": 0.11, "learning_rate": 0.001966906245023816, "loss": 2.7336, "step": 4081 }, { "epoch": 0.11, "learning_rate": 0.0019668840348818586, "loss": 2.6694, "step": 4082 }, { "epoch": 0.11, "learning_rate": 0.0019668618174149607, "loss": 2.8926, "step": 4083 }, { "epoch": 0.11, "learning_rate": 0.001966839592623291, "loss": 2.9567, "step": 4084 }, { "epoch": 0.11, "learning_rate": 0.0019668173605070166, "loss": 2.3516, "step": 4085 }, { "epoch": 0.11, "learning_rate": 0.001966795121066307, "loss": 2.7052, "step": 4086 }, { "epoch": 0.11, "learning_rate": 0.001966772874301331, "loss": 2.8789, "step": 4087 }, { "epoch": 0.11, "learning_rate": 0.0019667506202122554, "loss": 2.215, "step": 4088 }, { "epoch": 0.11, "learning_rate": 0.001966728358799251, "loss": 2.8705, "step": 4089 }, { "epoch": 0.11, "learning_rate": 0.0019667060900624847, "loss": 2.4846, "step": 4090 }, { "epoch": 0.11, "learning_rate": 0.0019666838140021264, "loss": 3.1049, "step": 4091 }, { "epoch": 0.11, "learning_rate": 0.001966661530618344, "loss": 2.7745, "step": 4092 }, { "epoch": 0.11, "learning_rate": 0.001966639239911307, "loss": 2.7043, "step": 4093 }, { "epoch": 0.11, "learning_rate": 0.0019666169418811837, "loss": 2.4567, "step": 4094 }, { "epoch": 0.11, "learning_rate": 0.0019665946365281435, "loss": 2.964, "step": 4095 }, { "epoch": 0.11, "learning_rate": 0.001966572323852355, "loss": 2.5549, "step": 4096 }, { "epoch": 0.11, "learning_rate": 0.001966550003853987, "loss": 2.8009, "step": 4097 }, { "epoch": 0.11, "learning_rate": 0.0019665276765332093, "loss": 2.6418, "step": 4098 }, { "epoch": 0.11, "learning_rate": 0.001966505341890191, "loss": 2.8178, "step": 4099 }, { "epoch": 0.11, "learning_rate": 0.0019664829999251005, "loss": 2.5994, "step": 4100 }, { "epoch": 0.11, "learning_rate": 0.001966460650638108, "loss": 2.7565, "step": 4101 }, { "epoch": 0.11, "learning_rate": 0.001966438294029382, "loss": 2.3563, "step": 4102 }, { "epoch": 0.11, "learning_rate": 0.001966415930099093, "loss": 2.6496, "step": 4103 }, { "epoch": 0.11, "learning_rate": 0.0019663935588474088, "loss": 2.5654, "step": 4104 }, { "epoch": 0.11, "learning_rate": 0.0019663711802745004, "loss": 2.6685, "step": 4105 }, { "epoch": 0.11, "learning_rate": 0.0019663487943805363, "loss": 2.6747, "step": 4106 }, { "epoch": 0.11, "learning_rate": 0.0019663264011656866, "loss": 2.7456, "step": 4107 }, { "epoch": 0.11, "learning_rate": 0.001966304000630121, "loss": 2.5347, "step": 4108 }, { "epoch": 0.11, "learning_rate": 0.001966281592774009, "loss": 2.6463, "step": 4109 }, { "epoch": 0.11, "learning_rate": 0.00196625917759752, "loss": 2.9455, "step": 4110 }, { "epoch": 0.11, "learning_rate": 0.001966236755100825, "loss": 2.6051, "step": 4111 }, { "epoch": 0.11, "learning_rate": 0.0019662143252840926, "loss": 2.673, "step": 4112 }, { "epoch": 0.11, "learning_rate": 0.0019661918881474934, "loss": 3.0062, "step": 4113 }, { "epoch": 0.11, "learning_rate": 0.001966169443691197, "loss": 2.4351, "step": 4114 }, { "epoch": 0.11, "learning_rate": 0.001966146991915374, "loss": 2.6621, "step": 4115 }, { "epoch": 0.11, "learning_rate": 0.0019661245328201934, "loss": 2.4298, "step": 4116 }, { "epoch": 0.11, "learning_rate": 0.001966102066405827, "loss": 2.8615, "step": 4117 }, { "epoch": 0.11, "learning_rate": 0.001966079592672443, "loss": 2.7932, "step": 4118 }, { "epoch": 0.11, "learning_rate": 0.0019660571116202137, "loss": 2.3771, "step": 4119 }, { "epoch": 0.11, "learning_rate": 0.0019660346232493082, "loss": 2.2696, "step": 4120 }, { "epoch": 0.11, "learning_rate": 0.001966012127559897, "loss": 3.0195, "step": 4121 }, { "epoch": 0.11, "learning_rate": 0.0019659896245521505, "loss": 2.7102, "step": 4122 }, { "epoch": 0.11, "learning_rate": 0.001965967114226239, "loss": 2.5567, "step": 4123 }, { "epoch": 0.11, "learning_rate": 0.001965944596582334, "loss": 2.5604, "step": 4124 }, { "epoch": 0.11, "learning_rate": 0.001965922071620605, "loss": 2.4826, "step": 4125 }, { "epoch": 0.11, "learning_rate": 0.0019658995393412237, "loss": 3.2779, "step": 4126 }, { "epoch": 0.11, "learning_rate": 0.0019658769997443594, "loss": 2.5075, "step": 4127 }, { "epoch": 0.11, "learning_rate": 0.001965854452830184, "loss": 2.9232, "step": 4128 }, { "epoch": 0.11, "learning_rate": 0.001965831898598868, "loss": 2.2104, "step": 4129 }, { "epoch": 0.11, "learning_rate": 0.001965809337050582, "loss": 2.7426, "step": 4130 }, { "epoch": 0.11, "learning_rate": 0.001965786768185497, "loss": 2.821, "step": 4131 }, { "epoch": 0.11, "learning_rate": 0.0019657641920037845, "loss": 2.9382, "step": 4132 }, { "epoch": 0.11, "learning_rate": 0.0019657416085056153, "loss": 2.698, "step": 4133 }, { "epoch": 0.11, "learning_rate": 0.00196571901769116, "loss": 2.6988, "step": 4134 }, { "epoch": 0.11, "learning_rate": 0.00196569641956059, "loss": 2.8803, "step": 4135 }, { "epoch": 0.11, "learning_rate": 0.0019656738141140767, "loss": 2.577, "step": 4136 }, { "epoch": 0.11, "learning_rate": 0.0019656512013517913, "loss": 3.0122, "step": 4137 }, { "epoch": 0.11, "learning_rate": 0.001965628581273905, "loss": 2.5766, "step": 4138 }, { "epoch": 0.11, "learning_rate": 0.0019656059538805887, "loss": 3.0298, "step": 4139 }, { "epoch": 0.11, "learning_rate": 0.001965583319172015, "loss": 2.9262, "step": 4140 }, { "epoch": 0.11, "learning_rate": 0.0019655606771483546, "loss": 3.0196, "step": 4141 }, { "epoch": 0.11, "learning_rate": 0.001965538027809779, "loss": 2.6223, "step": 4142 }, { "epoch": 0.11, "learning_rate": 0.00196551537115646, "loss": 2.8651, "step": 4143 }, { "epoch": 0.11, "learning_rate": 0.0019654927071885687, "loss": 2.7356, "step": 4144 }, { "epoch": 0.11, "learning_rate": 0.001965470035906278, "loss": 2.9693, "step": 4145 }, { "epoch": 0.11, "learning_rate": 0.0019654473573097585, "loss": 2.7759, "step": 4146 }, { "epoch": 0.11, "learning_rate": 0.0019654246713991827, "loss": 3.0127, "step": 4147 }, { "epoch": 0.11, "learning_rate": 0.001965401978174722, "loss": 2.4544, "step": 4148 }, { "epoch": 0.11, "learning_rate": 0.0019653792776365485, "loss": 2.8779, "step": 4149 }, { "epoch": 0.11, "learning_rate": 0.001965356569784834, "loss": 2.9446, "step": 4150 }, { "epoch": 0.11, "learning_rate": 0.0019653338546197514, "loss": 2.6758, "step": 4151 }, { "epoch": 0.11, "learning_rate": 0.0019653111321414713, "loss": 3.327, "step": 4152 }, { "epoch": 0.11, "learning_rate": 0.001965288402350167, "loss": 2.8579, "step": 4153 }, { "epoch": 0.11, "learning_rate": 0.0019652656652460105, "loss": 2.8152, "step": 4154 }, { "epoch": 0.11, "learning_rate": 0.0019652429208291736, "loss": 2.9962, "step": 4155 }, { "epoch": 0.11, "learning_rate": 0.001965220169099829, "loss": 2.5154, "step": 4156 }, { "epoch": 0.11, "learning_rate": 0.001965197410058149, "loss": 2.7232, "step": 4157 }, { "epoch": 0.11, "learning_rate": 0.001965174643704306, "loss": 2.5825, "step": 4158 }, { "epoch": 0.11, "learning_rate": 0.0019651518700384723, "loss": 2.8855, "step": 4159 }, { "epoch": 0.11, "learning_rate": 0.0019651290890608207, "loss": 2.5323, "step": 4160 }, { "epoch": 0.11, "learning_rate": 0.001965106300771524, "loss": 2.6513, "step": 4161 }, { "epoch": 0.11, "learning_rate": 0.001965083505170754, "loss": 2.541, "step": 4162 }, { "epoch": 0.11, "learning_rate": 0.0019650607022586837, "loss": 2.7446, "step": 4163 }, { "epoch": 0.11, "learning_rate": 0.0019650378920354865, "loss": 2.2837, "step": 4164 }, { "epoch": 0.11, "learning_rate": 0.001965015074501335, "loss": 2.5198, "step": 4165 }, { "epoch": 0.11, "learning_rate": 0.0019649922496564015, "loss": 3.1082, "step": 4166 }, { "epoch": 0.11, "learning_rate": 0.0019649694175008594, "loss": 2.7095, "step": 4167 }, { "epoch": 0.11, "learning_rate": 0.001964946578034881, "loss": 2.7443, "step": 4168 }, { "epoch": 0.11, "learning_rate": 0.0019649237312586404, "loss": 2.6527, "step": 4169 }, { "epoch": 0.11, "learning_rate": 0.00196490087717231, "loss": 2.7809, "step": 4170 }, { "epoch": 0.11, "learning_rate": 0.001964878015776063, "loss": 2.3233, "step": 4171 }, { "epoch": 0.11, "learning_rate": 0.0019648551470700724, "loss": 2.7555, "step": 4172 }, { "epoch": 0.11, "learning_rate": 0.0019648322710545123, "loss": 2.2599, "step": 4173 }, { "epoch": 0.11, "learning_rate": 0.001964809387729555, "loss": 2.492, "step": 4174 }, { "epoch": 0.11, "learning_rate": 0.0019647864970953745, "loss": 2.9513, "step": 4175 }, { "epoch": 0.11, "learning_rate": 0.0019647635991521437, "loss": 3.2608, "step": 4176 }, { "epoch": 0.11, "learning_rate": 0.0019647406939000364, "loss": 2.8, "step": 4177 }, { "epoch": 0.11, "learning_rate": 0.001964717781339226, "loss": 2.5955, "step": 4178 }, { "epoch": 0.11, "learning_rate": 0.0019646948614698866, "loss": 2.7331, "step": 4179 }, { "epoch": 0.11, "learning_rate": 0.0019646719342921912, "loss": 2.5685, "step": 4180 }, { "epoch": 0.11, "learning_rate": 0.0019646489998063135, "loss": 2.8386, "step": 4181 }, { "epoch": 0.11, "learning_rate": 0.0019646260580124275, "loss": 2.5583, "step": 4182 }, { "epoch": 0.11, "learning_rate": 0.001964603108910707, "loss": 2.5114, "step": 4183 }, { "epoch": 0.11, "learning_rate": 0.001964580152501326, "loss": 2.7362, "step": 4184 }, { "epoch": 0.11, "learning_rate": 0.001964557188784458, "loss": 2.6661, "step": 4185 }, { "epoch": 0.11, "learning_rate": 0.0019645342177602772, "loss": 2.4719, "step": 4186 }, { "epoch": 0.11, "learning_rate": 0.0019645112394289575, "loss": 3.1081, "step": 4187 }, { "epoch": 0.11, "learning_rate": 0.0019644882537906733, "loss": 2.9516, "step": 4188 }, { "epoch": 0.11, "learning_rate": 0.0019644652608455985, "loss": 2.8148, "step": 4189 }, { "epoch": 0.11, "learning_rate": 0.001964442260593907, "loss": 2.3761, "step": 4190 }, { "epoch": 0.11, "learning_rate": 0.001964419253035774, "loss": 2.4583, "step": 4191 }, { "epoch": 0.11, "learning_rate": 0.0019643962381713726, "loss": 3.1486, "step": 4192 }, { "epoch": 0.11, "learning_rate": 0.001964373216000878, "loss": 2.7078, "step": 4193 }, { "epoch": 0.11, "learning_rate": 0.001964350186524464, "loss": 2.5118, "step": 4194 }, { "epoch": 0.11, "learning_rate": 0.0019643271497423054, "loss": 2.7434, "step": 4195 }, { "epoch": 0.11, "learning_rate": 0.0019643041056545776, "loss": 2.8594, "step": 4196 }, { "epoch": 0.11, "learning_rate": 0.0019642810542614534, "loss": 2.3508, "step": 4197 }, { "epoch": 0.11, "learning_rate": 0.001964257995563108, "loss": 2.8839, "step": 4198 }, { "epoch": 0.11, "learning_rate": 0.0019642349295597174, "loss": 2.7908, "step": 4199 }, { "epoch": 0.11, "learning_rate": 0.001964211856251455, "loss": 2.1436, "step": 4200 }, { "epoch": 0.11, "learning_rate": 0.001964188775638496, "loss": 2.6151, "step": 4201 }, { "epoch": 0.11, "learning_rate": 0.001964165687721015, "loss": 2.8163, "step": 4202 }, { "epoch": 0.11, "learning_rate": 0.001964142592499187, "loss": 2.6589, "step": 4203 }, { "epoch": 0.11, "learning_rate": 0.0019641194899731877, "loss": 2.9623, "step": 4204 }, { "epoch": 0.11, "learning_rate": 0.001964096380143191, "loss": 2.8005, "step": 4205 }, { "epoch": 0.11, "learning_rate": 0.0019640732630093727, "loss": 2.9565, "step": 4206 }, { "epoch": 0.11, "learning_rate": 0.0019640501385719076, "loss": 2.5764, "step": 4207 }, { "epoch": 0.11, "learning_rate": 0.0019640270068309713, "loss": 2.937, "step": 4208 }, { "epoch": 0.11, "learning_rate": 0.0019640038677867385, "loss": 2.8958, "step": 4209 }, { "epoch": 0.11, "learning_rate": 0.0019639807214393845, "loss": 2.5699, "step": 4210 }, { "epoch": 0.11, "learning_rate": 0.0019639575677890854, "loss": 2.8982, "step": 4211 }, { "epoch": 0.11, "learning_rate": 0.001963934406836016, "loss": 2.7548, "step": 4212 }, { "epoch": 0.11, "learning_rate": 0.0019639112385803513, "loss": 2.7532, "step": 4213 }, { "epoch": 0.11, "learning_rate": 0.0019638880630222684, "loss": 2.5152, "step": 4214 }, { "epoch": 0.11, "learning_rate": 0.001963864880161941, "loss": 2.7251, "step": 4215 }, { "epoch": 0.11, "learning_rate": 0.001963841689999546, "loss": 2.7402, "step": 4216 }, { "epoch": 0.11, "learning_rate": 0.0019638184925352587, "loss": 2.6398, "step": 4217 }, { "epoch": 0.11, "learning_rate": 0.0019637952877692546, "loss": 2.8674, "step": 4218 }, { "epoch": 0.11, "learning_rate": 0.0019637720757017096, "loss": 2.3474, "step": 4219 }, { "epoch": 0.11, "learning_rate": 0.0019637488563327998, "loss": 2.876, "step": 4220 }, { "epoch": 0.11, "learning_rate": 0.0019637256296627013, "loss": 2.5353, "step": 4221 }, { "epoch": 0.11, "learning_rate": 0.001963702395691589, "loss": 3.1591, "step": 4222 }, { "epoch": 0.11, "learning_rate": 0.00196367915441964, "loss": 2.98, "step": 4223 }, { "epoch": 0.11, "learning_rate": 0.0019636559058470305, "loss": 2.8976, "step": 4224 }, { "epoch": 0.11, "learning_rate": 0.0019636326499739357, "loss": 2.5541, "step": 4225 }, { "epoch": 0.11, "learning_rate": 0.001963609386800532, "loss": 2.6922, "step": 4226 }, { "epoch": 0.11, "learning_rate": 0.0019635861163269965, "loss": 2.8244, "step": 4227 }, { "epoch": 0.11, "learning_rate": 0.0019635628385535043, "loss": 2.4105, "step": 4228 }, { "epoch": 0.11, "learning_rate": 0.0019635395534802324, "loss": 2.4926, "step": 4229 }, { "epoch": 0.11, "learning_rate": 0.0019635162611073573, "loss": 2.684, "step": 4230 }, { "epoch": 0.11, "learning_rate": 0.001963492961435055, "loss": 2.5896, "step": 4231 }, { "epoch": 0.11, "learning_rate": 0.0019634696544635023, "loss": 2.454, "step": 4232 }, { "epoch": 0.11, "learning_rate": 0.001963446340192876, "loss": 2.4566, "step": 4233 }, { "epoch": 0.11, "learning_rate": 0.0019634230186233526, "loss": 2.5904, "step": 4234 }, { "epoch": 0.11, "learning_rate": 0.0019633996897551083, "loss": 2.4753, "step": 4235 }, { "epoch": 0.11, "learning_rate": 0.0019633763535883203, "loss": 2.7191, "step": 4236 }, { "epoch": 0.11, "learning_rate": 0.001963353010123165, "loss": 2.6396, "step": 4237 }, { "epoch": 0.11, "learning_rate": 0.00196332965935982, "loss": 2.6571, "step": 4238 }, { "epoch": 0.11, "learning_rate": 0.0019633063012984616, "loss": 2.6586, "step": 4239 }, { "epoch": 0.11, "learning_rate": 0.001963282935939267, "loss": 2.7018, "step": 4240 }, { "epoch": 0.11, "learning_rate": 0.0019632595632824127, "loss": 2.536, "step": 4241 }, { "epoch": 0.11, "learning_rate": 0.0019632361833280764, "loss": 2.989, "step": 4242 }, { "epoch": 0.11, "learning_rate": 0.001963212796076435, "loss": 2.1776, "step": 4243 }, { "epoch": 0.11, "learning_rate": 0.001963189401527666, "loss": 2.4818, "step": 4244 }, { "epoch": 0.11, "learning_rate": 0.001963165999681946, "loss": 2.6236, "step": 4245 }, { "epoch": 0.11, "learning_rate": 0.001963142590539452, "loss": 2.9525, "step": 4246 }, { "epoch": 0.11, "learning_rate": 0.0019631191741003623, "loss": 2.8462, "step": 4247 }, { "epoch": 0.11, "learning_rate": 0.0019630957503648542, "loss": 2.8422, "step": 4248 }, { "epoch": 0.11, "learning_rate": 0.001963072319333105, "loss": 2.6781, "step": 4249 }, { "epoch": 0.11, "learning_rate": 0.001963048881005292, "loss": 2.8217, "step": 4250 }, { "epoch": 0.11, "learning_rate": 0.0019630254353815925, "loss": 2.4502, "step": 4251 }, { "epoch": 0.11, "learning_rate": 0.0019630019824621848, "loss": 2.3763, "step": 4252 }, { "epoch": 0.11, "learning_rate": 0.001962978522247246, "loss": 2.7695, "step": 4253 }, { "epoch": 0.11, "learning_rate": 0.0019629550547369543, "loss": 2.5587, "step": 4254 }, { "epoch": 0.11, "learning_rate": 0.001962931579931487, "loss": 2.6622, "step": 4255 }, { "epoch": 0.11, "learning_rate": 0.0019629080978310226, "loss": 3.0832, "step": 4256 }, { "epoch": 0.11, "learning_rate": 0.0019628846084357382, "loss": 3.1432, "step": 4257 }, { "epoch": 0.11, "learning_rate": 0.0019628611117458125, "loss": 2.6281, "step": 4258 }, { "epoch": 0.11, "learning_rate": 0.0019628376077614226, "loss": 2.3697, "step": 4259 }, { "epoch": 0.11, "learning_rate": 0.001962814096482748, "loss": 2.73, "step": 4260 }, { "epoch": 0.11, "learning_rate": 0.0019627905779099654, "loss": 2.3287, "step": 4261 }, { "epoch": 0.11, "learning_rate": 0.001962767052043253, "loss": 2.6678, "step": 4262 }, { "epoch": 0.11, "learning_rate": 0.0019627435188827903, "loss": 3.0617, "step": 4263 }, { "epoch": 0.11, "learning_rate": 0.001962719978428755, "loss": 2.4467, "step": 4264 }, { "epoch": 0.11, "learning_rate": 0.0019626964306813247, "loss": 2.9967, "step": 4265 }, { "epoch": 0.11, "learning_rate": 0.001962672875640679, "loss": 2.9404, "step": 4266 }, { "epoch": 0.11, "learning_rate": 0.001962649313306995, "loss": 2.9689, "step": 4267 }, { "epoch": 0.11, "learning_rate": 0.001962625743680452, "loss": 2.5887, "step": 4268 }, { "epoch": 0.11, "learning_rate": 0.0019626021667612284, "loss": 2.9823, "step": 4269 }, { "epoch": 0.11, "learning_rate": 0.0019625785825495034, "loss": 2.6097, "step": 4270 }, { "epoch": 0.11, "learning_rate": 0.0019625549910454545, "loss": 2.8449, "step": 4271 }, { "epoch": 0.11, "learning_rate": 0.0019625313922492617, "loss": 2.6057, "step": 4272 }, { "epoch": 0.11, "learning_rate": 0.001962507786161103, "loss": 2.5274, "step": 4273 }, { "epoch": 0.11, "learning_rate": 0.001962484172781157, "loss": 2.8492, "step": 4274 }, { "epoch": 0.11, "learning_rate": 0.0019624605521096033, "loss": 2.7189, "step": 4275 }, { "epoch": 0.11, "learning_rate": 0.0019624369241466205, "loss": 2.7829, "step": 4276 }, { "epoch": 0.11, "learning_rate": 0.0019624132888923875, "loss": 2.9511, "step": 4277 }, { "epoch": 0.11, "learning_rate": 0.0019623896463470836, "loss": 2.4532, "step": 4278 }, { "epoch": 0.11, "learning_rate": 0.001962365996510888, "loss": 2.4413, "step": 4279 }, { "epoch": 0.12, "learning_rate": 0.00196234233938398, "loss": 2.3575, "step": 4280 }, { "epoch": 0.12, "learning_rate": 0.0019623186749665377, "loss": 2.9503, "step": 4281 }, { "epoch": 0.12, "learning_rate": 0.001962295003258741, "loss": 2.592, "step": 4282 }, { "epoch": 0.12, "learning_rate": 0.00196227132426077, "loss": 2.7608, "step": 4283 }, { "epoch": 0.12, "learning_rate": 0.0019622476379728034, "loss": 2.4965, "step": 4284 }, { "epoch": 0.12, "learning_rate": 0.001962223944395021, "loss": 2.772, "step": 4285 }, { "epoch": 0.12, "learning_rate": 0.001962200243527601, "loss": 2.6774, "step": 4286 }, { "epoch": 0.12, "learning_rate": 0.001962176535370725, "loss": 2.8057, "step": 4287 }, { "epoch": 0.12, "learning_rate": 0.001962152819924571, "loss": 2.5812, "step": 4288 }, { "epoch": 0.12, "learning_rate": 0.00196212909718932, "loss": 2.5492, "step": 4289 }, { "epoch": 0.12, "learning_rate": 0.0019621053671651503, "loss": 2.8408, "step": 4290 }, { "epoch": 0.12, "learning_rate": 0.0019620816298522425, "loss": 2.54, "step": 4291 }, { "epoch": 0.12, "learning_rate": 0.001962057885250776, "loss": 2.7411, "step": 4292 }, { "epoch": 0.12, "learning_rate": 0.0019620341333609313, "loss": 2.9417, "step": 4293 }, { "epoch": 0.12, "learning_rate": 0.001962010374182888, "loss": 2.8615, "step": 4294 }, { "epoch": 0.12, "learning_rate": 0.001961986607716826, "loss": 2.8751, "step": 4295 }, { "epoch": 0.12, "learning_rate": 0.0019619628339629254, "loss": 2.8717, "step": 4296 }, { "epoch": 0.12, "learning_rate": 0.0019619390529213667, "loss": 2.5552, "step": 4297 }, { "epoch": 0.12, "learning_rate": 0.0019619152645923292, "loss": 2.6226, "step": 4298 }, { "epoch": 0.12, "learning_rate": 0.0019618914689759942, "loss": 2.7661, "step": 4299 }, { "epoch": 0.12, "learning_rate": 0.001961867666072541, "loss": 2.766, "step": 4300 }, { "epoch": 0.12, "learning_rate": 0.0019618438558821503, "loss": 2.8414, "step": 4301 }, { "epoch": 0.12, "learning_rate": 0.0019618200384050027, "loss": 2.9436, "step": 4302 }, { "epoch": 0.12, "learning_rate": 0.0019617962136412783, "loss": 2.8295, "step": 4303 }, { "epoch": 0.12, "learning_rate": 0.0019617723815911576, "loss": 2.9537, "step": 4304 }, { "epoch": 0.12, "learning_rate": 0.0019617485422548215, "loss": 2.5746, "step": 4305 }, { "epoch": 0.12, "learning_rate": 0.0019617246956324507, "loss": 2.8062, "step": 4306 }, { "epoch": 0.12, "learning_rate": 0.001961700841724225, "loss": 2.5573, "step": 4307 }, { "epoch": 0.12, "learning_rate": 0.001961676980530326, "loss": 2.3861, "step": 4308 }, { "epoch": 0.12, "learning_rate": 0.001961653112050934, "loss": 2.7795, "step": 4309 }, { "epoch": 0.12, "learning_rate": 0.00196162923628623, "loss": 2.5114, "step": 4310 }, { "epoch": 0.12, "learning_rate": 0.001961605353236395, "loss": 2.8674, "step": 4311 }, { "epoch": 0.12, "learning_rate": 0.0019615814629016094, "loss": 2.6964, "step": 4312 }, { "epoch": 0.12, "learning_rate": 0.0019615575652820547, "loss": 2.3493, "step": 4313 }, { "epoch": 0.12, "learning_rate": 0.0019615336603779118, "loss": 2.9495, "step": 4314 }, { "epoch": 0.12, "learning_rate": 0.0019615097481893618, "loss": 2.6834, "step": 4315 }, { "epoch": 0.12, "learning_rate": 0.0019614858287165856, "loss": 2.6131, "step": 4316 }, { "epoch": 0.12, "learning_rate": 0.001961461901959765, "loss": 2.4394, "step": 4317 }, { "epoch": 0.12, "learning_rate": 0.001961437967919081, "loss": 2.5631, "step": 4318 }, { "epoch": 0.12, "learning_rate": 0.0019614140265947146, "loss": 3.3189, "step": 4319 }, { "epoch": 0.12, "learning_rate": 0.0019613900779868474, "loss": 2.7275, "step": 4320 }, { "epoch": 0.12, "learning_rate": 0.0019613661220956612, "loss": 2.648, "step": 4321 }, { "epoch": 0.12, "learning_rate": 0.0019613421589213366, "loss": 2.6632, "step": 4322 }, { "epoch": 0.12, "learning_rate": 0.001961318188464056, "loss": 2.9236, "step": 4323 }, { "epoch": 0.12, "learning_rate": 0.001961294210724001, "loss": 2.9416, "step": 4324 }, { "epoch": 0.12, "learning_rate": 0.0019612702257013523, "loss": 2.7569, "step": 4325 }, { "epoch": 0.12, "learning_rate": 0.0019612462333962926, "loss": 2.5865, "step": 4326 }, { "epoch": 0.12, "learning_rate": 0.0019612222338090033, "loss": 2.6495, "step": 4327 }, { "epoch": 0.12, "learning_rate": 0.0019611982269396658, "loss": 2.8052, "step": 4328 }, { "epoch": 0.12, "learning_rate": 0.0019611742127884626, "loss": 2.9228, "step": 4329 }, { "epoch": 0.12, "learning_rate": 0.0019611501913555755, "loss": 2.7729, "step": 4330 }, { "epoch": 0.12, "learning_rate": 0.0019611261626411866, "loss": 2.7889, "step": 4331 }, { "epoch": 0.12, "learning_rate": 0.0019611021266454772, "loss": 2.8885, "step": 4332 }, { "epoch": 0.12, "learning_rate": 0.0019610780833686304, "loss": 2.6265, "step": 4333 }, { "epoch": 0.12, "learning_rate": 0.0019610540328108277, "loss": 2.6309, "step": 4334 }, { "epoch": 0.12, "learning_rate": 0.0019610299749722514, "loss": 2.5749, "step": 4335 }, { "epoch": 0.12, "learning_rate": 0.0019610059098530835, "loss": 2.4863, "step": 4336 }, { "epoch": 0.12, "learning_rate": 0.0019609818374535072, "loss": 3.0312, "step": 4337 }, { "epoch": 0.12, "learning_rate": 0.001960957757773704, "loss": 2.9231, "step": 4338 }, { "epoch": 0.12, "learning_rate": 0.001960933670813857, "loss": 2.9009, "step": 4339 }, { "epoch": 0.12, "learning_rate": 0.001960909576574148, "loss": 2.7489, "step": 4340 }, { "epoch": 0.12, "learning_rate": 0.0019608854750547597, "loss": 3.0316, "step": 4341 }, { "epoch": 0.12, "learning_rate": 0.001960861366255875, "loss": 2.5119, "step": 4342 }, { "epoch": 0.12, "learning_rate": 0.0019608372501776767, "loss": 2.7214, "step": 4343 }, { "epoch": 0.12, "learning_rate": 0.001960813126820347, "loss": 2.5092, "step": 4344 }, { "epoch": 0.12, "learning_rate": 0.001960788996184068, "loss": 2.7348, "step": 4345 }, { "epoch": 0.12, "learning_rate": 0.0019607648582690247, "loss": 2.7217, "step": 4346 }, { "epoch": 0.12, "learning_rate": 0.0019607407130753977, "loss": 2.5477, "step": 4347 }, { "epoch": 0.12, "learning_rate": 0.001960716560603371, "loss": 3.0212, "step": 4348 }, { "epoch": 0.12, "learning_rate": 0.0019606924008531276, "loss": 2.589, "step": 4349 }, { "epoch": 0.12, "learning_rate": 0.00196066823382485, "loss": 2.7681, "step": 4350 }, { "epoch": 0.12, "learning_rate": 0.0019606440595187217, "loss": 2.9894, "step": 4351 }, { "epoch": 0.12, "learning_rate": 0.001960619877934926, "loss": 2.5042, "step": 4352 }, { "epoch": 0.12, "learning_rate": 0.0019605956890736457, "loss": 2.5798, "step": 4353 }, { "epoch": 0.12, "learning_rate": 0.0019605714929350642, "loss": 2.8058, "step": 4354 }, { "epoch": 0.12, "learning_rate": 0.0019605472895193646, "loss": 3.1888, "step": 4355 }, { "epoch": 0.12, "learning_rate": 0.0019605230788267308, "loss": 2.6818, "step": 4356 }, { "epoch": 0.12, "learning_rate": 0.0019604988608573457, "loss": 2.6435, "step": 4357 }, { "epoch": 0.12, "learning_rate": 0.0019604746356113928, "loss": 2.9145, "step": 4358 }, { "epoch": 0.12, "learning_rate": 0.0019604504030890564, "loss": 2.713, "step": 4359 }, { "epoch": 0.12, "learning_rate": 0.001960426163290519, "loss": 2.5255, "step": 4360 }, { "epoch": 0.12, "learning_rate": 0.0019604019162159647, "loss": 2.976, "step": 4361 }, { "epoch": 0.12, "learning_rate": 0.001960377661865577, "loss": 2.3282, "step": 4362 }, { "epoch": 0.12, "learning_rate": 0.00196035340023954, "loss": 2.5889, "step": 4363 }, { "epoch": 0.12, "learning_rate": 0.0019603291313380375, "loss": 2.7445, "step": 4364 }, { "epoch": 0.12, "learning_rate": 0.001960304855161253, "loss": 2.4252, "step": 4365 }, { "epoch": 0.12, "learning_rate": 0.0019602805717093704, "loss": 2.5078, "step": 4366 }, { "epoch": 0.12, "learning_rate": 0.0019602562809825745, "loss": 2.3752, "step": 4367 }, { "epoch": 0.12, "learning_rate": 0.0019602319829810483, "loss": 2.4682, "step": 4368 }, { "epoch": 0.12, "learning_rate": 0.001960207677704976, "loss": 2.6658, "step": 4369 }, { "epoch": 0.12, "learning_rate": 0.0019601833651545423, "loss": 2.7614, "step": 4370 }, { "epoch": 0.12, "learning_rate": 0.0019601590453299316, "loss": 2.5818, "step": 4371 }, { "epoch": 0.12, "learning_rate": 0.001960134718231327, "loss": 3.0145, "step": 4372 }, { "epoch": 0.12, "learning_rate": 0.0019601103838589136, "loss": 2.7481, "step": 4373 }, { "epoch": 0.12, "learning_rate": 0.0019600860422128753, "loss": 2.3915, "step": 4374 }, { "epoch": 0.12, "learning_rate": 0.001960061693293397, "loss": 2.1999, "step": 4375 }, { "epoch": 0.12, "learning_rate": 0.001960037337100663, "loss": 2.5931, "step": 4376 }, { "epoch": 0.12, "learning_rate": 0.0019600129736348578, "loss": 2.5259, "step": 4377 }, { "epoch": 0.12, "learning_rate": 0.001959988602896166, "loss": 2.3547, "step": 4378 }, { "epoch": 0.12, "learning_rate": 0.001959964224884772, "loss": 2.6907, "step": 4379 }, { "epoch": 0.12, "learning_rate": 0.0019599398396008606, "loss": 2.5007, "step": 4380 }, { "epoch": 0.12, "learning_rate": 0.001959915447044617, "loss": 2.93, "step": 4381 }, { "epoch": 0.12, "learning_rate": 0.001959891047216225, "loss": 2.3003, "step": 4382 }, { "epoch": 0.12, "learning_rate": 0.0019598666401158702, "loss": 2.6156, "step": 4383 }, { "epoch": 0.12, "learning_rate": 0.0019598422257437378, "loss": 2.8369, "step": 4384 }, { "epoch": 0.12, "learning_rate": 0.0019598178041000123, "loss": 3.0919, "step": 4385 }, { "epoch": 0.12, "learning_rate": 0.0019597933751848784, "loss": 3.1693, "step": 4386 }, { "epoch": 0.12, "learning_rate": 0.001959768938998521, "loss": 2.9094, "step": 4387 }, { "epoch": 0.12, "learning_rate": 0.0019597444955411266, "loss": 2.4152, "step": 4388 }, { "epoch": 0.12, "learning_rate": 0.001959720044812879, "loss": 2.5906, "step": 4389 }, { "epoch": 0.12, "learning_rate": 0.001959695586813964, "loss": 2.5266, "step": 4390 }, { "epoch": 0.12, "learning_rate": 0.001959671121544567, "loss": 3.0207, "step": 4391 }, { "epoch": 0.12, "learning_rate": 0.0019596466490048726, "loss": 2.9768, "step": 4392 }, { "epoch": 0.12, "learning_rate": 0.0019596221691950675, "loss": 2.2865, "step": 4393 }, { "epoch": 0.12, "learning_rate": 0.001959597682115336, "loss": 2.6927, "step": 4394 }, { "epoch": 0.12, "learning_rate": 0.001959573187765864, "loss": 2.3247, "step": 4395 }, { "epoch": 0.12, "learning_rate": 0.001959548686146837, "loss": 3.1246, "step": 4396 }, { "epoch": 0.12, "learning_rate": 0.0019595241772584412, "loss": 2.8596, "step": 4397 }, { "epoch": 0.12, "learning_rate": 0.0019594996611008615, "loss": 2.6067, "step": 4398 }, { "epoch": 0.12, "learning_rate": 0.0019594751376742835, "loss": 2.5336, "step": 4399 }, { "epoch": 0.12, "learning_rate": 0.001959450606978894, "loss": 2.2026, "step": 4400 }, { "epoch": 0.12, "learning_rate": 0.001959426069014878, "loss": 2.5432, "step": 4401 }, { "epoch": 0.12, "learning_rate": 0.0019594015237824215, "loss": 2.6544, "step": 4402 }, { "epoch": 0.12, "learning_rate": 0.001959376971281711, "loss": 2.8709, "step": 4403 }, { "epoch": 0.12, "learning_rate": 0.0019593524115129315, "loss": 2.5829, "step": 4404 }, { "epoch": 0.12, "learning_rate": 0.00195932784447627, "loss": 2.5448, "step": 4405 }, { "epoch": 0.12, "learning_rate": 0.001959303270171912, "loss": 2.8083, "step": 4406 }, { "epoch": 0.12, "learning_rate": 0.0019592786886000442, "loss": 2.4755, "step": 4407 }, { "epoch": 0.12, "learning_rate": 0.0019592540997608525, "loss": 2.6692, "step": 4408 }, { "epoch": 0.12, "learning_rate": 0.0019592295036545233, "loss": 2.876, "step": 4409 }, { "epoch": 0.12, "learning_rate": 0.0019592049002812428, "loss": 2.9285, "step": 4410 }, { "epoch": 0.12, "learning_rate": 0.0019591802896411978, "loss": 3.1933, "step": 4411 }, { "epoch": 0.12, "learning_rate": 0.001959155671734574, "loss": 2.4912, "step": 4412 }, { "epoch": 0.12, "learning_rate": 0.0019591310465615582, "loss": 2.3865, "step": 4413 }, { "epoch": 0.12, "learning_rate": 0.001959106414122337, "loss": 2.8129, "step": 4414 }, { "epoch": 0.12, "learning_rate": 0.0019590817744170974, "loss": 2.8329, "step": 4415 }, { "epoch": 0.12, "learning_rate": 0.0019590571274460257, "loss": 2.6595, "step": 4416 }, { "epoch": 0.12, "learning_rate": 0.001959032473209309, "loss": 2.8706, "step": 4417 }, { "epoch": 0.12, "learning_rate": 0.0019590078117071334, "loss": 2.1057, "step": 4418 }, { "epoch": 0.12, "learning_rate": 0.0019589831429396858, "loss": 2.2082, "step": 4419 }, { "epoch": 0.12, "learning_rate": 0.001958958466907154, "loss": 2.6683, "step": 4420 }, { "epoch": 0.12, "learning_rate": 0.0019589337836097235, "loss": 2.7957, "step": 4421 }, { "epoch": 0.12, "learning_rate": 0.0019589090930475827, "loss": 3.0626, "step": 4422 }, { "epoch": 0.12, "learning_rate": 0.0019588843952209178, "loss": 2.3542, "step": 4423 }, { "epoch": 0.12, "learning_rate": 0.001958859690129916, "loss": 2.6319, "step": 4424 }, { "epoch": 0.12, "learning_rate": 0.0019588349777747652, "loss": 2.7558, "step": 4425 }, { "epoch": 0.12, "learning_rate": 0.0019588102581556514, "loss": 2.7705, "step": 4426 }, { "epoch": 0.12, "learning_rate": 0.001958785531272763, "loss": 2.9525, "step": 4427 }, { "epoch": 0.12, "learning_rate": 0.0019587607971262868, "loss": 2.583, "step": 4428 }, { "epoch": 0.12, "learning_rate": 0.0019587360557164098, "loss": 3.3043, "step": 4429 }, { "epoch": 0.12, "learning_rate": 0.0019587113070433197, "loss": 2.8008, "step": 4430 }, { "epoch": 0.12, "learning_rate": 0.001958686551107205, "loss": 2.3254, "step": 4431 }, { "epoch": 0.12, "learning_rate": 0.0019586617879082517, "loss": 2.7097, "step": 4432 }, { "epoch": 0.12, "learning_rate": 0.0019586370174466483, "loss": 3.2084, "step": 4433 }, { "epoch": 0.12, "learning_rate": 0.0019586122397225823, "loss": 2.819, "step": 4434 }, { "epoch": 0.12, "learning_rate": 0.001958587454736241, "loss": 2.6211, "step": 4435 }, { "epoch": 0.12, "learning_rate": 0.001958562662487813, "loss": 2.7632, "step": 4436 }, { "epoch": 0.12, "learning_rate": 0.0019585378629774853, "loss": 2.1362, "step": 4437 }, { "epoch": 0.12, "learning_rate": 0.0019585130562054464, "loss": 2.5242, "step": 4438 }, { "epoch": 0.12, "learning_rate": 0.0019584882421718837, "loss": 3.0174, "step": 4439 }, { "epoch": 0.12, "learning_rate": 0.0019584634208769857, "loss": 2.506, "step": 4440 }, { "epoch": 0.12, "learning_rate": 0.00195843859232094, "loss": 2.8356, "step": 4441 }, { "epoch": 0.12, "learning_rate": 0.001958413756503935, "loss": 2.5611, "step": 4442 }, { "epoch": 0.12, "learning_rate": 0.0019583889134261586, "loss": 2.4848, "step": 4443 }, { "epoch": 0.12, "learning_rate": 0.001958364063087799, "loss": 2.7783, "step": 4444 }, { "epoch": 0.12, "learning_rate": 0.001958339205489045, "loss": 2.8138, "step": 4445 }, { "epoch": 0.12, "learning_rate": 0.001958314340630084, "loss": 2.757, "step": 4446 }, { "epoch": 0.12, "learning_rate": 0.001958289468511105, "loss": 2.7295, "step": 4447 }, { "epoch": 0.12, "learning_rate": 0.0019582645891322967, "loss": 2.7552, "step": 4448 }, { "epoch": 0.12, "learning_rate": 0.001958239702493847, "loss": 2.3471, "step": 4449 }, { "epoch": 0.12, "learning_rate": 0.0019582148085959448, "loss": 2.7169, "step": 4450 }, { "epoch": 0.12, "learning_rate": 0.001958189907438778, "loss": 2.6297, "step": 4451 }, { "epoch": 0.12, "learning_rate": 0.0019581649990225362, "loss": 2.7465, "step": 4452 }, { "epoch": 0.12, "learning_rate": 0.0019581400833474072, "loss": 3.0916, "step": 4453 }, { "epoch": 0.12, "learning_rate": 0.001958115160413581, "loss": 2.6797, "step": 4454 }, { "epoch": 0.12, "learning_rate": 0.0019580902302212453, "loss": 2.6317, "step": 4455 }, { "epoch": 0.12, "learning_rate": 0.001958065292770589, "loss": 2.5505, "step": 4456 }, { "epoch": 0.12, "learning_rate": 0.0019580403480618015, "loss": 2.4277, "step": 4457 }, { "epoch": 0.12, "learning_rate": 0.001958015396095072, "loss": 2.5946, "step": 4458 }, { "epoch": 0.12, "learning_rate": 0.001957990436870589, "loss": 2.4649, "step": 4459 }, { "epoch": 0.12, "learning_rate": 0.0019579654703885414, "loss": 2.4527, "step": 4460 }, { "epoch": 0.12, "learning_rate": 0.0019579404966491186, "loss": 3.0253, "step": 4461 }, { "epoch": 0.12, "learning_rate": 0.00195791551565251, "loss": 2.6039, "step": 4462 }, { "epoch": 0.12, "learning_rate": 0.001957890527398905, "loss": 2.6641, "step": 4463 }, { "epoch": 0.12, "learning_rate": 0.0019578655318884925, "loss": 2.5413, "step": 4464 }, { "epoch": 0.12, "learning_rate": 0.0019578405291214617, "loss": 2.6978, "step": 4465 }, { "epoch": 0.12, "learning_rate": 0.0019578155190980023, "loss": 2.901, "step": 4466 }, { "epoch": 0.12, "learning_rate": 0.0019577905018183044, "loss": 2.6404, "step": 4467 }, { "epoch": 0.12, "learning_rate": 0.001957765477282556, "loss": 2.7282, "step": 4468 }, { "epoch": 0.12, "learning_rate": 0.0019577404454909483, "loss": 2.6658, "step": 4469 }, { "epoch": 0.12, "learning_rate": 0.0019577154064436696, "loss": 2.9452, "step": 4470 }, { "epoch": 0.12, "learning_rate": 0.001957690360140911, "loss": 2.5691, "step": 4471 }, { "epoch": 0.12, "learning_rate": 0.001957665306582861, "loss": 2.6941, "step": 4472 }, { "epoch": 0.12, "learning_rate": 0.0019576402457697093, "loss": 2.5933, "step": 4473 }, { "epoch": 0.12, "learning_rate": 0.001957615177701647, "loss": 2.5771, "step": 4474 }, { "epoch": 0.12, "learning_rate": 0.0019575901023788636, "loss": 2.6106, "step": 4475 }, { "epoch": 0.12, "learning_rate": 0.001957565019801548, "loss": 2.8445, "step": 4476 }, { "epoch": 0.12, "learning_rate": 0.0019575399299698914, "loss": 3.251, "step": 4477 }, { "epoch": 0.12, "learning_rate": 0.0019575148328840834, "loss": 2.6308, "step": 4478 }, { "epoch": 0.12, "learning_rate": 0.0019574897285443145, "loss": 2.6081, "step": 4479 }, { "epoch": 0.12, "learning_rate": 0.0019574646169507742, "loss": 2.749, "step": 4480 }, { "epoch": 0.12, "learning_rate": 0.001957439498103653, "loss": 2.4567, "step": 4481 }, { "epoch": 0.12, "learning_rate": 0.001957414372003142, "loss": 2.5997, "step": 4482 }, { "epoch": 0.12, "learning_rate": 0.0019573892386494304, "loss": 2.9826, "step": 4483 }, { "epoch": 0.12, "learning_rate": 0.001957364098042709, "loss": 2.4257, "step": 4484 }, { "epoch": 0.12, "learning_rate": 0.0019573389501831686, "loss": 2.8925, "step": 4485 }, { "epoch": 0.12, "learning_rate": 0.0019573137950709995, "loss": 2.5507, "step": 4486 }, { "epoch": 0.12, "learning_rate": 0.0019572886327063922, "loss": 2.5252, "step": 4487 }, { "epoch": 0.12, "learning_rate": 0.0019572634630895375, "loss": 2.3379, "step": 4488 }, { "epoch": 0.12, "learning_rate": 0.001957238286220626, "loss": 2.8451, "step": 4489 }, { "epoch": 0.12, "learning_rate": 0.001957213102099848, "loss": 2.5356, "step": 4490 }, { "epoch": 0.12, "learning_rate": 0.0019571879107273945, "loss": 2.6504, "step": 4491 }, { "epoch": 0.12, "learning_rate": 0.001957162712103457, "loss": 2.7087, "step": 4492 }, { "epoch": 0.12, "learning_rate": 0.001957137506228226, "loss": 2.65, "step": 4493 }, { "epoch": 0.12, "learning_rate": 0.0019571122931018917, "loss": 2.5557, "step": 4494 }, { "epoch": 0.12, "learning_rate": 0.0019570870727246463, "loss": 2.5142, "step": 4495 }, { "epoch": 0.12, "learning_rate": 0.0019570618450966805, "loss": 2.5621, "step": 4496 }, { "epoch": 0.12, "learning_rate": 0.001957036610218185, "loss": 2.4533, "step": 4497 }, { "epoch": 0.12, "learning_rate": 0.001957011368089351, "loss": 2.3463, "step": 4498 }, { "epoch": 0.12, "learning_rate": 0.0019569861187103705, "loss": 2.6571, "step": 4499 }, { "epoch": 0.12, "learning_rate": 0.0019569608620814342, "loss": 2.3965, "step": 4500 }, { "epoch": 0.12, "learning_rate": 0.0019569355982027334, "loss": 2.2745, "step": 4501 }, { "epoch": 0.12, "learning_rate": 0.001956910327074459, "loss": 2.787, "step": 4502 }, { "epoch": 0.12, "learning_rate": 0.0019568850486968038, "loss": 2.9478, "step": 4503 }, { "epoch": 0.12, "learning_rate": 0.0019568597630699584, "loss": 2.9844, "step": 4504 }, { "epoch": 0.12, "learning_rate": 0.0019568344701941143, "loss": 3.1199, "step": 4505 }, { "epoch": 0.12, "learning_rate": 0.0019568091700694636, "loss": 2.8546, "step": 4506 }, { "epoch": 0.12, "learning_rate": 0.001956783862696197, "loss": 2.5767, "step": 4507 }, { "epoch": 0.12, "learning_rate": 0.001956758548074508, "loss": 2.6063, "step": 4508 }, { "epoch": 0.12, "learning_rate": 0.0019567332262045863, "loss": 2.7996, "step": 4509 }, { "epoch": 0.12, "learning_rate": 0.0019567078970866253, "loss": 2.8694, "step": 4510 }, { "epoch": 0.12, "learning_rate": 0.001956682560720816, "loss": 2.8803, "step": 4511 }, { "epoch": 0.12, "learning_rate": 0.0019566572171073513, "loss": 2.4207, "step": 4512 }, { "epoch": 0.12, "learning_rate": 0.0019566318662464217, "loss": 2.8056, "step": 4513 }, { "epoch": 0.12, "learning_rate": 0.0019566065081382204, "loss": 2.6593, "step": 4514 }, { "epoch": 0.12, "learning_rate": 0.0019565811427829393, "loss": 2.7768, "step": 4515 }, { "epoch": 0.12, "learning_rate": 0.0019565557701807707, "loss": 2.9821, "step": 4516 }, { "epoch": 0.12, "learning_rate": 0.0019565303903319063, "loss": 2.2969, "step": 4517 }, { "epoch": 0.12, "learning_rate": 0.001956505003236539, "loss": 2.5219, "step": 4518 }, { "epoch": 0.12, "learning_rate": 0.00195647960889486, "loss": 2.6783, "step": 4519 }, { "epoch": 0.12, "learning_rate": 0.0019564542073070633, "loss": 2.9035, "step": 4520 }, { "epoch": 0.12, "learning_rate": 0.00195642879847334, "loss": 2.693, "step": 4521 }, { "epoch": 0.12, "learning_rate": 0.0019564033823938837, "loss": 2.0036, "step": 4522 }, { "epoch": 0.12, "learning_rate": 0.001956377959068886, "loss": 2.6736, "step": 4523 }, { "epoch": 0.12, "learning_rate": 0.00195635252849854, "loss": 3.0554, "step": 4524 }, { "epoch": 0.12, "learning_rate": 0.0019563270906830382, "loss": 2.8747, "step": 4525 }, { "epoch": 0.12, "learning_rate": 0.0019563016456225733, "loss": 2.7263, "step": 4526 }, { "epoch": 0.12, "learning_rate": 0.001956276193317338, "loss": 2.7823, "step": 4527 }, { "epoch": 0.12, "learning_rate": 0.001956250733767525, "loss": 2.6779, "step": 4528 }, { "epoch": 0.12, "learning_rate": 0.0019562252669733282, "loss": 2.6094, "step": 4529 }, { "epoch": 0.12, "learning_rate": 0.001956199792934939, "loss": 2.3024, "step": 4530 }, { "epoch": 0.12, "learning_rate": 0.0019561743116525516, "loss": 2.8493, "step": 4531 }, { "epoch": 0.12, "learning_rate": 0.0019561488231263583, "loss": 2.669, "step": 4532 }, { "epoch": 0.12, "learning_rate": 0.0019561233273565526, "loss": 2.3894, "step": 4533 }, { "epoch": 0.12, "learning_rate": 0.001956097824343327, "loss": 2.7255, "step": 4534 }, { "epoch": 0.12, "learning_rate": 0.001956072314086876, "loss": 3.1114, "step": 4535 }, { "epoch": 0.12, "learning_rate": 0.0019560467965873914, "loss": 3.0278, "step": 4536 }, { "epoch": 0.12, "learning_rate": 0.001956021271845068, "loss": 2.8573, "step": 4537 }, { "epoch": 0.12, "learning_rate": 0.0019559957398600975, "loss": 3.011, "step": 4538 }, { "epoch": 0.12, "learning_rate": 0.0019559702006326746, "loss": 2.4712, "step": 4539 }, { "epoch": 0.12, "learning_rate": 0.0019559446541629923, "loss": 2.5394, "step": 4540 }, { "epoch": 0.12, "learning_rate": 0.001955919100451244, "loss": 2.863, "step": 4541 }, { "epoch": 0.12, "learning_rate": 0.001955893539497624, "loss": 2.8752, "step": 4542 }, { "epoch": 0.12, "learning_rate": 0.001955867971302325, "loss": 2.8794, "step": 4543 }, { "epoch": 0.12, "learning_rate": 0.0019558423958655415, "loss": 2.6751, "step": 4544 }, { "epoch": 0.12, "learning_rate": 0.0019558168131874666, "loss": 2.6514, "step": 4545 }, { "epoch": 0.12, "learning_rate": 0.0019557912232682946, "loss": 2.2903, "step": 4546 }, { "epoch": 0.12, "learning_rate": 0.001955765626108219, "loss": 2.9123, "step": 4547 }, { "epoch": 0.12, "learning_rate": 0.001955740021707434, "loss": 2.6201, "step": 4548 }, { "epoch": 0.12, "learning_rate": 0.0019557144100661333, "loss": 2.5804, "step": 4549 }, { "epoch": 0.12, "learning_rate": 0.0019556887911845113, "loss": 2.4224, "step": 4550 }, { "epoch": 0.12, "learning_rate": 0.001955663165062762, "loss": 2.7813, "step": 4551 }, { "epoch": 0.12, "learning_rate": 0.001955637531701079, "loss": 2.1946, "step": 4552 }, { "epoch": 0.12, "learning_rate": 0.001955611891099657, "loss": 2.5597, "step": 4553 }, { "epoch": 0.12, "learning_rate": 0.0019555862432586906, "loss": 3.0252, "step": 4554 }, { "epoch": 0.12, "learning_rate": 0.0019555605881783735, "loss": 2.5527, "step": 4555 }, { "epoch": 0.12, "learning_rate": 0.0019555349258589, "loss": 2.9911, "step": 4556 }, { "epoch": 0.12, "learning_rate": 0.0019555092563004646, "loss": 2.9184, "step": 4557 }, { "epoch": 0.12, "learning_rate": 0.0019554835795032623, "loss": 2.5481, "step": 4558 }, { "epoch": 0.12, "learning_rate": 0.001955457895467487, "loss": 2.6782, "step": 4559 }, { "epoch": 0.12, "learning_rate": 0.0019554322041933333, "loss": 2.63, "step": 4560 }, { "epoch": 0.12, "learning_rate": 0.0019554065056809965, "loss": 2.9103, "step": 4561 }, { "epoch": 0.12, "learning_rate": 0.0019553807999306704, "loss": 2.4937, "step": 4562 }, { "epoch": 0.12, "learning_rate": 0.0019553550869425506, "loss": 2.5365, "step": 4563 }, { "epoch": 0.12, "learning_rate": 0.0019553293667168314, "loss": 2.7594, "step": 4564 }, { "epoch": 0.12, "learning_rate": 0.0019553036392537075, "loss": 2.6705, "step": 4565 }, { "epoch": 0.12, "learning_rate": 0.001955277904553374, "loss": 3.0914, "step": 4566 }, { "epoch": 0.12, "learning_rate": 0.001955252162616026, "loss": 2.7969, "step": 4567 }, { "epoch": 0.12, "learning_rate": 0.0019552264134418585, "loss": 2.637, "step": 4568 }, { "epoch": 0.12, "learning_rate": 0.001955200657031066, "loss": 2.6397, "step": 4569 }, { "epoch": 0.12, "learning_rate": 0.001955174893383845, "loss": 2.737, "step": 4570 }, { "epoch": 0.12, "learning_rate": 0.001955149122500389, "loss": 2.7418, "step": 4571 }, { "epoch": 0.12, "learning_rate": 0.001955123344380894, "loss": 2.8079, "step": 4572 }, { "epoch": 0.12, "learning_rate": 0.0019550975590255557, "loss": 2.639, "step": 4573 }, { "epoch": 0.12, "learning_rate": 0.0019550717664345687, "loss": 2.4358, "step": 4574 }, { "epoch": 0.12, "learning_rate": 0.001955045966608129, "loss": 2.7918, "step": 4575 }, { "epoch": 0.12, "learning_rate": 0.001955020159546432, "loss": 3.1939, "step": 4576 }, { "epoch": 0.12, "learning_rate": 0.0019549943452496724, "loss": 2.9212, "step": 4577 }, { "epoch": 0.12, "learning_rate": 0.001954968523718047, "loss": 2.6598, "step": 4578 }, { "epoch": 0.12, "learning_rate": 0.0019549426949517505, "loss": 2.7722, "step": 4579 }, { "epoch": 0.12, "learning_rate": 0.0019549168589509786, "loss": 2.872, "step": 4580 }, { "epoch": 0.12, "learning_rate": 0.0019548910157159275, "loss": 2.6648, "step": 4581 }, { "epoch": 0.12, "learning_rate": 0.001954865165246793, "loss": 2.5808, "step": 4582 }, { "epoch": 0.12, "learning_rate": 0.0019548393075437707, "loss": 2.5159, "step": 4583 }, { "epoch": 0.12, "learning_rate": 0.001954813442607056, "loss": 2.7205, "step": 4584 }, { "epoch": 0.12, "learning_rate": 0.001954787570436846, "loss": 2.4704, "step": 4585 }, { "epoch": 0.12, "learning_rate": 0.0019547616910333358, "loss": 2.3729, "step": 4586 }, { "epoch": 0.12, "learning_rate": 0.001954735804396722, "loss": 2.912, "step": 4587 }, { "epoch": 0.12, "learning_rate": 0.0019547099105272003, "loss": 2.7632, "step": 4588 }, { "epoch": 0.12, "learning_rate": 0.001954684009424967, "loss": 2.4683, "step": 4589 }, { "epoch": 0.12, "learning_rate": 0.001954658101090218, "loss": 2.8269, "step": 4590 }, { "epoch": 0.12, "learning_rate": 0.0019546321855231498, "loss": 2.4577, "step": 4591 }, { "epoch": 0.12, "learning_rate": 0.0019546062627239596, "loss": 2.5112, "step": 4592 }, { "epoch": 0.12, "learning_rate": 0.0019545803326928425, "loss": 2.9109, "step": 4593 }, { "epoch": 0.12, "learning_rate": 0.0019545543954299954, "loss": 2.6763, "step": 4594 }, { "epoch": 0.12, "learning_rate": 0.001954528450935615, "loss": 3.0948, "step": 4595 }, { "epoch": 0.12, "learning_rate": 0.0019545024992098977, "loss": 2.8499, "step": 4596 }, { "epoch": 0.12, "learning_rate": 0.0019544765402530404, "loss": 2.9802, "step": 4597 }, { "epoch": 0.12, "learning_rate": 0.001954450574065239, "loss": 2.5788, "step": 4598 }, { "epoch": 0.12, "learning_rate": 0.001954424600646691, "loss": 2.4295, "step": 4599 }, { "epoch": 0.12, "learning_rate": 0.0019543986199975927, "loss": 2.7152, "step": 4600 }, { "epoch": 0.12, "learning_rate": 0.001954372632118141, "loss": 2.5478, "step": 4601 }, { "epoch": 0.12, "learning_rate": 0.001954346637008533, "loss": 2.4898, "step": 4602 }, { "epoch": 0.12, "learning_rate": 0.0019543206346689657, "loss": 2.7864, "step": 4603 }, { "epoch": 0.12, "learning_rate": 0.0019542946250996358, "loss": 2.5155, "step": 4604 }, { "epoch": 0.12, "learning_rate": 0.00195426860830074, "loss": 2.6522, "step": 4605 }, { "epoch": 0.12, "learning_rate": 0.0019542425842724765, "loss": 2.7745, "step": 4606 }, { "epoch": 0.12, "learning_rate": 0.0019542165530150413, "loss": 3.0812, "step": 4607 }, { "epoch": 0.12, "learning_rate": 0.001954190514528632, "loss": 2.8813, "step": 4608 }, { "epoch": 0.12, "learning_rate": 0.0019541644688134464, "loss": 2.7722, "step": 4609 }, { "epoch": 0.12, "learning_rate": 0.001954138415869681, "loss": 2.9139, "step": 4610 }, { "epoch": 0.12, "learning_rate": 0.001954112355697534, "loss": 2.8379, "step": 4611 }, { "epoch": 0.12, "learning_rate": 0.001954086288297202, "loss": 3.0131, "step": 4612 }, { "epoch": 0.12, "learning_rate": 0.0019540602136688826, "loss": 3.1686, "step": 4613 }, { "epoch": 0.12, "learning_rate": 0.001954034131812774, "loss": 2.478, "step": 4614 }, { "epoch": 0.12, "learning_rate": 0.0019540080427290735, "loss": 2.8458, "step": 4615 }, { "epoch": 0.12, "learning_rate": 0.0019539819464179783, "loss": 2.6338, "step": 4616 }, { "epoch": 0.12, "learning_rate": 0.0019539558428796865, "loss": 2.8023, "step": 4617 }, { "epoch": 0.12, "learning_rate": 0.0019539297321143957, "loss": 2.6821, "step": 4618 }, { "epoch": 0.12, "learning_rate": 0.001953903614122304, "loss": 2.8128, "step": 4619 }, { "epoch": 0.12, "learning_rate": 0.001953877488903609, "loss": 2.3583, "step": 4620 }, { "epoch": 0.12, "learning_rate": 0.001953851356458509, "loss": 2.8573, "step": 4621 }, { "epoch": 0.12, "learning_rate": 0.0019538252167872012, "loss": 2.4413, "step": 4622 }, { "epoch": 0.12, "learning_rate": 0.0019537990698898842, "loss": 2.7509, "step": 4623 }, { "epoch": 0.12, "learning_rate": 0.001953772915766756, "loss": 2.9212, "step": 4624 }, { "epoch": 0.12, "learning_rate": 0.001953746754418015, "loss": 3.4121, "step": 4625 }, { "epoch": 0.12, "learning_rate": 0.0019537205858438586, "loss": 2.6834, "step": 4626 }, { "epoch": 0.12, "learning_rate": 0.001953694410044486, "loss": 2.5556, "step": 4627 }, { "epoch": 0.12, "learning_rate": 0.0019536682270200945, "loss": 2.768, "step": 4628 }, { "epoch": 0.12, "learning_rate": 0.0019536420367708834, "loss": 2.5472, "step": 4629 }, { "epoch": 0.12, "learning_rate": 0.001953615839297051, "loss": 2.5836, "step": 4630 }, { "epoch": 0.12, "learning_rate": 0.001953589634598795, "loss": 2.4925, "step": 4631 }, { "epoch": 0.12, "learning_rate": 0.0019535634226763143, "loss": 2.8136, "step": 4632 }, { "epoch": 0.12, "learning_rate": 0.001953537203529808, "loss": 2.8331, "step": 4633 }, { "epoch": 0.12, "learning_rate": 0.0019535109771594743, "loss": 2.5933, "step": 4634 }, { "epoch": 0.12, "learning_rate": 0.001953484743565512, "loss": 2.8318, "step": 4635 }, { "epoch": 0.12, "learning_rate": 0.001953458502748119, "loss": 2.507, "step": 4636 }, { "epoch": 0.12, "learning_rate": 0.0019534322547074953, "loss": 2.6036, "step": 4637 }, { "epoch": 0.12, "learning_rate": 0.0019534059994438394, "loss": 2.6707, "step": 4638 }, { "epoch": 0.12, "learning_rate": 0.00195337973695735, "loss": 2.9058, "step": 4639 }, { "epoch": 0.12, "learning_rate": 0.0019533534672482263, "loss": 3.0845, "step": 4640 }, { "epoch": 0.12, "learning_rate": 0.0019533271903166673, "loss": 2.4493, "step": 4641 }, { "epoch": 0.12, "learning_rate": 0.001953300906162872, "loss": 2.7175, "step": 4642 }, { "epoch": 0.12, "learning_rate": 0.001953274614787039, "loss": 2.9349, "step": 4643 }, { "epoch": 0.12, "learning_rate": 0.0019532483161893684, "loss": 2.5667, "step": 4644 }, { "epoch": 0.12, "learning_rate": 0.0019532220103700582, "loss": 2.6026, "step": 4645 }, { "epoch": 0.12, "learning_rate": 0.0019531956973293093, "loss": 2.7092, "step": 4646 }, { "epoch": 0.12, "learning_rate": 0.00195316937706732, "loss": 3.1785, "step": 4647 }, { "epoch": 0.12, "learning_rate": 0.00195314304958429, "loss": 2.7657, "step": 4648 }, { "epoch": 0.12, "learning_rate": 0.0019531167148804185, "loss": 2.2034, "step": 4649 }, { "epoch": 0.12, "learning_rate": 0.001953090372955905, "loss": 2.901, "step": 4650 }, { "epoch": 0.12, "learning_rate": 0.0019530640238109495, "loss": 3.0948, "step": 4651 }, { "epoch": 0.13, "learning_rate": 0.0019530376674457514, "loss": 2.7908, "step": 4652 }, { "epoch": 0.13, "learning_rate": 0.0019530113038605103, "loss": 2.9847, "step": 4653 }, { "epoch": 0.13, "learning_rate": 0.0019529849330554257, "loss": 2.1443, "step": 4654 }, { "epoch": 0.13, "learning_rate": 0.0019529585550306977, "loss": 2.9034, "step": 4655 }, { "epoch": 0.13, "learning_rate": 0.0019529321697865259, "loss": 2.4907, "step": 4656 }, { "epoch": 0.13, "learning_rate": 0.0019529057773231106, "loss": 2.9546, "step": 4657 }, { "epoch": 0.13, "learning_rate": 0.0019528793776406514, "loss": 2.5243, "step": 4658 }, { "epoch": 0.13, "learning_rate": 0.0019528529707393484, "loss": 2.6118, "step": 4659 }, { "epoch": 0.13, "learning_rate": 0.001952826556619402, "loss": 2.732, "step": 4660 }, { "epoch": 0.13, "learning_rate": 0.0019528001352810116, "loss": 2.6866, "step": 4661 }, { "epoch": 0.13, "learning_rate": 0.001952773706724378, "loss": 2.2785, "step": 4662 }, { "epoch": 0.13, "learning_rate": 0.0019527472709497005, "loss": 2.4463, "step": 4663 }, { "epoch": 0.13, "learning_rate": 0.0019527208279571805, "loss": 2.559, "step": 4664 }, { "epoch": 0.13, "learning_rate": 0.001952694377747018, "loss": 2.8323, "step": 4665 }, { "epoch": 0.13, "learning_rate": 0.0019526679203194126, "loss": 2.5688, "step": 4666 }, { "epoch": 0.13, "learning_rate": 0.001952641455674566, "loss": 2.8611, "step": 4667 }, { "epoch": 0.13, "learning_rate": 0.0019526149838126777, "loss": 2.6264, "step": 4668 }, { "epoch": 0.13, "learning_rate": 0.0019525885047339488, "loss": 2.6065, "step": 4669 }, { "epoch": 0.13, "learning_rate": 0.0019525620184385796, "loss": 2.5818, "step": 4670 }, { "epoch": 0.13, "learning_rate": 0.0019525355249267707, "loss": 2.6825, "step": 4671 }, { "epoch": 0.13, "learning_rate": 0.0019525090241987232, "loss": 3.0341, "step": 4672 }, { "epoch": 0.13, "learning_rate": 0.001952482516254637, "loss": 2.7321, "step": 4673 }, { "epoch": 0.13, "learning_rate": 0.0019524560010947144, "loss": 2.6789, "step": 4674 }, { "epoch": 0.13, "learning_rate": 0.001952429478719155, "loss": 2.7334, "step": 4675 }, { "epoch": 0.13, "learning_rate": 0.0019524029491281604, "loss": 2.4719, "step": 4676 }, { "epoch": 0.13, "learning_rate": 0.001952376412321931, "loss": 2.7589, "step": 4677 }, { "epoch": 0.13, "learning_rate": 0.0019523498683006683, "loss": 2.7196, "step": 4678 }, { "epoch": 0.13, "learning_rate": 0.0019523233170645733, "loss": 2.8339, "step": 4679 }, { "epoch": 0.13, "learning_rate": 0.001952296758613847, "loss": 2.4804, "step": 4680 }, { "epoch": 0.13, "learning_rate": 0.0019522701929486908, "loss": 2.7779, "step": 4681 }, { "epoch": 0.13, "learning_rate": 0.0019522436200693058, "loss": 2.6556, "step": 4682 }, { "epoch": 0.13, "learning_rate": 0.0019522170399758937, "loss": 2.8839, "step": 4683 }, { "epoch": 0.13, "learning_rate": 0.0019521904526686553, "loss": 2.7039, "step": 4684 }, { "epoch": 0.13, "learning_rate": 0.001952163858147792, "loss": 3.1255, "step": 4685 }, { "epoch": 0.13, "learning_rate": 0.001952137256413506, "loss": 2.6665, "step": 4686 }, { "epoch": 0.13, "learning_rate": 0.0019521106474659979, "loss": 2.4436, "step": 4687 }, { "epoch": 0.13, "learning_rate": 0.0019520840313054703, "loss": 2.5973, "step": 4688 }, { "epoch": 0.13, "learning_rate": 0.0019520574079321242, "loss": 2.7295, "step": 4689 }, { "epoch": 0.13, "learning_rate": 0.001952030777346161, "loss": 2.7919, "step": 4690 }, { "epoch": 0.13, "learning_rate": 0.0019520041395477833, "loss": 2.862, "step": 4691 }, { "epoch": 0.13, "learning_rate": 0.001951977494537192, "loss": 2.8148, "step": 4692 }, { "epoch": 0.13, "learning_rate": 0.0019519508423145894, "loss": 2.6271, "step": 4693 }, { "epoch": 0.13, "learning_rate": 0.0019519241828801776, "loss": 2.842, "step": 4694 }, { "epoch": 0.13, "learning_rate": 0.0019518975162341585, "loss": 2.9963, "step": 4695 }, { "epoch": 0.13, "learning_rate": 0.001951870842376734, "loss": 2.6343, "step": 4696 }, { "epoch": 0.13, "learning_rate": 0.0019518441613081059, "loss": 2.6239, "step": 4697 }, { "epoch": 0.13, "learning_rate": 0.001951817473028477, "loss": 2.6671, "step": 4698 }, { "epoch": 0.13, "learning_rate": 0.0019517907775380486, "loss": 2.7364, "step": 4699 }, { "epoch": 0.13, "learning_rate": 0.0019517640748370239, "loss": 2.8006, "step": 4700 }, { "epoch": 0.13, "learning_rate": 0.0019517373649256045, "loss": 3.0279, "step": 4701 }, { "epoch": 0.13, "learning_rate": 0.001951710647803993, "loss": 2.709, "step": 4702 }, { "epoch": 0.13, "learning_rate": 0.0019516839234723917, "loss": 2.8674, "step": 4703 }, { "epoch": 0.13, "learning_rate": 0.001951657191931003, "loss": 2.7042, "step": 4704 }, { "epoch": 0.13, "learning_rate": 0.0019516304531800302, "loss": 2.8912, "step": 4705 }, { "epoch": 0.13, "learning_rate": 0.0019516037072196746, "loss": 2.8043, "step": 4706 }, { "epoch": 0.13, "learning_rate": 0.0019515769540501397, "loss": 2.7082, "step": 4707 }, { "epoch": 0.13, "learning_rate": 0.0019515501936716278, "loss": 2.7809, "step": 4708 }, { "epoch": 0.13, "learning_rate": 0.001951523426084342, "loss": 2.4664, "step": 4709 }, { "epoch": 0.13, "learning_rate": 0.0019514966512884846, "loss": 2.6689, "step": 4710 }, { "epoch": 0.13, "learning_rate": 0.0019514698692842587, "loss": 2.579, "step": 4711 }, { "epoch": 0.13, "learning_rate": 0.0019514430800718673, "loss": 2.2322, "step": 4712 }, { "epoch": 0.13, "learning_rate": 0.001951416283651513, "loss": 2.8119, "step": 4713 }, { "epoch": 0.13, "learning_rate": 0.001951389480023399, "loss": 2.7808, "step": 4714 }, { "epoch": 0.13, "learning_rate": 0.0019513626691877288, "loss": 2.7977, "step": 4715 }, { "epoch": 0.13, "learning_rate": 0.0019513358511447049, "loss": 2.8172, "step": 4716 }, { "epoch": 0.13, "learning_rate": 0.0019513090258945307, "loss": 2.7485, "step": 4717 }, { "epoch": 0.13, "learning_rate": 0.0019512821934374092, "loss": 2.5943, "step": 4718 }, { "epoch": 0.13, "learning_rate": 0.001951255353773544, "loss": 2.8386, "step": 4719 }, { "epoch": 0.13, "learning_rate": 0.0019512285069031386, "loss": 2.5554, "step": 4720 }, { "epoch": 0.13, "learning_rate": 0.0019512016528263959, "loss": 2.6771, "step": 4721 }, { "epoch": 0.13, "learning_rate": 0.0019511747915435193, "loss": 2.5342, "step": 4722 }, { "epoch": 0.13, "learning_rate": 0.0019511479230547126, "loss": 2.5894, "step": 4723 }, { "epoch": 0.13, "learning_rate": 0.0019511210473601795, "loss": 2.9401, "step": 4724 }, { "epoch": 0.13, "learning_rate": 0.0019510941644601233, "loss": 2.5846, "step": 4725 }, { "epoch": 0.13, "learning_rate": 0.0019510672743547476, "loss": 2.8446, "step": 4726 }, { "epoch": 0.13, "learning_rate": 0.0019510403770442565, "loss": 2.8928, "step": 4727 }, { "epoch": 0.13, "learning_rate": 0.0019510134725288532, "loss": 2.7158, "step": 4728 }, { "epoch": 0.13, "learning_rate": 0.0019509865608087424, "loss": 2.6623, "step": 4729 }, { "epoch": 0.13, "learning_rate": 0.001950959641884127, "loss": 3.0338, "step": 4730 }, { "epoch": 0.13, "learning_rate": 0.0019509327157552115, "loss": 2.9519, "step": 4731 }, { "epoch": 0.13, "learning_rate": 0.0019509057824221997, "loss": 2.8648, "step": 4732 }, { "epoch": 0.13, "learning_rate": 0.0019508788418852957, "loss": 2.459, "step": 4733 }, { "epoch": 0.13, "learning_rate": 0.0019508518941447038, "loss": 3.3122, "step": 4734 }, { "epoch": 0.13, "learning_rate": 0.0019508249392006277, "loss": 2.7769, "step": 4735 }, { "epoch": 0.13, "learning_rate": 0.0019507979770532718, "loss": 3.0999, "step": 4736 }, { "epoch": 0.13, "learning_rate": 0.0019507710077028408, "loss": 2.4893, "step": 4737 }, { "epoch": 0.13, "learning_rate": 0.0019507440311495382, "loss": 2.865, "step": 4738 }, { "epoch": 0.13, "learning_rate": 0.001950717047393569, "loss": 2.6569, "step": 4739 }, { "epoch": 0.13, "learning_rate": 0.0019506900564351373, "loss": 2.8894, "step": 4740 }, { "epoch": 0.13, "learning_rate": 0.001950663058274448, "loss": 2.5607, "step": 4741 }, { "epoch": 0.13, "learning_rate": 0.0019506360529117051, "loss": 2.8373, "step": 4742 }, { "epoch": 0.13, "learning_rate": 0.0019506090403471133, "loss": 2.5334, "step": 4743 }, { "epoch": 0.13, "learning_rate": 0.0019505820205808775, "loss": 2.6408, "step": 4744 }, { "epoch": 0.13, "learning_rate": 0.0019505549936132023, "loss": 3.2396, "step": 4745 }, { "epoch": 0.13, "learning_rate": 0.0019505279594442923, "loss": 2.6644, "step": 4746 }, { "epoch": 0.13, "learning_rate": 0.0019505009180743524, "loss": 2.8042, "step": 4747 }, { "epoch": 0.13, "learning_rate": 0.0019504738695035877, "loss": 2.8027, "step": 4748 }, { "epoch": 0.13, "learning_rate": 0.001950446813732203, "loss": 2.7123, "step": 4749 }, { "epoch": 0.13, "learning_rate": 0.001950419750760403, "loss": 2.9792, "step": 4750 }, { "epoch": 0.13, "learning_rate": 0.0019503926805883927, "loss": 2.4349, "step": 4751 }, { "epoch": 0.13, "learning_rate": 0.0019503656032163774, "loss": 2.6702, "step": 4752 }, { "epoch": 0.13, "learning_rate": 0.0019503385186445624, "loss": 2.9275, "step": 4753 }, { "epoch": 0.13, "learning_rate": 0.0019503114268731526, "loss": 2.4213, "step": 4754 }, { "epoch": 0.13, "learning_rate": 0.0019502843279023533, "loss": 2.9046, "step": 4755 }, { "epoch": 0.13, "learning_rate": 0.0019502572217323696, "loss": 2.7908, "step": 4756 }, { "epoch": 0.13, "learning_rate": 0.0019502301083634075, "loss": 2.851, "step": 4757 }, { "epoch": 0.13, "learning_rate": 0.0019502029877956715, "loss": 2.8959, "step": 4758 }, { "epoch": 0.13, "learning_rate": 0.001950175860029368, "loss": 2.4445, "step": 4759 }, { "epoch": 0.13, "learning_rate": 0.001950148725064702, "loss": 2.6649, "step": 4760 }, { "epoch": 0.13, "learning_rate": 0.001950121582901879, "loss": 3.0123, "step": 4761 }, { "epoch": 0.13, "learning_rate": 0.0019500944335411048, "loss": 2.5867, "step": 4762 }, { "epoch": 0.13, "learning_rate": 0.0019500672769825849, "loss": 3.1206, "step": 4763 }, { "epoch": 0.13, "learning_rate": 0.0019500401132265253, "loss": 2.9574, "step": 4764 }, { "epoch": 0.13, "learning_rate": 0.0019500129422731316, "loss": 2.5305, "step": 4765 }, { "epoch": 0.13, "learning_rate": 0.0019499857641226098, "loss": 2.5022, "step": 4766 }, { "epoch": 0.13, "learning_rate": 0.0019499585787751657, "loss": 2.9385, "step": 4767 }, { "epoch": 0.13, "learning_rate": 0.001949931386231005, "loss": 2.747, "step": 4768 }, { "epoch": 0.13, "learning_rate": 0.0019499041864903342, "loss": 2.624, "step": 4769 }, { "epoch": 0.13, "learning_rate": 0.0019498769795533591, "loss": 2.3954, "step": 4770 }, { "epoch": 0.13, "learning_rate": 0.0019498497654202858, "loss": 2.5078, "step": 4771 }, { "epoch": 0.13, "learning_rate": 0.00194982254409132, "loss": 2.6613, "step": 4772 }, { "epoch": 0.13, "learning_rate": 0.0019497953155666692, "loss": 2.6289, "step": 4773 }, { "epoch": 0.13, "learning_rate": 0.0019497680798465384, "loss": 2.8259, "step": 4774 }, { "epoch": 0.13, "learning_rate": 0.0019497408369311348, "loss": 2.7326, "step": 4775 }, { "epoch": 0.13, "learning_rate": 0.0019497135868206642, "loss": 2.5629, "step": 4776 }, { "epoch": 0.13, "learning_rate": 0.0019496863295153332, "loss": 2.8535, "step": 4777 }, { "epoch": 0.13, "learning_rate": 0.0019496590650153482, "loss": 2.8367, "step": 4778 }, { "epoch": 0.13, "learning_rate": 0.0019496317933209162, "loss": 2.7601, "step": 4779 }, { "epoch": 0.13, "learning_rate": 0.0019496045144322437, "loss": 3.1163, "step": 4780 }, { "epoch": 0.13, "learning_rate": 0.0019495772283495368, "loss": 2.6473, "step": 4781 }, { "epoch": 0.13, "learning_rate": 0.0019495499350730028, "loss": 2.9995, "step": 4782 }, { "epoch": 0.13, "learning_rate": 0.0019495226346028481, "loss": 2.5655, "step": 4783 }, { "epoch": 0.13, "learning_rate": 0.0019494953269392796, "loss": 2.7229, "step": 4784 }, { "epoch": 0.13, "learning_rate": 0.0019494680120825043, "loss": 2.608, "step": 4785 }, { "epoch": 0.13, "learning_rate": 0.0019494406900327293, "loss": 2.8441, "step": 4786 }, { "epoch": 0.13, "learning_rate": 0.001949413360790161, "loss": 3.0204, "step": 4787 }, { "epoch": 0.13, "learning_rate": 0.0019493860243550074, "loss": 2.8962, "step": 4788 }, { "epoch": 0.13, "learning_rate": 0.0019493586807274746, "loss": 2.9782, "step": 4789 }, { "epoch": 0.13, "learning_rate": 0.0019493313299077705, "loss": 2.4667, "step": 4790 }, { "epoch": 0.13, "learning_rate": 0.0019493039718961015, "loss": 2.4523, "step": 4791 }, { "epoch": 0.13, "learning_rate": 0.0019492766066926755, "loss": 2.7076, "step": 4792 }, { "epoch": 0.13, "learning_rate": 0.0019492492342976996, "loss": 2.5151, "step": 4793 }, { "epoch": 0.13, "learning_rate": 0.0019492218547113814, "loss": 2.4927, "step": 4794 }, { "epoch": 0.13, "learning_rate": 0.001949194467933928, "loss": 2.2002, "step": 4795 }, { "epoch": 0.13, "learning_rate": 0.0019491670739655471, "loss": 2.7251, "step": 4796 }, { "epoch": 0.13, "learning_rate": 0.001949139672806446, "loss": 2.3582, "step": 4797 }, { "epoch": 0.13, "learning_rate": 0.0019491122644568328, "loss": 2.6495, "step": 4798 }, { "epoch": 0.13, "learning_rate": 0.0019490848489169144, "loss": 2.8121, "step": 4799 }, { "epoch": 0.13, "learning_rate": 0.001949057426186899, "loss": 2.3494, "step": 4800 }, { "epoch": 0.13, "learning_rate": 0.0019490299962669942, "loss": 2.4926, "step": 4801 }, { "epoch": 0.13, "learning_rate": 0.0019490025591574077, "loss": 2.7626, "step": 4802 }, { "epoch": 0.13, "learning_rate": 0.0019489751148583476, "loss": 3.0088, "step": 4803 }, { "epoch": 0.13, "learning_rate": 0.0019489476633700216, "loss": 2.3126, "step": 4804 }, { "epoch": 0.13, "learning_rate": 0.0019489202046926377, "loss": 2.6101, "step": 4805 }, { "epoch": 0.13, "learning_rate": 0.0019488927388264042, "loss": 2.6038, "step": 4806 }, { "epoch": 0.13, "learning_rate": 0.0019488652657715288, "loss": 2.5787, "step": 4807 }, { "epoch": 0.13, "learning_rate": 0.00194883778552822, "loss": 2.546, "step": 4808 }, { "epoch": 0.13, "learning_rate": 0.0019488102980966856, "loss": 2.567, "step": 4809 }, { "epoch": 0.13, "learning_rate": 0.0019487828034771338, "loss": 2.7185, "step": 4810 }, { "epoch": 0.13, "learning_rate": 0.0019487553016697735, "loss": 3.0284, "step": 4811 }, { "epoch": 0.13, "learning_rate": 0.0019487277926748124, "loss": 2.6432, "step": 4812 }, { "epoch": 0.13, "learning_rate": 0.0019487002764924594, "loss": 2.7887, "step": 4813 }, { "epoch": 0.13, "learning_rate": 0.0019486727531229226, "loss": 2.9409, "step": 4814 }, { "epoch": 0.13, "learning_rate": 0.0019486452225664103, "loss": 2.3182, "step": 4815 }, { "epoch": 0.13, "learning_rate": 0.001948617684823132, "loss": 2.7214, "step": 4816 }, { "epoch": 0.13, "learning_rate": 0.0019485901398932953, "loss": 2.6023, "step": 4817 }, { "epoch": 0.13, "learning_rate": 0.0019485625877771094, "loss": 2.8377, "step": 4818 }, { "epoch": 0.13, "learning_rate": 0.001948535028474783, "loss": 2.6935, "step": 4819 }, { "epoch": 0.13, "learning_rate": 0.0019485074619865247, "loss": 2.854, "step": 4820 }, { "epoch": 0.13, "learning_rate": 0.0019484798883125435, "loss": 2.5642, "step": 4821 }, { "epoch": 0.13, "learning_rate": 0.001948452307453048, "loss": 2.6032, "step": 4822 }, { "epoch": 0.13, "learning_rate": 0.0019484247194082478, "loss": 3.0796, "step": 4823 }, { "epoch": 0.13, "learning_rate": 0.0019483971241783511, "loss": 2.7066, "step": 4824 }, { "epoch": 0.13, "learning_rate": 0.0019483695217635676, "loss": 2.7672, "step": 4825 }, { "epoch": 0.13, "learning_rate": 0.001948341912164106, "loss": 2.5978, "step": 4826 }, { "epoch": 0.13, "learning_rate": 0.0019483142953801759, "loss": 2.5715, "step": 4827 }, { "epoch": 0.13, "learning_rate": 0.001948286671411986, "loss": 2.6464, "step": 4828 }, { "epoch": 0.13, "learning_rate": 0.0019482590402597458, "loss": 2.5516, "step": 4829 }, { "epoch": 0.13, "learning_rate": 0.0019482314019236648, "loss": 2.7783, "step": 4830 }, { "epoch": 0.13, "learning_rate": 0.0019482037564039522, "loss": 2.4649, "step": 4831 }, { "epoch": 0.13, "learning_rate": 0.0019481761037008173, "loss": 2.8654, "step": 4832 }, { "epoch": 0.13, "learning_rate": 0.0019481484438144698, "loss": 2.6675, "step": 4833 }, { "epoch": 0.13, "learning_rate": 0.0019481207767451192, "loss": 2.5955, "step": 4834 }, { "epoch": 0.13, "learning_rate": 0.0019480931024929752, "loss": 3.1112, "step": 4835 }, { "epoch": 0.13, "learning_rate": 0.0019480654210582474, "loss": 2.8849, "step": 4836 }, { "epoch": 0.13, "learning_rate": 0.0019480377324411454, "loss": 2.7556, "step": 4837 }, { "epoch": 0.13, "learning_rate": 0.001948010036641879, "loss": 3.0814, "step": 4838 }, { "epoch": 0.13, "learning_rate": 0.001947982333660658, "loss": 2.4526, "step": 4839 }, { "epoch": 0.13, "learning_rate": 0.0019479546234976923, "loss": 2.8684, "step": 4840 }, { "epoch": 0.13, "learning_rate": 0.0019479269061531922, "loss": 2.8167, "step": 4841 }, { "epoch": 0.13, "learning_rate": 0.001947899181627367, "loss": 2.8555, "step": 4842 }, { "epoch": 0.13, "learning_rate": 0.001947871449920427, "loss": 2.7294, "step": 4843 }, { "epoch": 0.13, "learning_rate": 0.0019478437110325825, "loss": 2.7285, "step": 4844 }, { "epoch": 0.13, "learning_rate": 0.0019478159649640437, "loss": 2.9037, "step": 4845 }, { "epoch": 0.13, "learning_rate": 0.0019477882117150203, "loss": 2.6992, "step": 4846 }, { "epoch": 0.13, "learning_rate": 0.001947760451285723, "loss": 2.9655, "step": 4847 }, { "epoch": 0.13, "learning_rate": 0.001947732683676362, "loss": 2.5465, "step": 4848 }, { "epoch": 0.13, "learning_rate": 0.0019477049088871474, "loss": 2.7906, "step": 4849 }, { "epoch": 0.13, "learning_rate": 0.0019476771269182902, "loss": 2.6326, "step": 4850 }, { "epoch": 0.13, "learning_rate": 0.0019476493377700002, "loss": 2.7102, "step": 4851 }, { "epoch": 0.13, "learning_rate": 0.0019476215414424886, "loss": 2.6842, "step": 4852 }, { "epoch": 0.13, "learning_rate": 0.0019475937379359652, "loss": 2.7089, "step": 4853 }, { "epoch": 0.13, "learning_rate": 0.0019475659272506411, "loss": 3.0108, "step": 4854 }, { "epoch": 0.13, "learning_rate": 0.001947538109386727, "loss": 3.0837, "step": 4855 }, { "epoch": 0.13, "learning_rate": 0.0019475102843444338, "loss": 2.516, "step": 4856 }, { "epoch": 0.13, "learning_rate": 0.001947482452123972, "loss": 2.6699, "step": 4857 }, { "epoch": 0.13, "learning_rate": 0.0019474546127255525, "loss": 2.987, "step": 4858 }, { "epoch": 0.13, "learning_rate": 0.0019474267661493863, "loss": 2.74, "step": 4859 }, { "epoch": 0.13, "learning_rate": 0.001947398912395684, "loss": 2.7202, "step": 4860 }, { "epoch": 0.13, "learning_rate": 0.0019473710514646574, "loss": 2.6123, "step": 4861 }, { "epoch": 0.13, "learning_rate": 0.0019473431833565166, "loss": 2.4712, "step": 4862 }, { "epoch": 0.13, "learning_rate": 0.0019473153080714735, "loss": 3.1242, "step": 4863 }, { "epoch": 0.13, "learning_rate": 0.001947287425609739, "loss": 2.8015, "step": 4864 }, { "epoch": 0.13, "learning_rate": 0.0019472595359715243, "loss": 2.3842, "step": 4865 }, { "epoch": 0.13, "learning_rate": 0.0019472316391570407, "loss": 2.6767, "step": 4866 }, { "epoch": 0.13, "learning_rate": 0.0019472037351664995, "loss": 2.8076, "step": 4867 }, { "epoch": 0.13, "learning_rate": 0.0019471758240001123, "loss": 2.4616, "step": 4868 }, { "epoch": 0.13, "learning_rate": 0.0019471479056580902, "loss": 2.9018, "step": 4869 }, { "epoch": 0.13, "learning_rate": 0.001947119980140645, "loss": 2.6996, "step": 4870 }, { "epoch": 0.13, "learning_rate": 0.0019470920474479881, "loss": 2.5938, "step": 4871 }, { "epoch": 0.13, "learning_rate": 0.001947064107580331, "loss": 2.38, "step": 4872 }, { "epoch": 0.13, "learning_rate": 0.0019470361605378858, "loss": 2.5989, "step": 4873 }, { "epoch": 0.13, "learning_rate": 0.0019470082063208641, "loss": 2.7393, "step": 4874 }, { "epoch": 0.13, "learning_rate": 0.0019469802449294774, "loss": 2.8954, "step": 4875 }, { "epoch": 0.13, "learning_rate": 0.0019469522763639377, "loss": 2.5619, "step": 4876 }, { "epoch": 0.13, "learning_rate": 0.0019469243006244566, "loss": 2.4372, "step": 4877 }, { "epoch": 0.13, "learning_rate": 0.0019468963177112465, "loss": 2.4361, "step": 4878 }, { "epoch": 0.13, "learning_rate": 0.001946868327624519, "loss": 2.465, "step": 4879 }, { "epoch": 0.13, "learning_rate": 0.0019468403303644867, "loss": 2.581, "step": 4880 }, { "epoch": 0.13, "learning_rate": 0.0019468123259313611, "loss": 2.7095, "step": 4881 }, { "epoch": 0.13, "learning_rate": 0.0019467843143253546, "loss": 2.5776, "step": 4882 }, { "epoch": 0.13, "learning_rate": 0.0019467562955466794, "loss": 2.9993, "step": 4883 }, { "epoch": 0.13, "learning_rate": 0.0019467282695955477, "loss": 2.4432, "step": 4884 }, { "epoch": 0.13, "learning_rate": 0.001946700236472172, "loss": 2.8494, "step": 4885 }, { "epoch": 0.13, "learning_rate": 0.0019466721961767647, "loss": 2.6094, "step": 4886 }, { "epoch": 0.13, "learning_rate": 0.0019466441487095377, "loss": 2.8607, "step": 4887 }, { "epoch": 0.13, "learning_rate": 0.0019466160940707043, "loss": 3.0272, "step": 4888 }, { "epoch": 0.13, "learning_rate": 0.0019465880322604764, "loss": 2.5129, "step": 4889 }, { "epoch": 0.13, "learning_rate": 0.0019465599632790666, "loss": 2.5159, "step": 4890 }, { "epoch": 0.13, "learning_rate": 0.001946531887126688, "loss": 2.6748, "step": 4891 }, { "epoch": 0.13, "learning_rate": 0.001946503803803553, "loss": 2.7641, "step": 4892 }, { "epoch": 0.13, "learning_rate": 0.0019464757133098743, "loss": 3.0382, "step": 4893 }, { "epoch": 0.13, "learning_rate": 0.001946447615645865, "loss": 3.029, "step": 4894 }, { "epoch": 0.13, "learning_rate": 0.0019464195108117378, "loss": 2.9356, "step": 4895 }, { "epoch": 0.13, "learning_rate": 0.0019463913988077054, "loss": 2.5479, "step": 4896 }, { "epoch": 0.13, "learning_rate": 0.0019463632796339811, "loss": 2.674, "step": 4897 }, { "epoch": 0.13, "learning_rate": 0.0019463351532907778, "loss": 2.7454, "step": 4898 }, { "epoch": 0.13, "learning_rate": 0.0019463070197783083, "loss": 2.5168, "step": 4899 }, { "epoch": 0.13, "learning_rate": 0.0019462788790967863, "loss": 2.7873, "step": 4900 }, { "epoch": 0.13, "learning_rate": 0.0019462507312464244, "loss": 2.6635, "step": 4901 }, { "epoch": 0.13, "learning_rate": 0.0019462225762274367, "loss": 2.8559, "step": 4902 }, { "epoch": 0.13, "learning_rate": 0.0019461944140400354, "loss": 2.6204, "step": 4903 }, { "epoch": 0.13, "learning_rate": 0.0019461662446844344, "loss": 2.577, "step": 4904 }, { "epoch": 0.13, "learning_rate": 0.0019461380681608472, "loss": 2.6039, "step": 4905 }, { "epoch": 0.13, "learning_rate": 0.0019461098844694874, "loss": 2.6692, "step": 4906 }, { "epoch": 0.13, "learning_rate": 0.001946081693610568, "loss": 2.4181, "step": 4907 }, { "epoch": 0.13, "learning_rate": 0.0019460534955843029, "loss": 2.6171, "step": 4908 }, { "epoch": 0.13, "learning_rate": 0.0019460252903909054, "loss": 2.8522, "step": 4909 }, { "epoch": 0.13, "learning_rate": 0.0019459970780305897, "loss": 2.6613, "step": 4910 }, { "epoch": 0.13, "learning_rate": 0.0019459688585035694, "loss": 3.0585, "step": 4911 }, { "epoch": 0.13, "learning_rate": 0.0019459406318100578, "loss": 2.4104, "step": 4912 }, { "epoch": 0.13, "learning_rate": 0.0019459123979502693, "loss": 2.5971, "step": 4913 }, { "epoch": 0.13, "learning_rate": 0.0019458841569244174, "loss": 2.8771, "step": 4914 }, { "epoch": 0.13, "learning_rate": 0.0019458559087327165, "loss": 3.2581, "step": 4915 }, { "epoch": 0.13, "learning_rate": 0.0019458276533753803, "loss": 2.5683, "step": 4916 }, { "epoch": 0.13, "learning_rate": 0.0019457993908526228, "loss": 2.8352, "step": 4917 }, { "epoch": 0.13, "learning_rate": 0.0019457711211646582, "loss": 2.5825, "step": 4918 }, { "epoch": 0.13, "learning_rate": 0.0019457428443117007, "loss": 2.5723, "step": 4919 }, { "epoch": 0.13, "learning_rate": 0.0019457145602939645, "loss": 2.837, "step": 4920 }, { "epoch": 0.13, "learning_rate": 0.001945686269111664, "loss": 2.7729, "step": 4921 }, { "epoch": 0.13, "learning_rate": 0.001945657970765013, "loss": 3.0353, "step": 4922 }, { "epoch": 0.13, "learning_rate": 0.0019456296652542266, "loss": 2.7794, "step": 4923 }, { "epoch": 0.13, "learning_rate": 0.0019456013525795191, "loss": 2.9659, "step": 4924 }, { "epoch": 0.13, "learning_rate": 0.0019455730327411045, "loss": 2.4999, "step": 4925 }, { "epoch": 0.13, "learning_rate": 0.0019455447057391978, "loss": 2.8427, "step": 4926 }, { "epoch": 0.13, "learning_rate": 0.0019455163715740133, "loss": 2.4442, "step": 4927 }, { "epoch": 0.13, "learning_rate": 0.001945488030245766, "loss": 2.7873, "step": 4928 }, { "epoch": 0.13, "learning_rate": 0.0019454596817546702, "loss": 2.7259, "step": 4929 }, { "epoch": 0.13, "learning_rate": 0.001945431326100941, "loss": 2.6175, "step": 4930 }, { "epoch": 0.13, "learning_rate": 0.0019454029632847934, "loss": 2.7519, "step": 4931 }, { "epoch": 0.13, "learning_rate": 0.0019453745933064415, "loss": 2.5984, "step": 4932 }, { "epoch": 0.13, "learning_rate": 0.0019453462161661008, "loss": 2.6226, "step": 4933 }, { "epoch": 0.13, "learning_rate": 0.0019453178318639863, "loss": 2.7446, "step": 4934 }, { "epoch": 0.13, "learning_rate": 0.001945289440400313, "loss": 3.0431, "step": 4935 }, { "epoch": 0.13, "learning_rate": 0.0019452610417752957, "loss": 3.007, "step": 4936 }, { "epoch": 0.13, "learning_rate": 0.0019452326359891497, "loss": 2.3533, "step": 4937 }, { "epoch": 0.13, "learning_rate": 0.0019452042230420905, "loss": 2.5065, "step": 4938 }, { "epoch": 0.13, "learning_rate": 0.001945175802934333, "loss": 2.3661, "step": 4939 }, { "epoch": 0.13, "learning_rate": 0.0019451473756660924, "loss": 2.5174, "step": 4940 }, { "epoch": 0.13, "learning_rate": 0.0019451189412375844, "loss": 2.5989, "step": 4941 }, { "epoch": 0.13, "learning_rate": 0.0019450904996490244, "loss": 2.5232, "step": 4942 }, { "epoch": 0.13, "learning_rate": 0.0019450620509006277, "loss": 2.5596, "step": 4943 }, { "epoch": 0.13, "learning_rate": 0.0019450335949926097, "loss": 2.5664, "step": 4944 }, { "epoch": 0.13, "learning_rate": 0.001945005131925186, "loss": 2.4762, "step": 4945 }, { "epoch": 0.13, "learning_rate": 0.0019449766616985728, "loss": 2.4131, "step": 4946 }, { "epoch": 0.13, "learning_rate": 0.001944948184312985, "loss": 2.8611, "step": 4947 }, { "epoch": 0.13, "learning_rate": 0.0019449196997686391, "loss": 2.9707, "step": 4948 }, { "epoch": 0.13, "learning_rate": 0.0019448912080657502, "loss": 2.7369, "step": 4949 }, { "epoch": 0.13, "learning_rate": 0.0019448627092045344, "loss": 2.9547, "step": 4950 }, { "epoch": 0.13, "learning_rate": 0.0019448342031852077, "loss": 2.72, "step": 4951 }, { "epoch": 0.13, "learning_rate": 0.001944805690007986, "loss": 2.5144, "step": 4952 }, { "epoch": 0.13, "learning_rate": 0.0019447771696730854, "loss": 2.5407, "step": 4953 }, { "epoch": 0.13, "learning_rate": 0.0019447486421807216, "loss": 2.7096, "step": 4954 }, { "epoch": 0.13, "learning_rate": 0.0019447201075311114, "loss": 2.6708, "step": 4955 }, { "epoch": 0.13, "learning_rate": 0.0019446915657244702, "loss": 2.6283, "step": 4956 }, { "epoch": 0.13, "learning_rate": 0.0019446630167610148, "loss": 2.3441, "step": 4957 }, { "epoch": 0.13, "learning_rate": 0.0019446344606409611, "loss": 2.6494, "step": 4958 }, { "epoch": 0.13, "learning_rate": 0.001944605897364526, "loss": 2.6794, "step": 4959 }, { "epoch": 0.13, "learning_rate": 0.0019445773269319252, "loss": 2.9535, "step": 4960 }, { "epoch": 0.13, "learning_rate": 0.0019445487493433755, "loss": 2.2121, "step": 4961 }, { "epoch": 0.13, "learning_rate": 0.0019445201645990934, "loss": 2.4625, "step": 4962 }, { "epoch": 0.13, "learning_rate": 0.0019444915726992953, "loss": 2.8716, "step": 4963 }, { "epoch": 0.13, "learning_rate": 0.001944462973644198, "loss": 2.8336, "step": 4964 }, { "epoch": 0.13, "learning_rate": 0.0019444343674340178, "loss": 2.5215, "step": 4965 }, { "epoch": 0.13, "learning_rate": 0.001944405754068972, "loss": 2.5163, "step": 4966 }, { "epoch": 0.13, "learning_rate": 0.0019443771335492768, "loss": 2.4637, "step": 4967 }, { "epoch": 0.13, "learning_rate": 0.0019443485058751495, "loss": 2.5095, "step": 4968 }, { "epoch": 0.13, "learning_rate": 0.0019443198710468066, "loss": 2.8227, "step": 4969 }, { "epoch": 0.13, "learning_rate": 0.0019442912290644652, "loss": 2.3306, "step": 4970 }, { "epoch": 0.13, "learning_rate": 0.0019442625799283425, "loss": 2.6949, "step": 4971 }, { "epoch": 0.13, "learning_rate": 0.001944233923638655, "loss": 2.437, "step": 4972 }, { "epoch": 0.13, "learning_rate": 0.00194420526019562, "loss": 2.1387, "step": 4973 }, { "epoch": 0.13, "learning_rate": 0.0019441765895994551, "loss": 2.8025, "step": 4974 }, { "epoch": 0.13, "learning_rate": 0.0019441479118503771, "loss": 2.7416, "step": 4975 }, { "epoch": 0.13, "learning_rate": 0.0019441192269486032, "loss": 3.2077, "step": 4976 }, { "epoch": 0.13, "learning_rate": 0.0019440905348943511, "loss": 2.5416, "step": 4977 }, { "epoch": 0.13, "learning_rate": 0.0019440618356878377, "loss": 2.4879, "step": 4978 }, { "epoch": 0.13, "learning_rate": 0.0019440331293292805, "loss": 2.9134, "step": 4979 }, { "epoch": 0.13, "learning_rate": 0.0019440044158188972, "loss": 2.4043, "step": 4980 }, { "epoch": 0.13, "learning_rate": 0.0019439756951569053, "loss": 2.4453, "step": 4981 }, { "epoch": 0.13, "learning_rate": 0.0019439469673435221, "loss": 2.9465, "step": 4982 }, { "epoch": 0.13, "learning_rate": 0.0019439182323789655, "loss": 2.7953, "step": 4983 }, { "epoch": 0.13, "learning_rate": 0.0019438894902634534, "loss": 2.816, "step": 4984 }, { "epoch": 0.13, "learning_rate": 0.001943860740997203, "loss": 2.4354, "step": 4985 }, { "epoch": 0.13, "learning_rate": 0.0019438319845804322, "loss": 3.0554, "step": 4986 }, { "epoch": 0.13, "learning_rate": 0.0019438032210133593, "loss": 2.8068, "step": 4987 }, { "epoch": 0.13, "learning_rate": 0.0019437744502962021, "loss": 2.6588, "step": 4988 }, { "epoch": 0.13, "learning_rate": 0.001943745672429178, "loss": 2.34, "step": 4989 }, { "epoch": 0.13, "learning_rate": 0.0019437168874125055, "loss": 2.4599, "step": 4990 }, { "epoch": 0.13, "learning_rate": 0.0019436880952464028, "loss": 2.9704, "step": 4991 }, { "epoch": 0.13, "learning_rate": 0.0019436592959310877, "loss": 2.6759, "step": 4992 }, { "epoch": 0.13, "learning_rate": 0.0019436304894667785, "loss": 2.6082, "step": 4993 }, { "epoch": 0.13, "learning_rate": 0.0019436016758536934, "loss": 2.8536, "step": 4994 }, { "epoch": 0.13, "learning_rate": 0.0019435728550920505, "loss": 2.7812, "step": 4995 }, { "epoch": 0.13, "learning_rate": 0.0019435440271820688, "loss": 2.6617, "step": 4996 }, { "epoch": 0.13, "learning_rate": 0.0019435151921239659, "loss": 2.8439, "step": 4997 }, { "epoch": 0.13, "learning_rate": 0.0019434863499179606, "loss": 2.7952, "step": 4998 }, { "epoch": 0.13, "learning_rate": 0.0019434575005642715, "loss": 2.4422, "step": 4999 }, { "epoch": 0.13, "learning_rate": 0.001943428644063117, "loss": 2.9449, "step": 5000 }, { "epoch": 0.13, "learning_rate": 0.0019433997804147159, "loss": 2.5238, "step": 5001 }, { "epoch": 0.13, "learning_rate": 0.0019433709096192864, "loss": 2.2946, "step": 5002 }, { "epoch": 0.13, "learning_rate": 0.0019433420316770477, "loss": 2.5744, "step": 5003 }, { "epoch": 0.13, "learning_rate": 0.0019433131465882185, "loss": 2.5727, "step": 5004 }, { "epoch": 0.13, "learning_rate": 0.0019432842543530176, "loss": 2.4274, "step": 5005 }, { "epoch": 0.13, "learning_rate": 0.001943255354971664, "loss": 2.7862, "step": 5006 }, { "epoch": 0.13, "learning_rate": 0.001943226448444376, "loss": 2.8435, "step": 5007 }, { "epoch": 0.13, "learning_rate": 0.001943197534771373, "loss": 2.745, "step": 5008 }, { "epoch": 0.13, "learning_rate": 0.0019431686139528745, "loss": 2.1992, "step": 5009 }, { "epoch": 0.13, "learning_rate": 0.0019431396859890993, "loss": 2.8231, "step": 5010 }, { "epoch": 0.13, "learning_rate": 0.001943110750880266, "loss": 2.7225, "step": 5011 }, { "epoch": 0.13, "learning_rate": 0.0019430818086265947, "loss": 2.932, "step": 5012 }, { "epoch": 0.13, "learning_rate": 0.001943052859228304, "loss": 2.5465, "step": 5013 }, { "epoch": 0.13, "learning_rate": 0.0019430239026856136, "loss": 2.3804, "step": 5014 }, { "epoch": 0.13, "learning_rate": 0.0019429949389987424, "loss": 2.6263, "step": 5015 }, { "epoch": 0.13, "learning_rate": 0.0019429659681679105, "loss": 2.6911, "step": 5016 }, { "epoch": 0.13, "learning_rate": 0.0019429369901933368, "loss": 2.4473, "step": 5017 }, { "epoch": 0.13, "learning_rate": 0.0019429080050752407, "loss": 3.0742, "step": 5018 }, { "epoch": 0.13, "learning_rate": 0.0019428790128138427, "loss": 2.6438, "step": 5019 }, { "epoch": 0.13, "learning_rate": 0.0019428500134093616, "loss": 2.7941, "step": 5020 }, { "epoch": 0.13, "learning_rate": 0.0019428210068620176, "loss": 2.4878, "step": 5021 }, { "epoch": 0.13, "learning_rate": 0.00194279199317203, "loss": 2.815, "step": 5022 }, { "epoch": 0.13, "learning_rate": 0.0019427629723396188, "loss": 2.9157, "step": 5023 }, { "epoch": 0.14, "learning_rate": 0.001942733944365004, "loss": 2.987, "step": 5024 }, { "epoch": 0.14, "learning_rate": 0.0019427049092484053, "loss": 2.8387, "step": 5025 }, { "epoch": 0.14, "learning_rate": 0.0019426758669900427, "loss": 3.049, "step": 5026 }, { "epoch": 0.14, "learning_rate": 0.0019426468175901363, "loss": 2.3185, "step": 5027 }, { "epoch": 0.14, "learning_rate": 0.0019426177610489062, "loss": 3.0277, "step": 5028 }, { "epoch": 0.14, "learning_rate": 0.0019425886973665726, "loss": 2.7887, "step": 5029 }, { "epoch": 0.14, "learning_rate": 0.0019425596265433551, "loss": 2.9025, "step": 5030 }, { "epoch": 0.14, "learning_rate": 0.0019425305485794749, "loss": 2.4636, "step": 5031 }, { "epoch": 0.14, "learning_rate": 0.0019425014634751514, "loss": 2.684, "step": 5032 }, { "epoch": 0.14, "learning_rate": 0.0019424723712306053, "loss": 2.6972, "step": 5033 }, { "epoch": 0.14, "learning_rate": 0.0019424432718460575, "loss": 2.7506, "step": 5034 }, { "epoch": 0.14, "learning_rate": 0.0019424141653217276, "loss": 2.8379, "step": 5035 }, { "epoch": 0.14, "learning_rate": 0.0019423850516578365, "loss": 2.8404, "step": 5036 }, { "epoch": 0.14, "learning_rate": 0.0019423559308546045, "loss": 2.4837, "step": 5037 }, { "epoch": 0.14, "learning_rate": 0.0019423268029122528, "loss": 2.8273, "step": 5038 }, { "epoch": 0.14, "learning_rate": 0.0019422976678310016, "loss": 2.9059, "step": 5039 }, { "epoch": 0.14, "learning_rate": 0.0019422685256110716, "loss": 3.1951, "step": 5040 }, { "epoch": 0.14, "learning_rate": 0.001942239376252684, "loss": 2.9625, "step": 5041 }, { "epoch": 0.14, "learning_rate": 0.0019422102197560593, "loss": 2.6825, "step": 5042 }, { "epoch": 0.14, "learning_rate": 0.0019421810561214181, "loss": 2.855, "step": 5043 }, { "epoch": 0.14, "learning_rate": 0.001942151885348982, "loss": 2.714, "step": 5044 }, { "epoch": 0.14, "learning_rate": 0.0019421227074389715, "loss": 2.4176, "step": 5045 }, { "epoch": 0.14, "learning_rate": 0.0019420935223916078, "loss": 2.5405, "step": 5046 }, { "epoch": 0.14, "learning_rate": 0.0019420643302071122, "loss": 2.5843, "step": 5047 }, { "epoch": 0.14, "learning_rate": 0.0019420351308857054, "loss": 2.7975, "step": 5048 }, { "epoch": 0.14, "learning_rate": 0.001942005924427609, "loss": 2.5833, "step": 5049 }, { "epoch": 0.14, "learning_rate": 0.0019419767108330439, "loss": 2.7547, "step": 5050 }, { "epoch": 0.14, "learning_rate": 0.001941947490102232, "loss": 2.6762, "step": 5051 }, { "epoch": 0.14, "learning_rate": 0.0019419182622353941, "loss": 3.0815, "step": 5052 }, { "epoch": 0.14, "learning_rate": 0.0019418890272327519, "loss": 2.8205, "step": 5053 }, { "epoch": 0.14, "learning_rate": 0.0019418597850945267, "loss": 2.6614, "step": 5054 }, { "epoch": 0.14, "learning_rate": 0.0019418305358209404, "loss": 3.0898, "step": 5055 }, { "epoch": 0.14, "learning_rate": 0.0019418012794122144, "loss": 2.7887, "step": 5056 }, { "epoch": 0.14, "learning_rate": 0.0019417720158685702, "loss": 2.8289, "step": 5057 }, { "epoch": 0.14, "learning_rate": 0.0019417427451902294, "loss": 2.886, "step": 5058 }, { "epoch": 0.14, "learning_rate": 0.0019417134673774142, "loss": 2.5649, "step": 5059 }, { "epoch": 0.14, "learning_rate": 0.001941684182430346, "loss": 2.6489, "step": 5060 }, { "epoch": 0.14, "learning_rate": 0.0019416548903492465, "loss": 2.526, "step": 5061 }, { "epoch": 0.14, "learning_rate": 0.001941625591134338, "loss": 2.8649, "step": 5062 }, { "epoch": 0.14, "learning_rate": 0.0019415962847858426, "loss": 2.6377, "step": 5063 }, { "epoch": 0.14, "learning_rate": 0.0019415669713039822, "loss": 2.8115, "step": 5064 }, { "epoch": 0.14, "learning_rate": 0.0019415376506889785, "loss": 2.6635, "step": 5065 }, { "epoch": 0.14, "learning_rate": 0.001941508322941054, "loss": 2.5573, "step": 5066 }, { "epoch": 0.14, "learning_rate": 0.001941478988060431, "loss": 2.6329, "step": 5067 }, { "epoch": 0.14, "learning_rate": 0.001941449646047331, "loss": 2.9198, "step": 5068 }, { "epoch": 0.14, "learning_rate": 0.001941420296901977, "loss": 2.7891, "step": 5069 }, { "epoch": 0.14, "learning_rate": 0.0019413909406245913, "loss": 2.9484, "step": 5070 }, { "epoch": 0.14, "learning_rate": 0.001941361577215396, "loss": 2.602, "step": 5071 }, { "epoch": 0.14, "learning_rate": 0.0019413322066746137, "loss": 2.8084, "step": 5072 }, { "epoch": 0.14, "learning_rate": 0.001941302829002467, "loss": 3.0104, "step": 5073 }, { "epoch": 0.14, "learning_rate": 0.0019412734441991782, "loss": 2.7275, "step": 5074 }, { "epoch": 0.14, "learning_rate": 0.00194124405226497, "loss": 2.95, "step": 5075 }, { "epoch": 0.14, "learning_rate": 0.0019412146532000654, "loss": 2.4999, "step": 5076 }, { "epoch": 0.14, "learning_rate": 0.0019411852470046869, "loss": 2.7737, "step": 5077 }, { "epoch": 0.14, "learning_rate": 0.001941155833679057, "loss": 2.703, "step": 5078 }, { "epoch": 0.14, "learning_rate": 0.0019411264132233987, "loss": 2.5464, "step": 5079 }, { "epoch": 0.14, "learning_rate": 0.0019410969856379352, "loss": 2.417, "step": 5080 }, { "epoch": 0.14, "learning_rate": 0.001941067550922889, "loss": 2.72, "step": 5081 }, { "epoch": 0.14, "learning_rate": 0.0019410381090784834, "loss": 2.2025, "step": 5082 }, { "epoch": 0.14, "learning_rate": 0.0019410086601049413, "loss": 2.5462, "step": 5083 }, { "epoch": 0.14, "learning_rate": 0.001940979204002486, "loss": 2.934, "step": 5084 }, { "epoch": 0.14, "learning_rate": 0.00194094974077134, "loss": 2.9092, "step": 5085 }, { "epoch": 0.14, "learning_rate": 0.0019409202704117276, "loss": 2.6642, "step": 5086 }, { "epoch": 0.14, "learning_rate": 0.0019408907929238711, "loss": 2.8059, "step": 5087 }, { "epoch": 0.14, "learning_rate": 0.001940861308307994, "loss": 2.5145, "step": 5088 }, { "epoch": 0.14, "learning_rate": 0.00194083181656432, "loss": 2.7504, "step": 5089 }, { "epoch": 0.14, "learning_rate": 0.0019408023176930725, "loss": 2.4611, "step": 5090 }, { "epoch": 0.14, "learning_rate": 0.0019407728116944748, "loss": 2.6951, "step": 5091 }, { "epoch": 0.14, "learning_rate": 0.0019407432985687504, "loss": 2.6349, "step": 5092 }, { "epoch": 0.14, "learning_rate": 0.0019407137783161229, "loss": 3.1052, "step": 5093 }, { "epoch": 0.14, "learning_rate": 0.0019406842509368163, "loss": 2.6831, "step": 5094 }, { "epoch": 0.14, "learning_rate": 0.0019406547164310536, "loss": 2.7714, "step": 5095 }, { "epoch": 0.14, "learning_rate": 0.001940625174799059, "loss": 2.4191, "step": 5096 }, { "epoch": 0.14, "learning_rate": 0.0019405956260410565, "loss": 3.0027, "step": 5097 }, { "epoch": 0.14, "learning_rate": 0.0019405660701572697, "loss": 2.779, "step": 5098 }, { "epoch": 0.14, "learning_rate": 0.0019405365071479223, "loss": 2.8019, "step": 5099 }, { "epoch": 0.14, "learning_rate": 0.0019405069370132387, "loss": 2.4848, "step": 5100 }, { "epoch": 0.14, "learning_rate": 0.0019404773597534424, "loss": 2.9729, "step": 5101 }, { "epoch": 0.14, "learning_rate": 0.001940447775368758, "loss": 2.9015, "step": 5102 }, { "epoch": 0.14, "learning_rate": 0.0019404181838594092, "loss": 2.5722, "step": 5103 }, { "epoch": 0.14, "learning_rate": 0.0019403885852256205, "loss": 2.9082, "step": 5104 }, { "epoch": 0.14, "learning_rate": 0.001940358979467616, "loss": 2.6789, "step": 5105 }, { "epoch": 0.14, "learning_rate": 0.00194032936658562, "loss": 2.8925, "step": 5106 }, { "epoch": 0.14, "learning_rate": 0.0019402997465798567, "loss": 2.791, "step": 5107 }, { "epoch": 0.14, "learning_rate": 0.0019402701194505508, "loss": 2.5326, "step": 5108 }, { "epoch": 0.14, "learning_rate": 0.0019402404851979265, "loss": 2.6657, "step": 5109 }, { "epoch": 0.14, "learning_rate": 0.0019402108438222084, "loss": 2.456, "step": 5110 }, { "epoch": 0.14, "learning_rate": 0.0019401811953236208, "loss": 2.9594, "step": 5111 }, { "epoch": 0.14, "learning_rate": 0.0019401515397023889, "loss": 2.7211, "step": 5112 }, { "epoch": 0.14, "learning_rate": 0.0019401218769587367, "loss": 2.7679, "step": 5113 }, { "epoch": 0.14, "learning_rate": 0.0019400922070928897, "loss": 2.4341, "step": 5114 }, { "epoch": 0.14, "learning_rate": 0.001940062530105072, "loss": 3.0433, "step": 5115 }, { "epoch": 0.14, "learning_rate": 0.0019400328459955086, "loss": 2.9081, "step": 5116 }, { "epoch": 0.14, "learning_rate": 0.0019400031547644244, "loss": 2.6286, "step": 5117 }, { "epoch": 0.14, "learning_rate": 0.0019399734564120444, "loss": 3.0491, "step": 5118 }, { "epoch": 0.14, "learning_rate": 0.0019399437509385936, "loss": 3.011, "step": 5119 }, { "epoch": 0.14, "learning_rate": 0.0019399140383442965, "loss": 2.6593, "step": 5120 }, { "epoch": 0.14, "learning_rate": 0.0019398843186293794, "loss": 3.1892, "step": 5121 }, { "epoch": 0.14, "learning_rate": 0.0019398545917940662, "loss": 2.4529, "step": 5122 }, { "epoch": 0.14, "learning_rate": 0.001939824857838583, "loss": 2.5329, "step": 5123 }, { "epoch": 0.14, "learning_rate": 0.0019397951167631545, "loss": 2.5422, "step": 5124 }, { "epoch": 0.14, "learning_rate": 0.0019397653685680064, "loss": 2.6438, "step": 5125 }, { "epoch": 0.14, "learning_rate": 0.0019397356132533636, "loss": 2.6597, "step": 5126 }, { "epoch": 0.14, "learning_rate": 0.0019397058508194521, "loss": 2.7207, "step": 5127 }, { "epoch": 0.14, "learning_rate": 0.001939676081266497, "loss": 2.4435, "step": 5128 }, { "epoch": 0.14, "learning_rate": 0.001939646304594724, "loss": 2.2858, "step": 5129 }, { "epoch": 0.14, "learning_rate": 0.0019396165208043583, "loss": 3.1156, "step": 5130 }, { "epoch": 0.14, "learning_rate": 0.001939586729895626, "loss": 2.6656, "step": 5131 }, { "epoch": 0.14, "learning_rate": 0.0019395569318687526, "loss": 2.5681, "step": 5132 }, { "epoch": 0.14, "learning_rate": 0.0019395271267239637, "loss": 2.4769, "step": 5133 }, { "epoch": 0.14, "learning_rate": 0.0019394973144614856, "loss": 2.6345, "step": 5134 }, { "epoch": 0.14, "learning_rate": 0.0019394674950815433, "loss": 2.8987, "step": 5135 }, { "epoch": 0.14, "learning_rate": 0.0019394376685843637, "loss": 2.7732, "step": 5136 }, { "epoch": 0.14, "learning_rate": 0.0019394078349701722, "loss": 1.8828, "step": 5137 }, { "epoch": 0.14, "learning_rate": 0.0019393779942391946, "loss": 2.679, "step": 5138 }, { "epoch": 0.14, "learning_rate": 0.0019393481463916575, "loss": 2.7807, "step": 5139 }, { "epoch": 0.14, "learning_rate": 0.0019393182914277868, "loss": 2.7076, "step": 5140 }, { "epoch": 0.14, "learning_rate": 0.0019392884293478088, "loss": 2.7288, "step": 5141 }, { "epoch": 0.14, "learning_rate": 0.0019392585601519493, "loss": 2.9839, "step": 5142 }, { "epoch": 0.14, "learning_rate": 0.0019392286838404349, "loss": 2.6571, "step": 5143 }, { "epoch": 0.14, "learning_rate": 0.0019391988004134923, "loss": 2.6196, "step": 5144 }, { "epoch": 0.14, "learning_rate": 0.0019391689098713467, "loss": 3.1624, "step": 5145 }, { "epoch": 0.14, "learning_rate": 0.001939139012214226, "loss": 2.94, "step": 5146 }, { "epoch": 0.14, "learning_rate": 0.0019391091074423559, "loss": 2.9456, "step": 5147 }, { "epoch": 0.14, "learning_rate": 0.001939079195555963, "loss": 2.9937, "step": 5148 }, { "epoch": 0.14, "learning_rate": 0.001939049276555274, "loss": 2.7095, "step": 5149 }, { "epoch": 0.14, "learning_rate": 0.0019390193504405157, "loss": 2.8411, "step": 5150 }, { "epoch": 0.14, "learning_rate": 0.0019389894172119147, "loss": 2.5458, "step": 5151 }, { "epoch": 0.14, "learning_rate": 0.0019389594768696977, "loss": 2.4722, "step": 5152 }, { "epoch": 0.14, "learning_rate": 0.0019389295294140916, "loss": 2.5266, "step": 5153 }, { "epoch": 0.14, "learning_rate": 0.001938899574845323, "loss": 2.6867, "step": 5154 }, { "epoch": 0.14, "learning_rate": 0.0019388696131636195, "loss": 2.4058, "step": 5155 }, { "epoch": 0.14, "learning_rate": 0.0019388396443692077, "loss": 2.8102, "step": 5156 }, { "epoch": 0.14, "learning_rate": 0.001938809668462314, "loss": 2.4698, "step": 5157 }, { "epoch": 0.14, "learning_rate": 0.0019387796854431665, "loss": 2.8396, "step": 5158 }, { "epoch": 0.14, "learning_rate": 0.0019387496953119918, "loss": 2.87, "step": 5159 }, { "epoch": 0.14, "learning_rate": 0.0019387196980690175, "loss": 2.7622, "step": 5160 }, { "epoch": 0.14, "learning_rate": 0.0019386896937144704, "loss": 2.5441, "step": 5161 }, { "epoch": 0.14, "learning_rate": 0.001938659682248578, "loss": 2.3164, "step": 5162 }, { "epoch": 0.14, "learning_rate": 0.0019386296636715677, "loss": 2.775, "step": 5163 }, { "epoch": 0.14, "learning_rate": 0.0019385996379836668, "loss": 2.8865, "step": 5164 }, { "epoch": 0.14, "learning_rate": 0.001938569605185103, "loss": 2.685, "step": 5165 }, { "epoch": 0.14, "learning_rate": 0.0019385395652761035, "loss": 2.7241, "step": 5166 }, { "epoch": 0.14, "learning_rate": 0.0019385095182568963, "loss": 2.5984, "step": 5167 }, { "epoch": 0.14, "learning_rate": 0.0019384794641277084, "loss": 2.7432, "step": 5168 }, { "epoch": 0.14, "learning_rate": 0.0019384494028887682, "loss": 2.4432, "step": 5169 }, { "epoch": 0.14, "learning_rate": 0.001938419334540303, "loss": 2.7252, "step": 5170 }, { "epoch": 0.14, "learning_rate": 0.0019383892590825408, "loss": 2.7666, "step": 5171 }, { "epoch": 0.14, "learning_rate": 0.0019383591765157091, "loss": 2.1735, "step": 5172 }, { "epoch": 0.14, "learning_rate": 0.0019383290868400362, "loss": 2.9586, "step": 5173 }, { "epoch": 0.14, "learning_rate": 0.00193829899005575, "loss": 2.7327, "step": 5174 }, { "epoch": 0.14, "learning_rate": 0.001938268886163078, "loss": 2.5766, "step": 5175 }, { "epoch": 0.14, "learning_rate": 0.001938238775162249, "loss": 2.9246, "step": 5176 }, { "epoch": 0.14, "learning_rate": 0.0019382086570534907, "loss": 2.2947, "step": 5177 }, { "epoch": 0.14, "learning_rate": 0.0019381785318370315, "loss": 2.835, "step": 5178 }, { "epoch": 0.14, "learning_rate": 0.001938148399513099, "loss": 2.6021, "step": 5179 }, { "epoch": 0.14, "learning_rate": 0.0019381182600819225, "loss": 3.014, "step": 5180 }, { "epoch": 0.14, "learning_rate": 0.0019380881135437297, "loss": 3.2705, "step": 5181 }, { "epoch": 0.14, "learning_rate": 0.0019380579598987486, "loss": 2.816, "step": 5182 }, { "epoch": 0.14, "learning_rate": 0.0019380277991472086, "loss": 2.7959, "step": 5183 }, { "epoch": 0.14, "learning_rate": 0.0019379976312893375, "loss": 2.6668, "step": 5184 }, { "epoch": 0.14, "learning_rate": 0.0019379674563253643, "loss": 2.6329, "step": 5185 }, { "epoch": 0.14, "learning_rate": 0.0019379372742555168, "loss": 2.4046, "step": 5186 }, { "epoch": 0.14, "learning_rate": 0.0019379070850800246, "loss": 2.8412, "step": 5187 }, { "epoch": 0.14, "learning_rate": 0.0019378768887991157, "loss": 2.8227, "step": 5188 }, { "epoch": 0.14, "learning_rate": 0.0019378466854130198, "loss": 2.9421, "step": 5189 }, { "epoch": 0.14, "learning_rate": 0.0019378164749219646, "loss": 2.7054, "step": 5190 }, { "epoch": 0.14, "learning_rate": 0.0019377862573261796, "loss": 2.852, "step": 5191 }, { "epoch": 0.14, "learning_rate": 0.0019377560326258934, "loss": 2.5889, "step": 5192 }, { "epoch": 0.14, "learning_rate": 0.0019377258008213352, "loss": 2.7756, "step": 5193 }, { "epoch": 0.14, "learning_rate": 0.0019376955619127341, "loss": 2.516, "step": 5194 }, { "epoch": 0.14, "learning_rate": 0.0019376653159003188, "loss": 2.6334, "step": 5195 }, { "epoch": 0.14, "learning_rate": 0.001937635062784319, "loss": 2.9865, "step": 5196 }, { "epoch": 0.14, "learning_rate": 0.0019376048025649636, "loss": 2.7537, "step": 5197 }, { "epoch": 0.14, "learning_rate": 0.0019375745352424817, "loss": 2.5768, "step": 5198 }, { "epoch": 0.14, "learning_rate": 0.0019375442608171028, "loss": 2.3493, "step": 5199 }, { "epoch": 0.14, "learning_rate": 0.0019375139792890562, "loss": 2.6842, "step": 5200 }, { "epoch": 0.14, "learning_rate": 0.0019374836906585714, "loss": 2.9229, "step": 5201 }, { "epoch": 0.14, "learning_rate": 0.0019374533949258774, "loss": 2.6665, "step": 5202 }, { "epoch": 0.14, "learning_rate": 0.0019374230920912044, "loss": 2.8748, "step": 5203 }, { "epoch": 0.14, "learning_rate": 0.0019373927821547817, "loss": 2.7783, "step": 5204 }, { "epoch": 0.14, "learning_rate": 0.0019373624651168387, "loss": 2.7197, "step": 5205 }, { "epoch": 0.14, "learning_rate": 0.0019373321409776052, "loss": 2.9278, "step": 5206 }, { "epoch": 0.14, "learning_rate": 0.0019373018097373113, "loss": 2.5765, "step": 5207 }, { "epoch": 0.14, "learning_rate": 0.0019372714713961861, "loss": 3.0844, "step": 5208 }, { "epoch": 0.14, "learning_rate": 0.00193724112595446, "loss": 2.746, "step": 5209 }, { "epoch": 0.14, "learning_rate": 0.0019372107734123628, "loss": 2.8396, "step": 5210 }, { "epoch": 0.14, "learning_rate": 0.001937180413770124, "loss": 2.7309, "step": 5211 }, { "epoch": 0.14, "learning_rate": 0.0019371500470279743, "loss": 2.7496, "step": 5212 }, { "epoch": 0.14, "learning_rate": 0.001937119673186143, "loss": 2.8202, "step": 5213 }, { "epoch": 0.14, "learning_rate": 0.001937089292244861, "loss": 2.8954, "step": 5214 }, { "epoch": 0.14, "learning_rate": 0.0019370589042043578, "loss": 2.8177, "step": 5215 }, { "epoch": 0.14, "learning_rate": 0.0019370285090648638, "loss": 2.7549, "step": 5216 }, { "epoch": 0.14, "learning_rate": 0.0019369981068266097, "loss": 2.8902, "step": 5217 }, { "epoch": 0.14, "learning_rate": 0.0019369676974898252, "loss": 2.5817, "step": 5218 }, { "epoch": 0.14, "learning_rate": 0.001936937281054741, "loss": 2.8489, "step": 5219 }, { "epoch": 0.14, "learning_rate": 0.0019369068575215876, "loss": 2.4834, "step": 5220 }, { "epoch": 0.14, "learning_rate": 0.0019368764268905953, "loss": 3.3111, "step": 5221 }, { "epoch": 0.14, "learning_rate": 0.0019368459891619943, "loss": 2.7515, "step": 5222 }, { "epoch": 0.14, "learning_rate": 0.001936815544336016, "loss": 2.5219, "step": 5223 }, { "epoch": 0.14, "learning_rate": 0.0019367850924128902, "loss": 2.7165, "step": 5224 }, { "epoch": 0.14, "learning_rate": 0.0019367546333928485, "loss": 2.5115, "step": 5225 }, { "epoch": 0.14, "learning_rate": 0.0019367241672761208, "loss": 2.552, "step": 5226 }, { "epoch": 0.14, "learning_rate": 0.0019366936940629388, "loss": 2.6496, "step": 5227 }, { "epoch": 0.14, "learning_rate": 0.0019366632137535326, "loss": 2.7402, "step": 5228 }, { "epoch": 0.14, "learning_rate": 0.001936632726348133, "loss": 2.6081, "step": 5229 }, { "epoch": 0.14, "learning_rate": 0.0019366022318469717, "loss": 2.5458, "step": 5230 }, { "epoch": 0.14, "learning_rate": 0.0019365717302502793, "loss": 2.3808, "step": 5231 }, { "epoch": 0.14, "learning_rate": 0.0019365412215582864, "loss": 2.333, "step": 5232 }, { "epoch": 0.14, "learning_rate": 0.0019365107057712253, "loss": 2.8498, "step": 5233 }, { "epoch": 0.14, "learning_rate": 0.0019364801828893263, "loss": 2.5092, "step": 5234 }, { "epoch": 0.14, "learning_rate": 0.0019364496529128208, "loss": 2.8393, "step": 5235 }, { "epoch": 0.14, "learning_rate": 0.0019364191158419404, "loss": 2.3213, "step": 5236 }, { "epoch": 0.14, "learning_rate": 0.001936388571676916, "loss": 2.4816, "step": 5237 }, { "epoch": 0.14, "learning_rate": 0.0019363580204179792, "loss": 2.7343, "step": 5238 }, { "epoch": 0.14, "learning_rate": 0.0019363274620653613, "loss": 2.7352, "step": 5239 }, { "epoch": 0.14, "learning_rate": 0.001936296896619294, "loss": 2.9848, "step": 5240 }, { "epoch": 0.14, "learning_rate": 0.001936266324080009, "loss": 2.5997, "step": 5241 }, { "epoch": 0.14, "learning_rate": 0.0019362357444477377, "loss": 2.871, "step": 5242 }, { "epoch": 0.14, "learning_rate": 0.0019362051577227115, "loss": 2.4924, "step": 5243 }, { "epoch": 0.14, "learning_rate": 0.0019361745639051627, "loss": 2.906, "step": 5244 }, { "epoch": 0.14, "learning_rate": 0.0019361439629953226, "loss": 2.8166, "step": 5245 }, { "epoch": 0.14, "learning_rate": 0.0019361133549934233, "loss": 2.7533, "step": 5246 }, { "epoch": 0.14, "learning_rate": 0.0019360827398996966, "loss": 2.9509, "step": 5247 }, { "epoch": 0.14, "learning_rate": 0.0019360521177143744, "loss": 2.6745, "step": 5248 }, { "epoch": 0.14, "learning_rate": 0.0019360214884376887, "loss": 2.5653, "step": 5249 }, { "epoch": 0.14, "learning_rate": 0.0019359908520698715, "loss": 2.3884, "step": 5250 }, { "epoch": 0.14, "learning_rate": 0.001935960208611155, "loss": 2.1794, "step": 5251 }, { "epoch": 0.14, "learning_rate": 0.0019359295580617714, "loss": 2.6201, "step": 5252 }, { "epoch": 0.14, "learning_rate": 0.0019358989004219524, "loss": 2.8426, "step": 5253 }, { "epoch": 0.14, "learning_rate": 0.0019358682356919311, "loss": 2.6138, "step": 5254 }, { "epoch": 0.14, "learning_rate": 0.0019358375638719393, "loss": 2.41, "step": 5255 }, { "epoch": 0.14, "learning_rate": 0.0019358068849622092, "loss": 2.847, "step": 5256 }, { "epoch": 0.14, "learning_rate": 0.0019357761989629734, "loss": 2.7354, "step": 5257 }, { "epoch": 0.14, "learning_rate": 0.0019357455058744647, "loss": 2.4463, "step": 5258 }, { "epoch": 0.14, "learning_rate": 0.001935714805696915, "loss": 3.2057, "step": 5259 }, { "epoch": 0.14, "learning_rate": 0.0019356840984305578, "loss": 2.5274, "step": 5260 }, { "epoch": 0.14, "learning_rate": 0.0019356533840756245, "loss": 2.5544, "step": 5261 }, { "epoch": 0.14, "learning_rate": 0.001935622662632349, "loss": 2.8535, "step": 5262 }, { "epoch": 0.14, "learning_rate": 0.0019355919341009632, "loss": 2.3465, "step": 5263 }, { "epoch": 0.14, "learning_rate": 0.0019355611984817002, "loss": 2.3841, "step": 5264 }, { "epoch": 0.14, "learning_rate": 0.0019355304557747927, "loss": 2.3784, "step": 5265 }, { "epoch": 0.14, "learning_rate": 0.0019354997059804738, "loss": 2.8258, "step": 5266 }, { "epoch": 0.14, "learning_rate": 0.0019354689490989766, "loss": 2.6453, "step": 5267 }, { "epoch": 0.14, "learning_rate": 0.0019354381851305336, "loss": 3.1698, "step": 5268 }, { "epoch": 0.14, "learning_rate": 0.001935407414075378, "loss": 2.5105, "step": 5269 }, { "epoch": 0.14, "learning_rate": 0.0019353766359337438, "loss": 2.4979, "step": 5270 }, { "epoch": 0.14, "learning_rate": 0.0019353458507058627, "loss": 2.8189, "step": 5271 }, { "epoch": 0.14, "learning_rate": 0.001935315058391969, "loss": 3.0868, "step": 5272 }, { "epoch": 0.14, "learning_rate": 0.0019352842589922955, "loss": 2.6988, "step": 5273 }, { "epoch": 0.14, "learning_rate": 0.0019352534525070757, "loss": 2.4412, "step": 5274 }, { "epoch": 0.14, "learning_rate": 0.0019352226389365431, "loss": 2.5429, "step": 5275 }, { "epoch": 0.14, "learning_rate": 0.0019351918182809308, "loss": 3.0608, "step": 5276 }, { "epoch": 0.14, "learning_rate": 0.0019351609905404726, "loss": 2.5783, "step": 5277 }, { "epoch": 0.14, "learning_rate": 0.0019351301557154017, "loss": 2.846, "step": 5278 }, { "epoch": 0.14, "learning_rate": 0.001935099313805952, "loss": 2.6105, "step": 5279 }, { "epoch": 0.14, "learning_rate": 0.0019350684648123573, "loss": 2.8542, "step": 5280 }, { "epoch": 0.14, "learning_rate": 0.0019350376087348508, "loss": 2.594, "step": 5281 }, { "epoch": 0.14, "learning_rate": 0.0019350067455736668, "loss": 2.7825, "step": 5282 }, { "epoch": 0.14, "learning_rate": 0.0019349758753290389, "loss": 2.7895, "step": 5283 }, { "epoch": 0.14, "learning_rate": 0.0019349449980012009, "loss": 2.8526, "step": 5284 }, { "epoch": 0.14, "learning_rate": 0.0019349141135903865, "loss": 3.0643, "step": 5285 }, { "epoch": 0.14, "learning_rate": 0.00193488322209683, "loss": 2.9194, "step": 5286 }, { "epoch": 0.14, "learning_rate": 0.0019348523235207657, "loss": 2.6422, "step": 5287 }, { "epoch": 0.14, "learning_rate": 0.001934821417862427, "loss": 2.649, "step": 5288 }, { "epoch": 0.14, "learning_rate": 0.0019347905051220482, "loss": 2.7522, "step": 5289 }, { "epoch": 0.14, "learning_rate": 0.0019347595852998638, "loss": 2.518, "step": 5290 }, { "epoch": 0.14, "learning_rate": 0.0019347286583961082, "loss": 2.6502, "step": 5291 }, { "epoch": 0.14, "learning_rate": 0.001934697724411015, "loss": 2.8767, "step": 5292 }, { "epoch": 0.14, "learning_rate": 0.0019346667833448192, "loss": 2.6531, "step": 5293 }, { "epoch": 0.14, "learning_rate": 0.0019346358351977548, "loss": 3.2936, "step": 5294 }, { "epoch": 0.14, "learning_rate": 0.0019346048799700566, "loss": 2.5371, "step": 5295 }, { "epoch": 0.14, "learning_rate": 0.0019345739176619588, "loss": 2.3939, "step": 5296 }, { "epoch": 0.14, "learning_rate": 0.001934542948273696, "loss": 3.0644, "step": 5297 }, { "epoch": 0.14, "learning_rate": 0.0019345119718055031, "loss": 2.9559, "step": 5298 }, { "epoch": 0.14, "learning_rate": 0.0019344809882576146, "loss": 2.7447, "step": 5299 }, { "epoch": 0.14, "learning_rate": 0.001934449997630265, "loss": 2.5522, "step": 5300 }, { "epoch": 0.14, "learning_rate": 0.0019344189999236892, "loss": 2.52, "step": 5301 }, { "epoch": 0.14, "learning_rate": 0.0019343879951381222, "loss": 2.223, "step": 5302 }, { "epoch": 0.14, "learning_rate": 0.0019343569832737991, "loss": 2.5241, "step": 5303 }, { "epoch": 0.14, "learning_rate": 0.0019343259643309543, "loss": 2.7366, "step": 5304 }, { "epoch": 0.14, "learning_rate": 0.0019342949383098229, "loss": 2.3458, "step": 5305 }, { "epoch": 0.14, "learning_rate": 0.0019342639052106403, "loss": 3.2006, "step": 5306 }, { "epoch": 0.14, "learning_rate": 0.0019342328650336414, "loss": 2.2586, "step": 5307 }, { "epoch": 0.14, "learning_rate": 0.0019342018177790612, "loss": 2.6595, "step": 5308 }, { "epoch": 0.14, "learning_rate": 0.0019341707634471352, "loss": 3.1822, "step": 5309 }, { "epoch": 0.14, "learning_rate": 0.0019341397020380983, "loss": 2.7344, "step": 5310 }, { "epoch": 0.14, "learning_rate": 0.0019341086335521863, "loss": 2.7807, "step": 5311 }, { "epoch": 0.14, "learning_rate": 0.0019340775579896339, "loss": 2.0981, "step": 5312 }, { "epoch": 0.14, "learning_rate": 0.0019340464753506775, "loss": 3.0164, "step": 5313 }, { "epoch": 0.14, "learning_rate": 0.0019340153856355516, "loss": 2.6791, "step": 5314 }, { "epoch": 0.14, "learning_rate": 0.001933984288844492, "loss": 3.0792, "step": 5315 }, { "epoch": 0.14, "learning_rate": 0.0019339531849777347, "loss": 3.1251, "step": 5316 }, { "epoch": 0.14, "learning_rate": 0.0019339220740355147, "loss": 2.8488, "step": 5317 }, { "epoch": 0.14, "learning_rate": 0.0019338909560180685, "loss": 3.0876, "step": 5318 }, { "epoch": 0.14, "learning_rate": 0.001933859830925631, "loss": 2.6169, "step": 5319 }, { "epoch": 0.14, "learning_rate": 0.0019338286987584385, "loss": 2.6438, "step": 5320 }, { "epoch": 0.14, "learning_rate": 0.001933797559516727, "loss": 2.9828, "step": 5321 }, { "epoch": 0.14, "learning_rate": 0.0019337664132007318, "loss": 2.6136, "step": 5322 }, { "epoch": 0.14, "learning_rate": 0.0019337352598106892, "loss": 2.7787, "step": 5323 }, { "epoch": 0.14, "learning_rate": 0.0019337040993468353, "loss": 2.6276, "step": 5324 }, { "epoch": 0.14, "learning_rate": 0.001933672931809406, "loss": 2.5673, "step": 5325 }, { "epoch": 0.14, "learning_rate": 0.0019336417571986378, "loss": 2.4232, "step": 5326 }, { "epoch": 0.14, "learning_rate": 0.0019336105755147664, "loss": 2.4612, "step": 5327 }, { "epoch": 0.14, "learning_rate": 0.0019335793867580279, "loss": 2.931, "step": 5328 }, { "epoch": 0.14, "learning_rate": 0.0019335481909286592, "loss": 2.4811, "step": 5329 }, { "epoch": 0.14, "learning_rate": 0.0019335169880268961, "loss": 2.6317, "step": 5330 }, { "epoch": 0.14, "learning_rate": 0.0019334857780529753, "loss": 2.4959, "step": 5331 }, { "epoch": 0.14, "learning_rate": 0.0019334545610071331, "loss": 2.9309, "step": 5332 }, { "epoch": 0.14, "learning_rate": 0.0019334233368896061, "loss": 2.9102, "step": 5333 }, { "epoch": 0.14, "learning_rate": 0.001933392105700631, "loss": 2.7277, "step": 5334 }, { "epoch": 0.14, "learning_rate": 0.001933360867440444, "loss": 2.6946, "step": 5335 }, { "epoch": 0.14, "learning_rate": 0.0019333296221092815, "loss": 2.6534, "step": 5336 }, { "epoch": 0.14, "learning_rate": 0.0019332983697073812, "loss": 2.7936, "step": 5337 }, { "epoch": 0.14, "learning_rate": 0.0019332671102349791, "loss": 2.7363, "step": 5338 }, { "epoch": 0.14, "learning_rate": 0.0019332358436923124, "loss": 2.6718, "step": 5339 }, { "epoch": 0.14, "learning_rate": 0.0019332045700796174, "loss": 2.7993, "step": 5340 }, { "epoch": 0.14, "learning_rate": 0.0019331732893971317, "loss": 2.9974, "step": 5341 }, { "epoch": 0.14, "learning_rate": 0.001933142001645092, "loss": 2.7281, "step": 5342 }, { "epoch": 0.14, "learning_rate": 0.0019331107068237352, "loss": 2.9864, "step": 5343 }, { "epoch": 0.14, "learning_rate": 0.0019330794049332988, "loss": 2.6905, "step": 5344 }, { "epoch": 0.14, "learning_rate": 0.0019330480959740192, "loss": 2.6382, "step": 5345 }, { "epoch": 0.14, "learning_rate": 0.0019330167799461344, "loss": 3.3043, "step": 5346 }, { "epoch": 0.14, "learning_rate": 0.0019329854568498812, "loss": 2.7089, "step": 5347 }, { "epoch": 0.14, "learning_rate": 0.001932954126685497, "loss": 2.6076, "step": 5348 }, { "epoch": 0.14, "learning_rate": 0.001932922789453219, "loss": 2.58, "step": 5349 }, { "epoch": 0.14, "learning_rate": 0.0019328914451532848, "loss": 3.1534, "step": 5350 }, { "epoch": 0.14, "learning_rate": 0.0019328600937859317, "loss": 2.5627, "step": 5351 }, { "epoch": 0.14, "learning_rate": 0.0019328287353513975, "loss": 2.7962, "step": 5352 }, { "epoch": 0.14, "learning_rate": 0.0019327973698499196, "loss": 3.017, "step": 5353 }, { "epoch": 0.14, "learning_rate": 0.0019327659972817356, "loss": 3.0079, "step": 5354 }, { "epoch": 0.14, "learning_rate": 0.001932734617647083, "loss": 2.4989, "step": 5355 }, { "epoch": 0.14, "learning_rate": 0.0019327032309461997, "loss": 2.639, "step": 5356 }, { "epoch": 0.14, "learning_rate": 0.0019326718371793236, "loss": 2.2273, "step": 5357 }, { "epoch": 0.14, "learning_rate": 0.0019326404363466923, "loss": 2.5606, "step": 5358 }, { "epoch": 0.14, "learning_rate": 0.0019326090284485437, "loss": 2.5143, "step": 5359 }, { "epoch": 0.14, "learning_rate": 0.0019325776134851162, "loss": 2.6788, "step": 5360 }, { "epoch": 0.14, "learning_rate": 0.001932546191456647, "loss": 2.8648, "step": 5361 }, { "epoch": 0.14, "learning_rate": 0.0019325147623633749, "loss": 2.9273, "step": 5362 }, { "epoch": 0.14, "learning_rate": 0.0019324833262055377, "loss": 2.6138, "step": 5363 }, { "epoch": 0.14, "learning_rate": 0.0019324518829833732, "loss": 2.8647, "step": 5364 }, { "epoch": 0.14, "learning_rate": 0.0019324204326971201, "loss": 3.1288, "step": 5365 }, { "epoch": 0.14, "learning_rate": 0.0019323889753470164, "loss": 2.8557, "step": 5366 }, { "epoch": 0.14, "learning_rate": 0.0019323575109333007, "loss": 2.4565, "step": 5367 }, { "epoch": 0.14, "learning_rate": 0.0019323260394562114, "loss": 2.3128, "step": 5368 }, { "epoch": 0.14, "learning_rate": 0.0019322945609159864, "loss": 2.7126, "step": 5369 }, { "epoch": 0.14, "learning_rate": 0.0019322630753128645, "loss": 2.8961, "step": 5370 }, { "epoch": 0.14, "learning_rate": 0.0019322315826470842, "loss": 2.1362, "step": 5371 }, { "epoch": 0.14, "learning_rate": 0.0019322000829188842, "loss": 2.4523, "step": 5372 }, { "epoch": 0.14, "learning_rate": 0.0019321685761285031, "loss": 2.871, "step": 5373 }, { "epoch": 0.14, "learning_rate": 0.0019321370622761794, "loss": 2.6512, "step": 5374 }, { "epoch": 0.14, "learning_rate": 0.0019321055413621519, "loss": 2.6917, "step": 5375 }, { "epoch": 0.14, "learning_rate": 0.0019320740133866594, "loss": 2.4332, "step": 5376 }, { "epoch": 0.14, "learning_rate": 0.0019320424783499412, "loss": 2.9923, "step": 5377 }, { "epoch": 0.14, "learning_rate": 0.0019320109362522353, "loss": 2.9381, "step": 5378 }, { "epoch": 0.14, "learning_rate": 0.0019319793870937816, "loss": 2.4168, "step": 5379 }, { "epoch": 0.14, "learning_rate": 0.0019319478308748184, "loss": 2.6897, "step": 5380 }, { "epoch": 0.14, "learning_rate": 0.0019319162675955851, "loss": 2.5844, "step": 5381 }, { "epoch": 0.14, "learning_rate": 0.0019318846972563209, "loss": 2.5986, "step": 5382 }, { "epoch": 0.14, "learning_rate": 0.0019318531198572648, "loss": 2.8717, "step": 5383 }, { "epoch": 0.14, "learning_rate": 0.001931821535398656, "loss": 2.6533, "step": 5384 }, { "epoch": 0.14, "learning_rate": 0.0019317899438807337, "loss": 2.898, "step": 5385 }, { "epoch": 0.14, "learning_rate": 0.0019317583453037379, "loss": 2.7049, "step": 5386 }, { "epoch": 0.14, "learning_rate": 0.001931726739667907, "loss": 2.6132, "step": 5387 }, { "epoch": 0.14, "learning_rate": 0.001931695126973481, "loss": 2.832, "step": 5388 }, { "epoch": 0.14, "learning_rate": 0.0019316635072206994, "loss": 2.6614, "step": 5389 }, { "epoch": 0.14, "learning_rate": 0.0019316318804098013, "loss": 2.933, "step": 5390 }, { "epoch": 0.14, "learning_rate": 0.001931600246541027, "loss": 2.8894, "step": 5391 }, { "epoch": 0.14, "learning_rate": 0.0019315686056146158, "loss": 2.523, "step": 5392 }, { "epoch": 0.14, "learning_rate": 0.001931536957630807, "loss": 2.6655, "step": 5393 }, { "epoch": 0.14, "learning_rate": 0.0019315053025898412, "loss": 2.7894, "step": 5394 }, { "epoch": 0.14, "learning_rate": 0.0019314736404919576, "loss": 2.6166, "step": 5395 }, { "epoch": 0.15, "learning_rate": 0.0019314419713373963, "loss": 2.6241, "step": 5396 }, { "epoch": 0.15, "learning_rate": 0.0019314102951263968, "loss": 2.8247, "step": 5397 }, { "epoch": 0.15, "learning_rate": 0.0019313786118592, "loss": 3.1033, "step": 5398 }, { "epoch": 0.15, "learning_rate": 0.0019313469215360448, "loss": 2.8921, "step": 5399 }, { "epoch": 0.15, "learning_rate": 0.001931315224157172, "loss": 2.3809, "step": 5400 }, { "epoch": 0.15, "learning_rate": 0.0019312835197228219, "loss": 2.3474, "step": 5401 }, { "epoch": 0.15, "learning_rate": 0.0019312518082332337, "loss": 3.0539, "step": 5402 }, { "epoch": 0.15, "learning_rate": 0.0019312200896886486, "loss": 2.8147, "step": 5403 }, { "epoch": 0.15, "learning_rate": 0.0019311883640893068, "loss": 2.9021, "step": 5404 }, { "epoch": 0.15, "learning_rate": 0.0019311566314354485, "loss": 2.6686, "step": 5405 }, { "epoch": 0.15, "learning_rate": 0.001931124891727314, "loss": 2.4916, "step": 5406 }, { "epoch": 0.15, "learning_rate": 0.0019310931449651432, "loss": 2.8351, "step": 5407 }, { "epoch": 0.15, "learning_rate": 0.0019310613911491777, "loss": 2.4581, "step": 5408 }, { "epoch": 0.15, "learning_rate": 0.0019310296302796576, "loss": 2.6598, "step": 5409 }, { "epoch": 0.15, "learning_rate": 0.0019309978623568234, "loss": 2.7086, "step": 5410 }, { "epoch": 0.15, "learning_rate": 0.0019309660873809155, "loss": 2.9263, "step": 5411 }, { "epoch": 0.15, "learning_rate": 0.0019309343053521752, "loss": 2.3602, "step": 5412 }, { "epoch": 0.15, "learning_rate": 0.0019309025162708433, "loss": 2.7887, "step": 5413 }, { "epoch": 0.15, "learning_rate": 0.0019308707201371603, "loss": 2.7647, "step": 5414 }, { "epoch": 0.15, "learning_rate": 0.0019308389169513669, "loss": 2.7882, "step": 5415 }, { "epoch": 0.15, "learning_rate": 0.0019308071067137044, "loss": 2.5755, "step": 5416 }, { "epoch": 0.15, "learning_rate": 0.0019307752894244135, "loss": 2.4269, "step": 5417 }, { "epoch": 0.15, "learning_rate": 0.0019307434650837356, "loss": 2.5263, "step": 5418 }, { "epoch": 0.15, "learning_rate": 0.0019307116336919118, "loss": 2.656, "step": 5419 }, { "epoch": 0.15, "learning_rate": 0.0019306797952491825, "loss": 2.4933, "step": 5420 }, { "epoch": 0.15, "learning_rate": 0.00193064794975579, "loss": 2.634, "step": 5421 }, { "epoch": 0.15, "learning_rate": 0.0019306160972119748, "loss": 2.9715, "step": 5422 }, { "epoch": 0.15, "learning_rate": 0.0019305842376179786, "loss": 2.7547, "step": 5423 }, { "epoch": 0.15, "learning_rate": 0.0019305523709740422, "loss": 3.1131, "step": 5424 }, { "epoch": 0.15, "learning_rate": 0.0019305204972804078, "loss": 2.5311, "step": 5425 }, { "epoch": 0.15, "learning_rate": 0.0019304886165373164, "loss": 2.727, "step": 5426 }, { "epoch": 0.15, "learning_rate": 0.0019304567287450095, "loss": 2.5267, "step": 5427 }, { "epoch": 0.15, "learning_rate": 0.0019304248339037287, "loss": 2.4485, "step": 5428 }, { "epoch": 0.15, "learning_rate": 0.001930392932013716, "loss": 2.7304, "step": 5429 }, { "epoch": 0.15, "learning_rate": 0.0019303610230752125, "loss": 2.8675, "step": 5430 }, { "epoch": 0.15, "learning_rate": 0.0019303291070884602, "loss": 2.4571, "step": 5431 }, { "epoch": 0.15, "learning_rate": 0.0019302971840537012, "loss": 2.3092, "step": 5432 }, { "epoch": 0.15, "learning_rate": 0.0019302652539711768, "loss": 2.916, "step": 5433 }, { "epoch": 0.15, "learning_rate": 0.0019302333168411292, "loss": 3.2149, "step": 5434 }, { "epoch": 0.15, "learning_rate": 0.0019302013726638, "loss": 2.5119, "step": 5435 }, { "epoch": 0.15, "learning_rate": 0.001930169421439432, "loss": 2.8584, "step": 5436 }, { "epoch": 0.15, "learning_rate": 0.0019301374631682667, "loss": 2.6686, "step": 5437 }, { "epoch": 0.15, "learning_rate": 0.001930105497850546, "loss": 3.1253, "step": 5438 }, { "epoch": 0.15, "learning_rate": 0.0019300735254865126, "loss": 2.9224, "step": 5439 }, { "epoch": 0.15, "learning_rate": 0.0019300415460764082, "loss": 2.8702, "step": 5440 }, { "epoch": 0.15, "learning_rate": 0.0019300095596204755, "loss": 2.5268, "step": 5441 }, { "epoch": 0.15, "learning_rate": 0.0019299775661189567, "loss": 2.9792, "step": 5442 }, { "epoch": 0.15, "learning_rate": 0.0019299455655720941, "loss": 2.6769, "step": 5443 }, { "epoch": 0.15, "learning_rate": 0.00192991355798013, "loss": 3.0468, "step": 5444 }, { "epoch": 0.15, "learning_rate": 0.0019298815433433072, "loss": 3.3649, "step": 5445 }, { "epoch": 0.15, "learning_rate": 0.001929849521661868, "loss": 2.5153, "step": 5446 }, { "epoch": 0.15, "learning_rate": 0.001929817492936055, "loss": 2.7431, "step": 5447 }, { "epoch": 0.15, "learning_rate": 0.001929785457166111, "loss": 2.4688, "step": 5448 }, { "epoch": 0.15, "learning_rate": 0.0019297534143522786, "loss": 2.8406, "step": 5449 }, { "epoch": 0.15, "learning_rate": 0.0019297213644948004, "loss": 2.4421, "step": 5450 }, { "epoch": 0.15, "learning_rate": 0.0019296893075939198, "loss": 2.6155, "step": 5451 }, { "epoch": 0.15, "learning_rate": 0.0019296572436498787, "loss": 2.6292, "step": 5452 }, { "epoch": 0.15, "learning_rate": 0.0019296251726629208, "loss": 2.7783, "step": 5453 }, { "epoch": 0.15, "learning_rate": 0.001929593094633289, "loss": 2.8736, "step": 5454 }, { "epoch": 0.15, "learning_rate": 0.0019295610095612257, "loss": 2.5678, "step": 5455 }, { "epoch": 0.15, "learning_rate": 0.0019295289174469743, "loss": 2.6707, "step": 5456 }, { "epoch": 0.15, "learning_rate": 0.0019294968182907784, "loss": 2.6084, "step": 5457 }, { "epoch": 0.15, "learning_rate": 0.0019294647120928806, "loss": 2.6835, "step": 5458 }, { "epoch": 0.15, "learning_rate": 0.0019294325988535243, "loss": 2.4867, "step": 5459 }, { "epoch": 0.15, "learning_rate": 0.001929400478572953, "loss": 2.6792, "step": 5460 }, { "epoch": 0.15, "learning_rate": 0.0019293683512514096, "loss": 2.5035, "step": 5461 }, { "epoch": 0.15, "learning_rate": 0.0019293362168891378, "loss": 2.4941, "step": 5462 }, { "epoch": 0.15, "learning_rate": 0.0019293040754863808, "loss": 2.9448, "step": 5463 }, { "epoch": 0.15, "learning_rate": 0.0019292719270433826, "loss": 2.373, "step": 5464 }, { "epoch": 0.15, "learning_rate": 0.0019292397715603862, "loss": 2.4376, "step": 5465 }, { "epoch": 0.15, "learning_rate": 0.0019292076090376353, "loss": 2.4801, "step": 5466 }, { "epoch": 0.15, "learning_rate": 0.0019291754394753743, "loss": 2.6175, "step": 5467 }, { "epoch": 0.15, "learning_rate": 0.0019291432628738457, "loss": 2.9466, "step": 5468 }, { "epoch": 0.15, "learning_rate": 0.001929111079233294, "loss": 2.5951, "step": 5469 }, { "epoch": 0.15, "learning_rate": 0.001929078888553963, "loss": 2.3624, "step": 5470 }, { "epoch": 0.15, "learning_rate": 0.0019290466908360962, "loss": 2.9657, "step": 5471 }, { "epoch": 0.15, "learning_rate": 0.001929014486079938, "loss": 2.957, "step": 5472 }, { "epoch": 0.15, "learning_rate": 0.001928982274285732, "loss": 2.2962, "step": 5473 }, { "epoch": 0.15, "learning_rate": 0.0019289500554537226, "loss": 2.849, "step": 5474 }, { "epoch": 0.15, "learning_rate": 0.0019289178295841532, "loss": 2.7408, "step": 5475 }, { "epoch": 0.15, "learning_rate": 0.0019288855966772688, "loss": 2.5604, "step": 5476 }, { "epoch": 0.15, "learning_rate": 0.001928853356733313, "loss": 3.3106, "step": 5477 }, { "epoch": 0.15, "learning_rate": 0.0019288211097525302, "loss": 2.3782, "step": 5478 }, { "epoch": 0.15, "learning_rate": 0.0019287888557351649, "loss": 2.7815, "step": 5479 }, { "epoch": 0.15, "learning_rate": 0.0019287565946814612, "loss": 2.646, "step": 5480 }, { "epoch": 0.15, "learning_rate": 0.0019287243265916634, "loss": 2.6107, "step": 5481 }, { "epoch": 0.15, "learning_rate": 0.0019286920514660166, "loss": 2.4996, "step": 5482 }, { "epoch": 0.15, "learning_rate": 0.0019286597693047645, "loss": 2.445, "step": 5483 }, { "epoch": 0.15, "learning_rate": 0.001928627480108152, "loss": 2.6711, "step": 5484 }, { "epoch": 0.15, "learning_rate": 0.001928595183876424, "loss": 2.9223, "step": 5485 }, { "epoch": 0.15, "learning_rate": 0.0019285628806098246, "loss": 2.5292, "step": 5486 }, { "epoch": 0.15, "learning_rate": 0.0019285305703085989, "loss": 2.7522, "step": 5487 }, { "epoch": 0.15, "learning_rate": 0.0019284982529729918, "loss": 2.6058, "step": 5488 }, { "epoch": 0.15, "learning_rate": 0.0019284659286032478, "loss": 2.5135, "step": 5489 }, { "epoch": 0.15, "learning_rate": 0.001928433597199612, "loss": 2.6723, "step": 5490 }, { "epoch": 0.15, "learning_rate": 0.0019284012587623292, "loss": 2.892, "step": 5491 }, { "epoch": 0.15, "learning_rate": 0.0019283689132916445, "loss": 2.9991, "step": 5492 }, { "epoch": 0.15, "learning_rate": 0.0019283365607878028, "loss": 3.0492, "step": 5493 }, { "epoch": 0.15, "learning_rate": 0.0019283042012510493, "loss": 2.8331, "step": 5494 }, { "epoch": 0.15, "learning_rate": 0.001928271834681629, "loss": 2.2704, "step": 5495 }, { "epoch": 0.15, "learning_rate": 0.0019282394610797874, "loss": 2.8312, "step": 5496 }, { "epoch": 0.15, "learning_rate": 0.0019282070804457695, "loss": 2.7177, "step": 5497 }, { "epoch": 0.15, "learning_rate": 0.0019281746927798209, "loss": 2.5081, "step": 5498 }, { "epoch": 0.15, "learning_rate": 0.0019281422980821868, "loss": 2.624, "step": 5499 }, { "epoch": 0.15, "learning_rate": 0.0019281098963531123, "loss": 2.5227, "step": 5500 }, { "epoch": 0.15, "learning_rate": 0.0019280774875928433, "loss": 2.6149, "step": 5501 }, { "epoch": 0.15, "learning_rate": 0.0019280450718016252, "loss": 2.5527, "step": 5502 }, { "epoch": 0.15, "learning_rate": 0.0019280126489797035, "loss": 2.7264, "step": 5503 }, { "epoch": 0.15, "learning_rate": 0.0019279802191273239, "loss": 2.7223, "step": 5504 }, { "epoch": 0.15, "learning_rate": 0.0019279477822447323, "loss": 2.7613, "step": 5505 }, { "epoch": 0.15, "learning_rate": 0.001927915338332174, "loss": 2.3806, "step": 5506 }, { "epoch": 0.15, "learning_rate": 0.0019278828873898948, "loss": 2.3183, "step": 5507 }, { "epoch": 0.15, "learning_rate": 0.0019278504294181409, "loss": 2.613, "step": 5508 }, { "epoch": 0.15, "learning_rate": 0.001927817964417158, "loss": 2.9687, "step": 5509 }, { "epoch": 0.15, "learning_rate": 0.001927785492387192, "loss": 2.8125, "step": 5510 }, { "epoch": 0.15, "learning_rate": 0.0019277530133284893, "loss": 2.9141, "step": 5511 }, { "epoch": 0.15, "learning_rate": 0.0019277205272412955, "loss": 2.8121, "step": 5512 }, { "epoch": 0.15, "learning_rate": 0.0019276880341258568, "loss": 2.6716, "step": 5513 }, { "epoch": 0.15, "learning_rate": 0.0019276555339824194, "loss": 2.8823, "step": 5514 }, { "epoch": 0.15, "learning_rate": 0.0019276230268112293, "loss": 2.8799, "step": 5515 }, { "epoch": 0.15, "learning_rate": 0.0019275905126125332, "loss": 2.9512, "step": 5516 }, { "epoch": 0.15, "learning_rate": 0.0019275579913865775, "loss": 2.5708, "step": 5517 }, { "epoch": 0.15, "learning_rate": 0.0019275254631336079, "loss": 2.6503, "step": 5518 }, { "epoch": 0.15, "learning_rate": 0.0019274929278538713, "loss": 2.7052, "step": 5519 }, { "epoch": 0.15, "learning_rate": 0.0019274603855476142, "loss": 2.4272, "step": 5520 }, { "epoch": 0.15, "learning_rate": 0.001927427836215083, "loss": 2.6208, "step": 5521 }, { "epoch": 0.15, "learning_rate": 0.0019273952798565244, "loss": 2.8823, "step": 5522 }, { "epoch": 0.15, "learning_rate": 0.0019273627164721847, "loss": 2.6114, "step": 5523 }, { "epoch": 0.15, "learning_rate": 0.0019273301460623112, "loss": 2.3788, "step": 5524 }, { "epoch": 0.15, "learning_rate": 0.00192729756862715, "loss": 2.4657, "step": 5525 }, { "epoch": 0.15, "learning_rate": 0.0019272649841669484, "loss": 2.8907, "step": 5526 }, { "epoch": 0.15, "learning_rate": 0.0019272323926819528, "loss": 2.7082, "step": 5527 }, { "epoch": 0.15, "learning_rate": 0.0019271997941724104, "loss": 2.7858, "step": 5528 }, { "epoch": 0.15, "learning_rate": 0.0019271671886385683, "loss": 2.5956, "step": 5529 }, { "epoch": 0.15, "learning_rate": 0.0019271345760806735, "loss": 2.303, "step": 5530 }, { "epoch": 0.15, "learning_rate": 0.0019271019564989728, "loss": 2.8951, "step": 5531 }, { "epoch": 0.15, "learning_rate": 0.0019270693298937133, "loss": 2.8492, "step": 5532 }, { "epoch": 0.15, "learning_rate": 0.0019270366962651421, "loss": 2.7171, "step": 5533 }, { "epoch": 0.15, "learning_rate": 0.001927004055613507, "loss": 2.4389, "step": 5534 }, { "epoch": 0.15, "learning_rate": 0.001926971407939055, "loss": 2.4848, "step": 5535 }, { "epoch": 0.15, "learning_rate": 0.001926938753242033, "loss": 2.845, "step": 5536 }, { "epoch": 0.15, "learning_rate": 0.0019269060915226889, "loss": 2.9888, "step": 5537 }, { "epoch": 0.15, "learning_rate": 0.0019268734227812698, "loss": 2.9893, "step": 5538 }, { "epoch": 0.15, "learning_rate": 0.0019268407470180236, "loss": 2.821, "step": 5539 }, { "epoch": 0.15, "learning_rate": 0.0019268080642331972, "loss": 2.7503, "step": 5540 }, { "epoch": 0.15, "learning_rate": 0.001926775374427039, "loss": 2.9184, "step": 5541 }, { "epoch": 0.15, "learning_rate": 0.0019267426775997963, "loss": 2.6429, "step": 5542 }, { "epoch": 0.15, "learning_rate": 0.0019267099737517164, "loss": 3.0584, "step": 5543 }, { "epoch": 0.15, "learning_rate": 0.0019266772628830477, "loss": 2.5539, "step": 5544 }, { "epoch": 0.15, "learning_rate": 0.0019266445449940377, "loss": 2.5891, "step": 5545 }, { "epoch": 0.15, "learning_rate": 0.0019266118200849344, "loss": 2.4194, "step": 5546 }, { "epoch": 0.15, "learning_rate": 0.0019265790881559854, "loss": 2.5982, "step": 5547 }, { "epoch": 0.15, "learning_rate": 0.001926546349207439, "loss": 2.532, "step": 5548 }, { "epoch": 0.15, "learning_rate": 0.0019265136032395429, "loss": 2.9334, "step": 5549 }, { "epoch": 0.15, "learning_rate": 0.0019264808502525454, "loss": 2.831, "step": 5550 }, { "epoch": 0.15, "learning_rate": 0.0019264480902466948, "loss": 2.4651, "step": 5551 }, { "epoch": 0.15, "learning_rate": 0.0019264153232222392, "loss": 2.6318, "step": 5552 }, { "epoch": 0.15, "learning_rate": 0.0019263825491794267, "loss": 2.6905, "step": 5553 }, { "epoch": 0.15, "learning_rate": 0.0019263497681185054, "loss": 2.7759, "step": 5554 }, { "epoch": 0.15, "learning_rate": 0.001926316980039724, "loss": 2.9152, "step": 5555 }, { "epoch": 0.15, "learning_rate": 0.0019262841849433307, "loss": 2.6409, "step": 5556 }, { "epoch": 0.15, "learning_rate": 0.0019262513828295742, "loss": 2.5567, "step": 5557 }, { "epoch": 0.15, "learning_rate": 0.0019262185736987029, "loss": 2.878, "step": 5558 }, { "epoch": 0.15, "learning_rate": 0.0019261857575509648, "loss": 2.7832, "step": 5559 }, { "epoch": 0.15, "learning_rate": 0.0019261529343866093, "loss": 2.4483, "step": 5560 }, { "epoch": 0.15, "learning_rate": 0.001926120104205885, "loss": 2.4954, "step": 5561 }, { "epoch": 0.15, "learning_rate": 0.0019260872670090398, "loss": 2.9569, "step": 5562 }, { "epoch": 0.15, "learning_rate": 0.0019260544227963235, "loss": 2.6673, "step": 5563 }, { "epoch": 0.15, "learning_rate": 0.0019260215715679841, "loss": 2.7717, "step": 5564 }, { "epoch": 0.15, "learning_rate": 0.001925988713324271, "loss": 3.008, "step": 5565 }, { "epoch": 0.15, "learning_rate": 0.001925955848065433, "loss": 2.5168, "step": 5566 }, { "epoch": 0.15, "learning_rate": 0.001925922975791719, "loss": 2.5596, "step": 5567 }, { "epoch": 0.15, "learning_rate": 0.0019258900965033782, "loss": 2.6777, "step": 5568 }, { "epoch": 0.15, "learning_rate": 0.0019258572102006594, "loss": 2.6202, "step": 5569 }, { "epoch": 0.15, "learning_rate": 0.0019258243168838122, "loss": 2.5785, "step": 5570 }, { "epoch": 0.15, "learning_rate": 0.001925791416553085, "loss": 3.0167, "step": 5571 }, { "epoch": 0.15, "learning_rate": 0.0019257585092087278, "loss": 2.8556, "step": 5572 }, { "epoch": 0.15, "learning_rate": 0.0019257255948509897, "loss": 2.7451, "step": 5573 }, { "epoch": 0.15, "learning_rate": 0.0019256926734801199, "loss": 2.6336, "step": 5574 }, { "epoch": 0.15, "learning_rate": 0.0019256597450963678, "loss": 2.2927, "step": 5575 }, { "epoch": 0.15, "learning_rate": 0.0019256268096999834, "loss": 2.8815, "step": 5576 }, { "epoch": 0.15, "learning_rate": 0.0019255938672912154, "loss": 2.776, "step": 5577 }, { "epoch": 0.15, "learning_rate": 0.0019255609178703138, "loss": 2.4607, "step": 5578 }, { "epoch": 0.15, "learning_rate": 0.0019255279614375281, "loss": 2.7582, "step": 5579 }, { "epoch": 0.15, "learning_rate": 0.0019254949979931083, "loss": 2.8199, "step": 5580 }, { "epoch": 0.15, "learning_rate": 0.0019254620275373036, "loss": 2.7484, "step": 5581 }, { "epoch": 0.15, "learning_rate": 0.001925429050070364, "loss": 2.8661, "step": 5582 }, { "epoch": 0.15, "learning_rate": 0.0019253960655925397, "loss": 2.9834, "step": 5583 }, { "epoch": 0.15, "learning_rate": 0.0019253630741040797, "loss": 3.1937, "step": 5584 }, { "epoch": 0.15, "learning_rate": 0.001925330075605235, "loss": 2.8013, "step": 5585 }, { "epoch": 0.15, "learning_rate": 0.0019252970700962548, "loss": 2.5923, "step": 5586 }, { "epoch": 0.15, "learning_rate": 0.0019252640575773896, "loss": 2.7423, "step": 5587 }, { "epoch": 0.15, "learning_rate": 0.001925231038048889, "loss": 2.6467, "step": 5588 }, { "epoch": 0.15, "learning_rate": 0.0019251980115110039, "loss": 2.9145, "step": 5589 }, { "epoch": 0.15, "learning_rate": 0.001925164977963984, "loss": 2.4454, "step": 5590 }, { "epoch": 0.15, "learning_rate": 0.0019251319374080796, "loss": 2.4844, "step": 5591 }, { "epoch": 0.15, "learning_rate": 0.001925098889843541, "loss": 2.8451, "step": 5592 }, { "epoch": 0.15, "learning_rate": 0.0019250658352706186, "loss": 2.3915, "step": 5593 }, { "epoch": 0.15, "learning_rate": 0.0019250327736895626, "loss": 2.9637, "step": 5594 }, { "epoch": 0.15, "learning_rate": 0.0019249997051006239, "loss": 2.5864, "step": 5595 }, { "epoch": 0.15, "learning_rate": 0.0019249666295040528, "loss": 2.5318, "step": 5596 }, { "epoch": 0.15, "learning_rate": 0.0019249335469000996, "loss": 2.58, "step": 5597 }, { "epoch": 0.15, "learning_rate": 0.0019249004572890157, "loss": 2.8404, "step": 5598 }, { "epoch": 0.15, "learning_rate": 0.0019248673606710512, "loss": 2.6588, "step": 5599 }, { "epoch": 0.15, "learning_rate": 0.0019248342570464567, "loss": 2.5972, "step": 5600 }, { "epoch": 0.15, "learning_rate": 0.0019248011464154833, "loss": 2.7609, "step": 5601 }, { "epoch": 0.15, "learning_rate": 0.0019247680287783817, "loss": 1.9775, "step": 5602 }, { "epoch": 0.15, "learning_rate": 0.001924734904135403, "loss": 2.5334, "step": 5603 }, { "epoch": 0.15, "learning_rate": 0.0019247017724867979, "loss": 3.1705, "step": 5604 }, { "epoch": 0.15, "learning_rate": 0.0019246686338328174, "loss": 2.9404, "step": 5605 }, { "epoch": 0.15, "learning_rate": 0.0019246354881737129, "loss": 2.6287, "step": 5606 }, { "epoch": 0.15, "learning_rate": 0.0019246023355097349, "loss": 2.6226, "step": 5607 }, { "epoch": 0.15, "learning_rate": 0.0019245691758411352, "loss": 2.4065, "step": 5608 }, { "epoch": 0.15, "learning_rate": 0.0019245360091681648, "loss": 2.5111, "step": 5609 }, { "epoch": 0.15, "learning_rate": 0.0019245028354910746, "loss": 2.7885, "step": 5610 }, { "epoch": 0.15, "learning_rate": 0.0019244696548101161, "loss": 2.7792, "step": 5611 }, { "epoch": 0.15, "learning_rate": 0.001924436467125541, "loss": 2.3969, "step": 5612 }, { "epoch": 0.15, "learning_rate": 0.0019244032724376006, "loss": 2.7461, "step": 5613 }, { "epoch": 0.15, "learning_rate": 0.001924370070746546, "loss": 3.4588, "step": 5614 }, { "epoch": 0.15, "learning_rate": 0.0019243368620526294, "loss": 2.367, "step": 5615 }, { "epoch": 0.15, "learning_rate": 0.0019243036463561017, "loss": 2.659, "step": 5616 }, { "epoch": 0.15, "learning_rate": 0.0019242704236572148, "loss": 2.4741, "step": 5617 }, { "epoch": 0.15, "learning_rate": 0.0019242371939562207, "loss": 2.7427, "step": 5618 }, { "epoch": 0.15, "learning_rate": 0.0019242039572533705, "loss": 2.969, "step": 5619 }, { "epoch": 0.15, "learning_rate": 0.0019241707135489166, "loss": 3.219, "step": 5620 }, { "epoch": 0.15, "learning_rate": 0.0019241374628431104, "loss": 2.8379, "step": 5621 }, { "epoch": 0.15, "learning_rate": 0.001924104205136204, "loss": 2.9936, "step": 5622 }, { "epoch": 0.15, "learning_rate": 0.0019240709404284497, "loss": 2.4764, "step": 5623 }, { "epoch": 0.15, "learning_rate": 0.0019240376687200988, "loss": 2.2813, "step": 5624 }, { "epoch": 0.15, "learning_rate": 0.001924004390011404, "loss": 2.8188, "step": 5625 }, { "epoch": 0.15, "learning_rate": 0.001923971104302617, "loss": 1.9956, "step": 5626 }, { "epoch": 0.15, "learning_rate": 0.0019239378115939898, "loss": 2.8699, "step": 5627 }, { "epoch": 0.15, "learning_rate": 0.0019239045118857755, "loss": 3.2597, "step": 5628 }, { "epoch": 0.15, "learning_rate": 0.0019238712051782255, "loss": 2.3204, "step": 5629 }, { "epoch": 0.15, "learning_rate": 0.0019238378914715924, "loss": 2.8181, "step": 5630 }, { "epoch": 0.15, "learning_rate": 0.0019238045707661287, "loss": 3.0441, "step": 5631 }, { "epoch": 0.15, "learning_rate": 0.0019237712430620866, "loss": 2.897, "step": 5632 }, { "epoch": 0.15, "learning_rate": 0.0019237379083597186, "loss": 2.9224, "step": 5633 }, { "epoch": 0.15, "learning_rate": 0.0019237045666592777, "loss": 2.443, "step": 5634 }, { "epoch": 0.15, "learning_rate": 0.001923671217961016, "loss": 2.6641, "step": 5635 }, { "epoch": 0.15, "learning_rate": 0.0019236378622651863, "loss": 3.0019, "step": 5636 }, { "epoch": 0.15, "learning_rate": 0.0019236044995720413, "loss": 2.6665, "step": 5637 }, { "epoch": 0.15, "learning_rate": 0.0019235711298818336, "loss": 3.0458, "step": 5638 }, { "epoch": 0.15, "learning_rate": 0.0019235377531948163, "loss": 2.0893, "step": 5639 }, { "epoch": 0.15, "learning_rate": 0.001923504369511242, "loss": 3.191, "step": 5640 }, { "epoch": 0.15, "learning_rate": 0.0019234709788313637, "loss": 2.8095, "step": 5641 }, { "epoch": 0.15, "learning_rate": 0.0019234375811554344, "loss": 2.4884, "step": 5642 }, { "epoch": 0.15, "learning_rate": 0.001923404176483707, "loss": 2.5757, "step": 5643 }, { "epoch": 0.15, "learning_rate": 0.001923370764816435, "loss": 2.4396, "step": 5644 }, { "epoch": 0.15, "learning_rate": 0.0019233373461538708, "loss": 2.7748, "step": 5645 }, { "epoch": 0.15, "learning_rate": 0.0019233039204962679, "loss": 2.5844, "step": 5646 }, { "epoch": 0.15, "learning_rate": 0.0019232704878438798, "loss": 2.3769, "step": 5647 }, { "epoch": 0.15, "learning_rate": 0.0019232370481969596, "loss": 2.5011, "step": 5648 }, { "epoch": 0.15, "learning_rate": 0.0019232036015557603, "loss": 2.7621, "step": 5649 }, { "epoch": 0.15, "learning_rate": 0.0019231701479205357, "loss": 2.6531, "step": 5650 }, { "epoch": 0.15, "learning_rate": 0.0019231366872915392, "loss": 2.9754, "step": 5651 }, { "epoch": 0.15, "learning_rate": 0.001923103219669024, "loss": 2.3321, "step": 5652 }, { "epoch": 0.15, "learning_rate": 0.001923069745053244, "loss": 2.399, "step": 5653 }, { "epoch": 0.15, "learning_rate": 0.0019230362634444526, "loss": 2.5971, "step": 5654 }, { "epoch": 0.15, "learning_rate": 0.0019230027748429036, "loss": 2.6846, "step": 5655 }, { "epoch": 0.15, "learning_rate": 0.0019229692792488505, "loss": 2.5435, "step": 5656 }, { "epoch": 0.15, "learning_rate": 0.001922935776662547, "loss": 2.695, "step": 5657 }, { "epoch": 0.15, "learning_rate": 0.0019229022670842473, "loss": 2.5623, "step": 5658 }, { "epoch": 0.15, "learning_rate": 0.001922868750514205, "loss": 2.7773, "step": 5659 }, { "epoch": 0.15, "learning_rate": 0.0019228352269526738, "loss": 2.2697, "step": 5660 }, { "epoch": 0.15, "learning_rate": 0.0019228016963999083, "loss": 2.7064, "step": 5661 }, { "epoch": 0.15, "learning_rate": 0.0019227681588561616, "loss": 2.2393, "step": 5662 }, { "epoch": 0.15, "learning_rate": 0.0019227346143216887, "loss": 2.8261, "step": 5663 }, { "epoch": 0.15, "learning_rate": 0.0019227010627967435, "loss": 2.9701, "step": 5664 }, { "epoch": 0.15, "learning_rate": 0.0019226675042815795, "loss": 2.4552, "step": 5665 }, { "epoch": 0.15, "learning_rate": 0.0019226339387764517, "loss": 2.7909, "step": 5666 }, { "epoch": 0.15, "learning_rate": 0.001922600366281614, "loss": 2.8949, "step": 5667 }, { "epoch": 0.15, "learning_rate": 0.0019225667867973214, "loss": 2.5545, "step": 5668 }, { "epoch": 0.15, "learning_rate": 0.0019225332003238271, "loss": 2.5091, "step": 5669 }, { "epoch": 0.15, "learning_rate": 0.0019224996068613865, "loss": 2.6891, "step": 5670 }, { "epoch": 0.15, "learning_rate": 0.0019224660064102537, "loss": 2.6697, "step": 5671 }, { "epoch": 0.15, "learning_rate": 0.0019224323989706835, "loss": 2.7914, "step": 5672 }, { "epoch": 0.15, "learning_rate": 0.0019223987845429305, "loss": 2.9121, "step": 5673 }, { "epoch": 0.15, "learning_rate": 0.0019223651631272488, "loss": 2.6312, "step": 5674 }, { "epoch": 0.15, "learning_rate": 0.0019223315347238938, "loss": 2.2629, "step": 5675 }, { "epoch": 0.15, "learning_rate": 0.00192229789933312, "loss": 2.625, "step": 5676 }, { "epoch": 0.15, "learning_rate": 0.001922264256955182, "loss": 2.8258, "step": 5677 }, { "epoch": 0.15, "learning_rate": 0.001922230607590335, "loss": 2.7349, "step": 5678 }, { "epoch": 0.15, "learning_rate": 0.001922196951238834, "loss": 2.8999, "step": 5679 }, { "epoch": 0.15, "learning_rate": 0.0019221632879009335, "loss": 3.1515, "step": 5680 }, { "epoch": 0.15, "learning_rate": 0.0019221296175768888, "loss": 2.922, "step": 5681 }, { "epoch": 0.15, "learning_rate": 0.0019220959402669552, "loss": 2.8204, "step": 5682 }, { "epoch": 0.15, "learning_rate": 0.0019220622559713873, "loss": 2.2871, "step": 5683 }, { "epoch": 0.15, "learning_rate": 0.0019220285646904408, "loss": 2.6308, "step": 5684 }, { "epoch": 0.15, "learning_rate": 0.0019219948664243706, "loss": 2.5256, "step": 5685 }, { "epoch": 0.15, "learning_rate": 0.0019219611611734325, "loss": 2.6437, "step": 5686 }, { "epoch": 0.15, "learning_rate": 0.0019219274489378812, "loss": 2.8488, "step": 5687 }, { "epoch": 0.15, "learning_rate": 0.001921893729717972, "loss": 2.5876, "step": 5688 }, { "epoch": 0.15, "learning_rate": 0.0019218600035139613, "loss": 2.346, "step": 5689 }, { "epoch": 0.15, "learning_rate": 0.0019218262703261037, "loss": 2.5462, "step": 5690 }, { "epoch": 0.15, "learning_rate": 0.0019217925301546553, "loss": 2.3783, "step": 5691 }, { "epoch": 0.15, "learning_rate": 0.0019217587829998713, "loss": 2.3581, "step": 5692 }, { "epoch": 0.15, "learning_rate": 0.0019217250288620078, "loss": 3.2029, "step": 5693 }, { "epoch": 0.15, "learning_rate": 0.0019216912677413201, "loss": 2.5821, "step": 5694 }, { "epoch": 0.15, "learning_rate": 0.001921657499638064, "loss": 2.6013, "step": 5695 }, { "epoch": 0.15, "learning_rate": 0.0019216237245524956, "loss": 2.6053, "step": 5696 }, { "epoch": 0.15, "learning_rate": 0.0019215899424848708, "loss": 2.7767, "step": 5697 }, { "epoch": 0.15, "learning_rate": 0.0019215561534354454, "loss": 2.5338, "step": 5698 }, { "epoch": 0.15, "learning_rate": 0.0019215223574044749, "loss": 2.6148, "step": 5699 }, { "epoch": 0.15, "learning_rate": 0.0019214885543922162, "loss": 2.6711, "step": 5700 }, { "epoch": 0.15, "learning_rate": 0.0019214547443989248, "loss": 2.3979, "step": 5701 }, { "epoch": 0.15, "learning_rate": 0.0019214209274248568, "loss": 2.3197, "step": 5702 }, { "epoch": 0.15, "learning_rate": 0.0019213871034702691, "loss": 2.8668, "step": 5703 }, { "epoch": 0.15, "learning_rate": 0.0019213532725354168, "loss": 2.3312, "step": 5704 }, { "epoch": 0.15, "learning_rate": 0.0019213194346205573, "loss": 2.8927, "step": 5705 }, { "epoch": 0.15, "learning_rate": 0.0019212855897259465, "loss": 2.8742, "step": 5706 }, { "epoch": 0.15, "learning_rate": 0.0019212517378518403, "loss": 2.5002, "step": 5707 }, { "epoch": 0.15, "learning_rate": 0.0019212178789984962, "loss": 2.5698, "step": 5708 }, { "epoch": 0.15, "learning_rate": 0.0019211840131661698, "loss": 2.4231, "step": 5709 }, { "epoch": 0.15, "learning_rate": 0.001921150140355118, "loss": 2.7929, "step": 5710 }, { "epoch": 0.15, "learning_rate": 0.0019211162605655976, "loss": 2.6953, "step": 5711 }, { "epoch": 0.15, "learning_rate": 0.0019210823737978648, "loss": 2.5825, "step": 5712 }, { "epoch": 0.15, "learning_rate": 0.0019210484800521771, "loss": 2.6712, "step": 5713 }, { "epoch": 0.15, "learning_rate": 0.0019210145793287904, "loss": 2.9008, "step": 5714 }, { "epoch": 0.15, "learning_rate": 0.0019209806716279619, "loss": 3.0272, "step": 5715 }, { "epoch": 0.15, "learning_rate": 0.0019209467569499489, "loss": 2.4733, "step": 5716 }, { "epoch": 0.15, "learning_rate": 0.0019209128352950073, "loss": 2.6945, "step": 5717 }, { "epoch": 0.15, "learning_rate": 0.0019208789066633952, "loss": 2.565, "step": 5718 }, { "epoch": 0.15, "learning_rate": 0.0019208449710553688, "loss": 2.7254, "step": 5719 }, { "epoch": 0.15, "learning_rate": 0.001920811028471186, "loss": 2.7905, "step": 5720 }, { "epoch": 0.15, "learning_rate": 0.001920777078911103, "loss": 2.5994, "step": 5721 }, { "epoch": 0.15, "learning_rate": 0.0019207431223753778, "loss": 2.37, "step": 5722 }, { "epoch": 0.15, "learning_rate": 0.001920709158864267, "loss": 2.6943, "step": 5723 }, { "epoch": 0.15, "learning_rate": 0.0019206751883780284, "loss": 2.5931, "step": 5724 }, { "epoch": 0.15, "learning_rate": 0.001920641210916919, "loss": 2.4727, "step": 5725 }, { "epoch": 0.15, "learning_rate": 0.0019206072264811964, "loss": 2.8423, "step": 5726 }, { "epoch": 0.15, "learning_rate": 0.0019205732350711182, "loss": 2.8291, "step": 5727 }, { "epoch": 0.15, "learning_rate": 0.001920539236686942, "loss": 2.6877, "step": 5728 }, { "epoch": 0.15, "learning_rate": 0.0019205052313289249, "loss": 2.6028, "step": 5729 }, { "epoch": 0.15, "learning_rate": 0.0019204712189973246, "loss": 2.0788, "step": 5730 }, { "epoch": 0.15, "learning_rate": 0.0019204371996923988, "loss": 2.7694, "step": 5731 }, { "epoch": 0.15, "learning_rate": 0.0019204031734144057, "loss": 2.4975, "step": 5732 }, { "epoch": 0.15, "learning_rate": 0.0019203691401636026, "loss": 2.6031, "step": 5733 }, { "epoch": 0.15, "learning_rate": 0.0019203350999402473, "loss": 2.9282, "step": 5734 }, { "epoch": 0.15, "learning_rate": 0.0019203010527445979, "loss": 2.7625, "step": 5735 }, { "epoch": 0.15, "learning_rate": 0.001920266998576912, "loss": 2.6739, "step": 5736 }, { "epoch": 0.15, "learning_rate": 0.0019202329374374482, "loss": 2.6378, "step": 5737 }, { "epoch": 0.15, "learning_rate": 0.0019201988693264642, "loss": 2.6318, "step": 5738 }, { "epoch": 0.15, "learning_rate": 0.001920164794244218, "loss": 3.0277, "step": 5739 }, { "epoch": 0.15, "learning_rate": 0.0019201307121909678, "loss": 2.203, "step": 5740 }, { "epoch": 0.15, "learning_rate": 0.0019200966231669718, "loss": 2.3482, "step": 5741 }, { "epoch": 0.15, "learning_rate": 0.0019200625271724885, "loss": 2.4722, "step": 5742 }, { "epoch": 0.15, "learning_rate": 0.0019200284242077757, "loss": 2.5567, "step": 5743 }, { "epoch": 0.15, "learning_rate": 0.001919994314273092, "loss": 2.4918, "step": 5744 }, { "epoch": 0.15, "learning_rate": 0.0019199601973686961, "loss": 2.6627, "step": 5745 }, { "epoch": 0.15, "learning_rate": 0.001919926073494846, "loss": 2.724, "step": 5746 }, { "epoch": 0.15, "learning_rate": 0.0019198919426518008, "loss": 2.5422, "step": 5747 }, { "epoch": 0.15, "learning_rate": 0.0019198578048398183, "loss": 2.7884, "step": 5748 }, { "epoch": 0.15, "learning_rate": 0.0019198236600591577, "loss": 2.7008, "step": 5749 }, { "epoch": 0.15, "learning_rate": 0.0019197895083100773, "loss": 2.6008, "step": 5750 }, { "epoch": 0.15, "learning_rate": 0.0019197553495928364, "loss": 2.4591, "step": 5751 }, { "epoch": 0.15, "learning_rate": 0.0019197211839076932, "loss": 2.9741, "step": 5752 }, { "epoch": 0.15, "learning_rate": 0.001919687011254907, "loss": 2.697, "step": 5753 }, { "epoch": 0.15, "learning_rate": 0.001919652831634736, "loss": 2.604, "step": 5754 }, { "epoch": 0.15, "learning_rate": 0.0019196186450474398, "loss": 2.2559, "step": 5755 }, { "epoch": 0.15, "learning_rate": 0.001919584451493277, "loss": 2.6589, "step": 5756 }, { "epoch": 0.15, "learning_rate": 0.001919550250972507, "loss": 2.9713, "step": 5757 }, { "epoch": 0.15, "learning_rate": 0.0019195160434853885, "loss": 2.3879, "step": 5758 }, { "epoch": 0.15, "learning_rate": 0.001919481829032181, "loss": 2.6773, "step": 5759 }, { "epoch": 0.15, "learning_rate": 0.0019194476076131437, "loss": 2.5165, "step": 5760 }, { "epoch": 0.15, "learning_rate": 0.0019194133792285353, "loss": 2.647, "step": 5761 }, { "epoch": 0.15, "learning_rate": 0.001919379143878616, "loss": 2.7458, "step": 5762 }, { "epoch": 0.15, "learning_rate": 0.0019193449015636444, "loss": 2.7501, "step": 5763 }, { "epoch": 0.15, "learning_rate": 0.0019193106522838801, "loss": 2.6259, "step": 5764 }, { "epoch": 0.15, "learning_rate": 0.0019192763960395828, "loss": 2.7527, "step": 5765 }, { "epoch": 0.15, "learning_rate": 0.0019192421328310116, "loss": 2.8087, "step": 5766 }, { "epoch": 0.15, "learning_rate": 0.0019192078626584267, "loss": 2.7155, "step": 5767 }, { "epoch": 0.16, "learning_rate": 0.0019191735855220871, "loss": 2.8187, "step": 5768 }, { "epoch": 0.16, "learning_rate": 0.0019191393014222529, "loss": 2.6513, "step": 5769 }, { "epoch": 0.16, "learning_rate": 0.001919105010359184, "loss": 2.679, "step": 5770 }, { "epoch": 0.16, "learning_rate": 0.0019190707123331392, "loss": 2.7961, "step": 5771 }, { "epoch": 0.16, "learning_rate": 0.0019190364073443794, "loss": 2.7787, "step": 5772 }, { "epoch": 0.16, "learning_rate": 0.001919002095393164, "loss": 2.87, "step": 5773 }, { "epoch": 0.16, "learning_rate": 0.0019189677764797533, "loss": 2.9189, "step": 5774 }, { "epoch": 0.16, "learning_rate": 0.0019189334506044067, "loss": 2.9941, "step": 5775 }, { "epoch": 0.16, "learning_rate": 0.0019188991177673846, "loss": 3.2142, "step": 5776 }, { "epoch": 0.16, "learning_rate": 0.0019188647779689472, "loss": 2.4996, "step": 5777 }, { "epoch": 0.16, "learning_rate": 0.0019188304312093543, "loss": 2.2178, "step": 5778 }, { "epoch": 0.16, "learning_rate": 0.0019187960774888664, "loss": 2.6794, "step": 5779 }, { "epoch": 0.16, "learning_rate": 0.0019187617168077438, "loss": 2.9308, "step": 5780 }, { "epoch": 0.16, "learning_rate": 0.0019187273491662468, "loss": 2.3741, "step": 5781 }, { "epoch": 0.16, "learning_rate": 0.0019186929745646354, "loss": 2.6613, "step": 5782 }, { "epoch": 0.16, "learning_rate": 0.0019186585930031704, "loss": 2.5315, "step": 5783 }, { "epoch": 0.16, "learning_rate": 0.001918624204482112, "loss": 3.0023, "step": 5784 }, { "epoch": 0.16, "learning_rate": 0.0019185898090017211, "loss": 2.6819, "step": 5785 }, { "epoch": 0.16, "learning_rate": 0.0019185554065622578, "loss": 2.8355, "step": 5786 }, { "epoch": 0.16, "learning_rate": 0.001918520997163983, "loss": 2.5436, "step": 5787 }, { "epoch": 0.16, "learning_rate": 0.0019184865808071572, "loss": 2.7024, "step": 5788 }, { "epoch": 0.16, "learning_rate": 0.0019184521574920415, "loss": 2.8901, "step": 5789 }, { "epoch": 0.16, "learning_rate": 0.0019184177272188966, "loss": 2.6793, "step": 5790 }, { "epoch": 0.16, "learning_rate": 0.001918383289987983, "loss": 2.508, "step": 5791 }, { "epoch": 0.16, "learning_rate": 0.001918348845799562, "loss": 2.6614, "step": 5792 }, { "epoch": 0.16, "learning_rate": 0.001918314394653894, "loss": 2.5147, "step": 5793 }, { "epoch": 0.16, "learning_rate": 0.0019182799365512404, "loss": 2.7426, "step": 5794 }, { "epoch": 0.16, "learning_rate": 0.0019182454714918623, "loss": 2.7298, "step": 5795 }, { "epoch": 0.16, "learning_rate": 0.0019182109994760204, "loss": 2.4816, "step": 5796 }, { "epoch": 0.16, "learning_rate": 0.0019181765205039765, "loss": 2.9616, "step": 5797 }, { "epoch": 0.16, "learning_rate": 0.0019181420345759914, "loss": 2.8566, "step": 5798 }, { "epoch": 0.16, "learning_rate": 0.0019181075416923263, "loss": 2.889, "step": 5799 }, { "epoch": 0.16, "learning_rate": 0.0019180730418532424, "loss": 2.8701, "step": 5800 }, { "epoch": 0.16, "learning_rate": 0.0019180385350590014, "loss": 2.5401, "step": 5801 }, { "epoch": 0.16, "learning_rate": 0.0019180040213098647, "loss": 2.88, "step": 5802 }, { "epoch": 0.16, "learning_rate": 0.0019179695006060937, "loss": 2.3145, "step": 5803 }, { "epoch": 0.16, "learning_rate": 0.0019179349729479497, "loss": 2.4924, "step": 5804 }, { "epoch": 0.16, "learning_rate": 0.0019179004383356943, "loss": 2.7722, "step": 5805 }, { "epoch": 0.16, "learning_rate": 0.0019178658967695897, "loss": 2.356, "step": 5806 }, { "epoch": 0.16, "learning_rate": 0.001917831348249897, "loss": 3.0572, "step": 5807 }, { "epoch": 0.16, "learning_rate": 0.001917796792776878, "loss": 2.6679, "step": 5808 }, { "epoch": 0.16, "learning_rate": 0.0019177622303507946, "loss": 2.3871, "step": 5809 }, { "epoch": 0.16, "learning_rate": 0.001917727660971909, "loss": 2.5746, "step": 5810 }, { "epoch": 0.16, "learning_rate": 0.0019176930846404824, "loss": 2.5101, "step": 5811 }, { "epoch": 0.16, "learning_rate": 0.0019176585013567769, "loss": 2.6426, "step": 5812 }, { "epoch": 0.16, "learning_rate": 0.001917623911121055, "loss": 2.6679, "step": 5813 }, { "epoch": 0.16, "learning_rate": 0.001917589313933578, "loss": 2.3692, "step": 5814 }, { "epoch": 0.16, "learning_rate": 0.0019175547097946086, "loss": 2.3929, "step": 5815 }, { "epoch": 0.16, "learning_rate": 0.0019175200987044088, "loss": 2.42, "step": 5816 }, { "epoch": 0.16, "learning_rate": 0.001917485480663241, "loss": 2.6387, "step": 5817 }, { "epoch": 0.16, "learning_rate": 0.001917450855671367, "loss": 2.5774, "step": 5818 }, { "epoch": 0.16, "learning_rate": 0.0019174162237290493, "loss": 2.5622, "step": 5819 }, { "epoch": 0.16, "learning_rate": 0.0019173815848365502, "loss": 3.1618, "step": 5820 }, { "epoch": 0.16, "learning_rate": 0.0019173469389941326, "loss": 2.5708, "step": 5821 }, { "epoch": 0.16, "learning_rate": 0.001917312286202058, "loss": 2.703, "step": 5822 }, { "epoch": 0.16, "learning_rate": 0.00191727762646059, "loss": 2.9351, "step": 5823 }, { "epoch": 0.16, "learning_rate": 0.0019172429597699905, "loss": 2.4675, "step": 5824 }, { "epoch": 0.16, "learning_rate": 0.0019172082861305224, "loss": 2.3562, "step": 5825 }, { "epoch": 0.16, "learning_rate": 0.0019171736055424485, "loss": 2.554, "step": 5826 }, { "epoch": 0.16, "learning_rate": 0.0019171389180060313, "loss": 2.8199, "step": 5827 }, { "epoch": 0.16, "learning_rate": 0.0019171042235215333, "loss": 3.0751, "step": 5828 }, { "epoch": 0.16, "learning_rate": 0.0019170695220892178, "loss": 2.6455, "step": 5829 }, { "epoch": 0.16, "learning_rate": 0.0019170348137093477, "loss": 2.8422, "step": 5830 }, { "epoch": 0.16, "learning_rate": 0.0019170000983821855, "loss": 2.6314, "step": 5831 }, { "epoch": 0.16, "learning_rate": 0.0019169653761079949, "loss": 2.6857, "step": 5832 }, { "epoch": 0.16, "learning_rate": 0.0019169306468870381, "loss": 2.5137, "step": 5833 }, { "epoch": 0.16, "learning_rate": 0.0019168959107195792, "loss": 2.5905, "step": 5834 }, { "epoch": 0.16, "learning_rate": 0.0019168611676058803, "loss": 2.7097, "step": 5835 }, { "epoch": 0.16, "learning_rate": 0.0019168264175462052, "loss": 3.3323, "step": 5836 }, { "epoch": 0.16, "learning_rate": 0.0019167916605408173, "loss": 2.7895, "step": 5837 }, { "epoch": 0.16, "learning_rate": 0.0019167568965899795, "loss": 3.0687, "step": 5838 }, { "epoch": 0.16, "learning_rate": 0.0019167221256939555, "loss": 2.8797, "step": 5839 }, { "epoch": 0.16, "learning_rate": 0.0019166873478530086, "loss": 2.8398, "step": 5840 }, { "epoch": 0.16, "learning_rate": 0.0019166525630674022, "loss": 2.5643, "step": 5841 }, { "epoch": 0.16, "learning_rate": 0.0019166177713373998, "loss": 2.78, "step": 5842 }, { "epoch": 0.16, "learning_rate": 0.001916582972663265, "loss": 2.4429, "step": 5843 }, { "epoch": 0.16, "learning_rate": 0.0019165481670452614, "loss": 2.3916, "step": 5844 }, { "epoch": 0.16, "learning_rate": 0.0019165133544836528, "loss": 2.6995, "step": 5845 }, { "epoch": 0.16, "learning_rate": 0.0019164785349787034, "loss": 3.1419, "step": 5846 }, { "epoch": 0.16, "learning_rate": 0.0019164437085306756, "loss": 2.7869, "step": 5847 }, { "epoch": 0.16, "learning_rate": 0.0019164088751398346, "loss": 2.9454, "step": 5848 }, { "epoch": 0.16, "learning_rate": 0.0019163740348064437, "loss": 2.5224, "step": 5849 }, { "epoch": 0.16, "learning_rate": 0.0019163391875307672, "loss": 2.2502, "step": 5850 }, { "epoch": 0.16, "learning_rate": 0.0019163043333130685, "loss": 2.7106, "step": 5851 }, { "epoch": 0.16, "learning_rate": 0.001916269472153612, "loss": 2.8569, "step": 5852 }, { "epoch": 0.16, "learning_rate": 0.001916234604052662, "loss": 2.7404, "step": 5853 }, { "epoch": 0.16, "learning_rate": 0.0019161997290104823, "loss": 2.449, "step": 5854 }, { "epoch": 0.16, "learning_rate": 0.0019161648470273373, "loss": 2.9922, "step": 5855 }, { "epoch": 0.16, "learning_rate": 0.0019161299581034912, "loss": 2.571, "step": 5856 }, { "epoch": 0.16, "learning_rate": 0.0019160950622392084, "loss": 3.0287, "step": 5857 }, { "epoch": 0.16, "learning_rate": 0.0019160601594347532, "loss": 2.8497, "step": 5858 }, { "epoch": 0.16, "learning_rate": 0.00191602524969039, "loss": 2.5385, "step": 5859 }, { "epoch": 0.16, "learning_rate": 0.0019159903330063831, "loss": 2.7712, "step": 5860 }, { "epoch": 0.16, "learning_rate": 0.0019159554093829971, "loss": 3.1048, "step": 5861 }, { "epoch": 0.16, "learning_rate": 0.0019159204788204971, "loss": 2.5292, "step": 5862 }, { "epoch": 0.16, "learning_rate": 0.0019158855413191473, "loss": 2.2494, "step": 5863 }, { "epoch": 0.16, "learning_rate": 0.0019158505968792118, "loss": 2.8651, "step": 5864 }, { "epoch": 0.16, "learning_rate": 0.0019158156455009565, "loss": 2.3985, "step": 5865 }, { "epoch": 0.16, "learning_rate": 0.0019157806871846455, "loss": 2.9401, "step": 5866 }, { "epoch": 0.16, "learning_rate": 0.0019157457219305437, "loss": 2.5318, "step": 5867 }, { "epoch": 0.16, "learning_rate": 0.0019157107497389156, "loss": 2.8827, "step": 5868 }, { "epoch": 0.16, "learning_rate": 0.0019156757706100271, "loss": 2.8769, "step": 5869 }, { "epoch": 0.16, "learning_rate": 0.0019156407845441427, "loss": 2.459, "step": 5870 }, { "epoch": 0.16, "learning_rate": 0.0019156057915415271, "loss": 2.5178, "step": 5871 }, { "epoch": 0.16, "learning_rate": 0.0019155707916024458, "loss": 2.4529, "step": 5872 }, { "epoch": 0.16, "learning_rate": 0.001915535784727164, "loss": 2.3935, "step": 5873 }, { "epoch": 0.16, "learning_rate": 0.0019155007709159466, "loss": 2.4588, "step": 5874 }, { "epoch": 0.16, "learning_rate": 0.0019154657501690591, "loss": 2.7682, "step": 5875 }, { "epoch": 0.16, "learning_rate": 0.001915430722486767, "loss": 3.1792, "step": 5876 }, { "epoch": 0.16, "learning_rate": 0.0019153956878693351, "loss": 2.9017, "step": 5877 }, { "epoch": 0.16, "learning_rate": 0.0019153606463170293, "loss": 2.6377, "step": 5878 }, { "epoch": 0.16, "learning_rate": 0.0019153255978301147, "loss": 2.7014, "step": 5879 }, { "epoch": 0.16, "learning_rate": 0.0019152905424088572, "loss": 2.5768, "step": 5880 }, { "epoch": 0.16, "learning_rate": 0.001915255480053522, "loss": 2.473, "step": 5881 }, { "epoch": 0.16, "learning_rate": 0.0019152204107643752, "loss": 2.9204, "step": 5882 }, { "epoch": 0.16, "learning_rate": 0.001915185334541682, "loss": 2.8753, "step": 5883 }, { "epoch": 0.16, "learning_rate": 0.0019151502513857083, "loss": 2.7436, "step": 5884 }, { "epoch": 0.16, "learning_rate": 0.00191511516129672, "loss": 3.2155, "step": 5885 }, { "epoch": 0.16, "learning_rate": 0.001915080064274983, "loss": 2.497, "step": 5886 }, { "epoch": 0.16, "learning_rate": 0.0019150449603207624, "loss": 2.8057, "step": 5887 }, { "epoch": 0.16, "learning_rate": 0.0019150098494343252, "loss": 2.6294, "step": 5888 }, { "epoch": 0.16, "learning_rate": 0.0019149747316159372, "loss": 2.8959, "step": 5889 }, { "epoch": 0.16, "learning_rate": 0.001914939606865864, "loss": 2.3523, "step": 5890 }, { "epoch": 0.16, "learning_rate": 0.001914904475184372, "loss": 2.5813, "step": 5891 }, { "epoch": 0.16, "learning_rate": 0.001914869336571727, "loss": 2.2058, "step": 5892 }, { "epoch": 0.16, "learning_rate": 0.0019148341910281957, "loss": 2.7507, "step": 5893 }, { "epoch": 0.16, "learning_rate": 0.001914799038554044, "loss": 2.5346, "step": 5894 }, { "epoch": 0.16, "learning_rate": 0.0019147638791495386, "loss": 2.5496, "step": 5895 }, { "epoch": 0.16, "learning_rate": 0.0019147287128149454, "loss": 2.5818, "step": 5896 }, { "epoch": 0.16, "learning_rate": 0.0019146935395505309, "loss": 2.7158, "step": 5897 }, { "epoch": 0.16, "learning_rate": 0.001914658359356562, "loss": 2.9291, "step": 5898 }, { "epoch": 0.16, "learning_rate": 0.0019146231722333045, "loss": 2.8691, "step": 5899 }, { "epoch": 0.16, "learning_rate": 0.0019145879781810257, "loss": 2.8716, "step": 5900 }, { "epoch": 0.16, "learning_rate": 0.0019145527771999916, "loss": 2.6183, "step": 5901 }, { "epoch": 0.16, "learning_rate": 0.0019145175692904693, "loss": 2.5772, "step": 5902 }, { "epoch": 0.16, "learning_rate": 0.0019144823544527255, "loss": 2.9135, "step": 5903 }, { "epoch": 0.16, "learning_rate": 0.0019144471326870268, "loss": 2.6797, "step": 5904 }, { "epoch": 0.16, "learning_rate": 0.00191441190399364, "loss": 2.7299, "step": 5905 }, { "epoch": 0.16, "learning_rate": 0.001914376668372832, "loss": 2.8464, "step": 5906 }, { "epoch": 0.16, "learning_rate": 0.0019143414258248703, "loss": 2.9771, "step": 5907 }, { "epoch": 0.16, "learning_rate": 0.0019143061763500211, "loss": 2.9262, "step": 5908 }, { "epoch": 0.16, "learning_rate": 0.0019142709199485518, "loss": 2.6315, "step": 5909 }, { "epoch": 0.16, "learning_rate": 0.0019142356566207296, "loss": 2.7867, "step": 5910 }, { "epoch": 0.16, "learning_rate": 0.0019142003863668214, "loss": 2.9913, "step": 5911 }, { "epoch": 0.16, "learning_rate": 0.0019141651091870945, "loss": 2.6796, "step": 5912 }, { "epoch": 0.16, "learning_rate": 0.0019141298250818161, "loss": 2.5056, "step": 5913 }, { "epoch": 0.16, "learning_rate": 0.0019140945340512536, "loss": 2.516, "step": 5914 }, { "epoch": 0.16, "learning_rate": 0.0019140592360956746, "loss": 2.4746, "step": 5915 }, { "epoch": 0.16, "learning_rate": 0.001914023931215346, "loss": 3.0453, "step": 5916 }, { "epoch": 0.16, "learning_rate": 0.0019139886194105356, "loss": 2.4371, "step": 5917 }, { "epoch": 0.16, "learning_rate": 0.0019139533006815106, "loss": 2.5716, "step": 5918 }, { "epoch": 0.16, "learning_rate": 0.001913917975028539, "loss": 2.6145, "step": 5919 }, { "epoch": 0.16, "learning_rate": 0.0019138826424518883, "loss": 2.636, "step": 5920 }, { "epoch": 0.16, "learning_rate": 0.001913847302951826, "loss": 2.7834, "step": 5921 }, { "epoch": 0.16, "learning_rate": 0.0019138119565286198, "loss": 2.3049, "step": 5922 }, { "epoch": 0.16, "learning_rate": 0.0019137766031825376, "loss": 2.4495, "step": 5923 }, { "epoch": 0.16, "learning_rate": 0.0019137412429138475, "loss": 3.005, "step": 5924 }, { "epoch": 0.16, "learning_rate": 0.0019137058757228167, "loss": 2.6198, "step": 5925 }, { "epoch": 0.16, "learning_rate": 0.001913670501609714, "loss": 2.9363, "step": 5926 }, { "epoch": 0.16, "learning_rate": 0.0019136351205748066, "loss": 2.6722, "step": 5927 }, { "epoch": 0.16, "learning_rate": 0.0019135997326183629, "loss": 2.5239, "step": 5928 }, { "epoch": 0.16, "learning_rate": 0.0019135643377406512, "loss": 2.4687, "step": 5929 }, { "epoch": 0.16, "learning_rate": 0.001913528935941939, "loss": 2.7155, "step": 5930 }, { "epoch": 0.16, "learning_rate": 0.001913493527222495, "loss": 3.0277, "step": 5931 }, { "epoch": 0.16, "learning_rate": 0.0019134581115825876, "loss": 2.537, "step": 5932 }, { "epoch": 0.16, "learning_rate": 0.0019134226890224848, "loss": 2.8394, "step": 5933 }, { "epoch": 0.16, "learning_rate": 0.001913387259542455, "loss": 2.5392, "step": 5934 }, { "epoch": 0.16, "learning_rate": 0.0019133518231427664, "loss": 2.5663, "step": 5935 }, { "epoch": 0.16, "learning_rate": 0.001913316379823688, "loss": 2.53, "step": 5936 }, { "epoch": 0.16, "learning_rate": 0.0019132809295854879, "loss": 2.579, "step": 5937 }, { "epoch": 0.16, "learning_rate": 0.0019132454724284345, "loss": 2.9664, "step": 5938 }, { "epoch": 0.16, "learning_rate": 0.001913210008352797, "loss": 2.7526, "step": 5939 }, { "epoch": 0.16, "learning_rate": 0.0019131745373588435, "loss": 2.6101, "step": 5940 }, { "epoch": 0.16, "learning_rate": 0.0019131390594468432, "loss": 2.4341, "step": 5941 }, { "epoch": 0.16, "learning_rate": 0.0019131035746170646, "loss": 2.7639, "step": 5942 }, { "epoch": 0.16, "learning_rate": 0.0019130680828697763, "loss": 2.6613, "step": 5943 }, { "epoch": 0.16, "learning_rate": 0.0019130325842052476, "loss": 2.5311, "step": 5944 }, { "epoch": 0.16, "learning_rate": 0.0019129970786237473, "loss": 2.6171, "step": 5945 }, { "epoch": 0.16, "learning_rate": 0.0019129615661255444, "loss": 2.3576, "step": 5946 }, { "epoch": 0.16, "learning_rate": 0.001912926046710908, "loss": 3.0451, "step": 5947 }, { "epoch": 0.16, "learning_rate": 0.001912890520380107, "loss": 2.8793, "step": 5948 }, { "epoch": 0.16, "learning_rate": 0.0019128549871334105, "loss": 2.7872, "step": 5949 }, { "epoch": 0.16, "learning_rate": 0.001912819446971088, "loss": 2.9288, "step": 5950 }, { "epoch": 0.16, "learning_rate": 0.0019127838998934084, "loss": 2.8563, "step": 5951 }, { "epoch": 0.16, "learning_rate": 0.0019127483459006412, "loss": 2.941, "step": 5952 }, { "epoch": 0.16, "learning_rate": 0.0019127127849930558, "loss": 2.6823, "step": 5953 }, { "epoch": 0.16, "learning_rate": 0.0019126772171709214, "loss": 2.8328, "step": 5954 }, { "epoch": 0.16, "learning_rate": 0.0019126416424345076, "loss": 2.7202, "step": 5955 }, { "epoch": 0.16, "learning_rate": 0.001912606060784084, "loss": 2.5198, "step": 5956 }, { "epoch": 0.16, "learning_rate": 0.00191257047221992, "loss": 2.5863, "step": 5957 }, { "epoch": 0.16, "learning_rate": 0.0019125348767422851, "loss": 2.5854, "step": 5958 }, { "epoch": 0.16, "learning_rate": 0.0019124992743514496, "loss": 2.7042, "step": 5959 }, { "epoch": 0.16, "learning_rate": 0.0019124636650476822, "loss": 2.6861, "step": 5960 }, { "epoch": 0.16, "learning_rate": 0.0019124280488312534, "loss": 2.7926, "step": 5961 }, { "epoch": 0.16, "learning_rate": 0.0019123924257024327, "loss": 3.0485, "step": 5962 }, { "epoch": 0.16, "learning_rate": 0.0019123567956614903, "loss": 2.9484, "step": 5963 }, { "epoch": 0.16, "learning_rate": 0.001912321158708696, "loss": 2.8772, "step": 5964 }, { "epoch": 0.16, "learning_rate": 0.0019122855148443194, "loss": 2.8065, "step": 5965 }, { "epoch": 0.16, "learning_rate": 0.001912249864068631, "loss": 2.5801, "step": 5966 }, { "epoch": 0.16, "learning_rate": 0.0019122142063819005, "loss": 2.8945, "step": 5967 }, { "epoch": 0.16, "learning_rate": 0.0019121785417843986, "loss": 2.615, "step": 5968 }, { "epoch": 0.16, "learning_rate": 0.0019121428702763951, "loss": 3.0044, "step": 5969 }, { "epoch": 0.16, "learning_rate": 0.0019121071918581603, "loss": 2.434, "step": 5970 }, { "epoch": 0.16, "learning_rate": 0.0019120715065299642, "loss": 2.5699, "step": 5971 }, { "epoch": 0.16, "learning_rate": 0.0019120358142920776, "loss": 2.6089, "step": 5972 }, { "epoch": 0.16, "learning_rate": 0.001912000115144771, "loss": 2.7594, "step": 5973 }, { "epoch": 0.16, "learning_rate": 0.0019119644090883142, "loss": 2.698, "step": 5974 }, { "epoch": 0.16, "learning_rate": 0.0019119286961229785, "loss": 2.6499, "step": 5975 }, { "epoch": 0.16, "learning_rate": 0.0019118929762490335, "loss": 2.3781, "step": 5976 }, { "epoch": 0.16, "learning_rate": 0.0019118572494667507, "loss": 2.6076, "step": 5977 }, { "epoch": 0.16, "learning_rate": 0.0019118215157764003, "loss": 2.3937, "step": 5978 }, { "epoch": 0.16, "learning_rate": 0.0019117857751782532, "loss": 2.6384, "step": 5979 }, { "epoch": 0.16, "learning_rate": 0.00191175002767258, "loss": 2.7477, "step": 5980 }, { "epoch": 0.16, "learning_rate": 0.0019117142732596516, "loss": 2.2457, "step": 5981 }, { "epoch": 0.16, "learning_rate": 0.0019116785119397389, "loss": 2.6867, "step": 5982 }, { "epoch": 0.16, "learning_rate": 0.0019116427437131124, "loss": 2.584, "step": 5983 }, { "epoch": 0.16, "learning_rate": 0.0019116069685800442, "loss": 2.3275, "step": 5984 }, { "epoch": 0.16, "learning_rate": 0.001911571186540804, "loss": 2.9866, "step": 5985 }, { "epoch": 0.16, "learning_rate": 0.0019115353975956637, "loss": 2.396, "step": 5986 }, { "epoch": 0.16, "learning_rate": 0.001911499601744894, "loss": 2.8883, "step": 5987 }, { "epoch": 0.16, "learning_rate": 0.0019114637989887666, "loss": 2.8741, "step": 5988 }, { "epoch": 0.16, "learning_rate": 0.0019114279893275522, "loss": 3.0132, "step": 5989 }, { "epoch": 0.16, "learning_rate": 0.0019113921727615221, "loss": 2.9606, "step": 5990 }, { "epoch": 0.16, "learning_rate": 0.0019113563492909483, "loss": 2.5529, "step": 5991 }, { "epoch": 0.16, "learning_rate": 0.0019113205189161015, "loss": 3.2312, "step": 5992 }, { "epoch": 0.16, "learning_rate": 0.0019112846816372537, "loss": 3.3321, "step": 5993 }, { "epoch": 0.16, "learning_rate": 0.0019112488374546754, "loss": 2.6986, "step": 5994 }, { "epoch": 0.16, "learning_rate": 0.0019112129863686391, "loss": 3.0046, "step": 5995 }, { "epoch": 0.16, "learning_rate": 0.0019111771283794163, "loss": 2.227, "step": 5996 }, { "epoch": 0.16, "learning_rate": 0.0019111412634872785, "loss": 2.6273, "step": 5997 }, { "epoch": 0.16, "learning_rate": 0.0019111053916924972, "loss": 3.0131, "step": 5998 }, { "epoch": 0.16, "learning_rate": 0.0019110695129953446, "loss": 2.8789, "step": 5999 }, { "epoch": 0.16, "learning_rate": 0.0019110336273960922, "loss": 2.3182, "step": 6000 }, { "epoch": 0.16, "learning_rate": 0.0019109977348950116, "loss": 2.4837, "step": 6001 }, { "epoch": 0.16, "learning_rate": 0.0019109618354923752, "loss": 2.6684, "step": 6002 }, { "epoch": 0.16, "learning_rate": 0.0019109259291884549, "loss": 2.358, "step": 6003 }, { "epoch": 0.16, "learning_rate": 0.0019108900159835226, "loss": 2.6432, "step": 6004 }, { "epoch": 0.16, "learning_rate": 0.0019108540958778502, "loss": 2.6063, "step": 6005 }, { "epoch": 0.16, "learning_rate": 0.0019108181688717103, "loss": 3.0756, "step": 6006 }, { "epoch": 0.16, "learning_rate": 0.0019107822349653746, "loss": 2.715, "step": 6007 }, { "epoch": 0.16, "learning_rate": 0.0019107462941591153, "loss": 2.5703, "step": 6008 }, { "epoch": 0.16, "learning_rate": 0.0019107103464532055, "loss": 2.6732, "step": 6009 }, { "epoch": 0.16, "learning_rate": 0.0019106743918479165, "loss": 2.7183, "step": 6010 }, { "epoch": 0.16, "learning_rate": 0.0019106384303435213, "loss": 2.6844, "step": 6011 }, { "epoch": 0.16, "learning_rate": 0.001910602461940292, "loss": 2.9015, "step": 6012 }, { "epoch": 0.16, "learning_rate": 0.0019105664866385012, "loss": 2.5351, "step": 6013 }, { "epoch": 0.16, "learning_rate": 0.0019105305044384217, "loss": 2.5373, "step": 6014 }, { "epoch": 0.16, "learning_rate": 0.001910494515340326, "loss": 2.6083, "step": 6015 }, { "epoch": 0.16, "learning_rate": 0.0019104585193444863, "loss": 2.6159, "step": 6016 }, { "epoch": 0.16, "learning_rate": 0.0019104225164511756, "loss": 2.5267, "step": 6017 }, { "epoch": 0.16, "learning_rate": 0.0019103865066606672, "loss": 2.8159, "step": 6018 }, { "epoch": 0.16, "learning_rate": 0.0019103504899732329, "loss": 2.854, "step": 6019 }, { "epoch": 0.16, "learning_rate": 0.001910314466389146, "loss": 2.9231, "step": 6020 }, { "epoch": 0.16, "learning_rate": 0.0019102784359086799, "loss": 2.9154, "step": 6021 }, { "epoch": 0.16, "learning_rate": 0.0019102423985321068, "loss": 2.6386, "step": 6022 }, { "epoch": 0.16, "learning_rate": 0.0019102063542597, "loss": 2.4167, "step": 6023 }, { "epoch": 0.16, "learning_rate": 0.0019101703030917326, "loss": 2.8888, "step": 6024 }, { "epoch": 0.16, "learning_rate": 0.0019101342450284777, "loss": 2.808, "step": 6025 }, { "epoch": 0.16, "learning_rate": 0.0019100981800702086, "loss": 2.5894, "step": 6026 }, { "epoch": 0.16, "learning_rate": 0.0019100621082171984, "loss": 2.8623, "step": 6027 }, { "epoch": 0.16, "learning_rate": 0.0019100260294697203, "loss": 2.622, "step": 6028 }, { "epoch": 0.16, "learning_rate": 0.0019099899438280478, "loss": 2.7234, "step": 6029 }, { "epoch": 0.16, "learning_rate": 0.001909953851292454, "loss": 2.5602, "step": 6030 }, { "epoch": 0.16, "learning_rate": 0.0019099177518632127, "loss": 3.1538, "step": 6031 }, { "epoch": 0.16, "learning_rate": 0.0019098816455405969, "loss": 2.6412, "step": 6032 }, { "epoch": 0.16, "learning_rate": 0.0019098455323248809, "loss": 2.833, "step": 6033 }, { "epoch": 0.16, "learning_rate": 0.0019098094122163374, "loss": 2.7651, "step": 6034 }, { "epoch": 0.16, "learning_rate": 0.0019097732852152408, "loss": 2.8744, "step": 6035 }, { "epoch": 0.16, "learning_rate": 0.001909737151321864, "loss": 2.2533, "step": 6036 }, { "epoch": 0.16, "learning_rate": 0.0019097010105364814, "loss": 2.6594, "step": 6037 }, { "epoch": 0.16, "learning_rate": 0.0019096648628593666, "loss": 2.77, "step": 6038 }, { "epoch": 0.16, "learning_rate": 0.0019096287082907932, "loss": 2.7229, "step": 6039 }, { "epoch": 0.16, "learning_rate": 0.0019095925468310359, "loss": 2.2999, "step": 6040 }, { "epoch": 0.16, "learning_rate": 0.0019095563784803675, "loss": 2.9639, "step": 6041 }, { "epoch": 0.16, "learning_rate": 0.001909520203239063, "loss": 2.6407, "step": 6042 }, { "epoch": 0.16, "learning_rate": 0.001909484021107396, "loss": 2.92, "step": 6043 }, { "epoch": 0.16, "learning_rate": 0.0019094478320856403, "loss": 2.7783, "step": 6044 }, { "epoch": 0.16, "learning_rate": 0.0019094116361740709, "loss": 2.7273, "step": 6045 }, { "epoch": 0.16, "learning_rate": 0.0019093754333729608, "loss": 2.5758, "step": 6046 }, { "epoch": 0.16, "learning_rate": 0.001909339223682586, "loss": 2.6405, "step": 6047 }, { "epoch": 0.16, "learning_rate": 0.0019093030071032188, "loss": 2.7549, "step": 6048 }, { "epoch": 0.16, "learning_rate": 0.0019092667836351355, "loss": 2.3418, "step": 6049 }, { "epoch": 0.16, "learning_rate": 0.0019092305532786092, "loss": 2.2836, "step": 6050 }, { "epoch": 0.16, "learning_rate": 0.0019091943160339147, "loss": 2.9169, "step": 6051 }, { "epoch": 0.16, "learning_rate": 0.0019091580719013267, "loss": 2.8445, "step": 6052 }, { "epoch": 0.16, "learning_rate": 0.0019091218208811195, "loss": 2.3503, "step": 6053 }, { "epoch": 0.16, "learning_rate": 0.0019090855629735682, "loss": 2.8049, "step": 6054 }, { "epoch": 0.16, "learning_rate": 0.0019090492981789471, "loss": 2.2606, "step": 6055 }, { "epoch": 0.16, "learning_rate": 0.0019090130264975312, "loss": 2.5792, "step": 6056 }, { "epoch": 0.16, "learning_rate": 0.0019089767479295947, "loss": 2.7532, "step": 6057 }, { "epoch": 0.16, "learning_rate": 0.0019089404624754135, "loss": 2.814, "step": 6058 }, { "epoch": 0.16, "learning_rate": 0.0019089041701352612, "loss": 2.4597, "step": 6059 }, { "epoch": 0.16, "learning_rate": 0.0019088678709094139, "loss": 2.5057, "step": 6060 }, { "epoch": 0.16, "learning_rate": 0.0019088315647981457, "loss": 2.801, "step": 6061 }, { "epoch": 0.16, "learning_rate": 0.0019087952518017325, "loss": 2.6591, "step": 6062 }, { "epoch": 0.16, "learning_rate": 0.0019087589319204486, "loss": 3.1612, "step": 6063 }, { "epoch": 0.16, "learning_rate": 0.0019087226051545695, "loss": 3.1744, "step": 6064 }, { "epoch": 0.16, "learning_rate": 0.0019086862715043706, "loss": 2.4679, "step": 6065 }, { "epoch": 0.16, "learning_rate": 0.0019086499309701268, "loss": 2.4923, "step": 6066 }, { "epoch": 0.16, "learning_rate": 0.0019086135835521137, "loss": 2.7326, "step": 6067 }, { "epoch": 0.16, "learning_rate": 0.0019085772292506062, "loss": 2.8131, "step": 6068 }, { "epoch": 0.16, "learning_rate": 0.0019085408680658805, "loss": 2.7664, "step": 6069 }, { "epoch": 0.16, "learning_rate": 0.0019085044999982116, "loss": 3.0297, "step": 6070 }, { "epoch": 0.16, "learning_rate": 0.0019084681250478748, "loss": 2.5865, "step": 6071 }, { "epoch": 0.16, "learning_rate": 0.001908431743215146, "loss": 2.3591, "step": 6072 }, { "epoch": 0.16, "learning_rate": 0.0019083953545003009, "loss": 2.4754, "step": 6073 }, { "epoch": 0.16, "learning_rate": 0.0019083589589036145, "loss": 2.6081, "step": 6074 }, { "epoch": 0.16, "learning_rate": 0.0019083225564253635, "loss": 2.6763, "step": 6075 }, { "epoch": 0.16, "learning_rate": 0.001908286147065823, "loss": 2.6068, "step": 6076 }, { "epoch": 0.16, "learning_rate": 0.001908249730825269, "loss": 2.8288, "step": 6077 }, { "epoch": 0.16, "learning_rate": 0.0019082133077039777, "loss": 2.6637, "step": 6078 }, { "epoch": 0.16, "learning_rate": 0.0019081768777022244, "loss": 3.1307, "step": 6079 }, { "epoch": 0.16, "learning_rate": 0.0019081404408202857, "loss": 2.777, "step": 6080 }, { "epoch": 0.16, "learning_rate": 0.0019081039970584373, "loss": 2.6064, "step": 6081 }, { "epoch": 0.16, "learning_rate": 0.0019080675464169551, "loss": 2.6763, "step": 6082 }, { "epoch": 0.16, "learning_rate": 0.001908031088896116, "loss": 2.4454, "step": 6083 }, { "epoch": 0.16, "learning_rate": 0.0019079946244961955, "loss": 2.6245, "step": 6084 }, { "epoch": 0.16, "learning_rate": 0.00190795815321747, "loss": 2.7961, "step": 6085 }, { "epoch": 0.16, "learning_rate": 0.0019079216750602158, "loss": 3.216, "step": 6086 }, { "epoch": 0.16, "learning_rate": 0.0019078851900247093, "loss": 2.7461, "step": 6087 }, { "epoch": 0.16, "learning_rate": 0.001907848698111227, "loss": 2.5796, "step": 6088 }, { "epoch": 0.16, "learning_rate": 0.0019078121993200455, "loss": 2.588, "step": 6089 }, { "epoch": 0.16, "learning_rate": 0.0019077756936514408, "loss": 2.6085, "step": 6090 }, { "epoch": 0.16, "learning_rate": 0.00190773918110569, "loss": 3.0722, "step": 6091 }, { "epoch": 0.16, "learning_rate": 0.001907702661683069, "loss": 3.0689, "step": 6092 }, { "epoch": 0.16, "learning_rate": 0.001907666135383855, "loss": 2.8735, "step": 6093 }, { "epoch": 0.16, "learning_rate": 0.001907629602208325, "loss": 2.7426, "step": 6094 }, { "epoch": 0.16, "learning_rate": 0.0019075930621567552, "loss": 2.9539, "step": 6095 }, { "epoch": 0.16, "learning_rate": 0.0019075565152294228, "loss": 2.7931, "step": 6096 }, { "epoch": 0.16, "learning_rate": 0.0019075199614266042, "loss": 2.4208, "step": 6097 }, { "epoch": 0.16, "learning_rate": 0.0019074834007485769, "loss": 2.2976, "step": 6098 }, { "epoch": 0.16, "learning_rate": 0.0019074468331956175, "loss": 2.9086, "step": 6099 }, { "epoch": 0.16, "learning_rate": 0.0019074102587680031, "loss": 3.1187, "step": 6100 }, { "epoch": 0.16, "learning_rate": 0.0019073736774660106, "loss": 2.7157, "step": 6101 }, { "epoch": 0.16, "learning_rate": 0.0019073370892899177, "loss": 2.7234, "step": 6102 }, { "epoch": 0.16, "learning_rate": 0.001907300494240001, "loss": 2.6206, "step": 6103 }, { "epoch": 0.16, "learning_rate": 0.001907263892316538, "loss": 2.6753, "step": 6104 }, { "epoch": 0.16, "learning_rate": 0.0019072272835198062, "loss": 2.4647, "step": 6105 }, { "epoch": 0.16, "learning_rate": 0.0019071906678500823, "loss": 2.6056, "step": 6106 }, { "epoch": 0.16, "learning_rate": 0.0019071540453076442, "loss": 2.349, "step": 6107 }, { "epoch": 0.16, "learning_rate": 0.0019071174158927693, "loss": 2.5039, "step": 6108 }, { "epoch": 0.16, "learning_rate": 0.0019070807796057352, "loss": 2.3846, "step": 6109 }, { "epoch": 0.16, "learning_rate": 0.0019070441364468192, "loss": 2.9175, "step": 6110 }, { "epoch": 0.16, "learning_rate": 0.0019070074864162988, "loss": 2.5853, "step": 6111 }, { "epoch": 0.16, "learning_rate": 0.001906970829514452, "loss": 2.6003, "step": 6112 }, { "epoch": 0.16, "learning_rate": 0.0019069341657415562, "loss": 2.5698, "step": 6113 }, { "epoch": 0.16, "learning_rate": 0.0019068974950978894, "loss": 2.5111, "step": 6114 }, { "epoch": 0.16, "learning_rate": 0.0019068608175837295, "loss": 2.592, "step": 6115 }, { "epoch": 0.16, "learning_rate": 0.0019068241331993538, "loss": 2.5858, "step": 6116 }, { "epoch": 0.16, "learning_rate": 0.0019067874419450407, "loss": 2.4331, "step": 6117 }, { "epoch": 0.16, "learning_rate": 0.0019067507438210683, "loss": 2.5911, "step": 6118 }, { "epoch": 0.16, "learning_rate": 0.0019067140388277142, "loss": 2.8502, "step": 6119 }, { "epoch": 0.16, "learning_rate": 0.0019066773269652568, "loss": 2.8757, "step": 6120 }, { "epoch": 0.16, "learning_rate": 0.0019066406082339738, "loss": 2.9979, "step": 6121 }, { "epoch": 0.16, "learning_rate": 0.001906603882634144, "loss": 2.9782, "step": 6122 }, { "epoch": 0.16, "learning_rate": 0.0019065671501660448, "loss": 2.4541, "step": 6123 }, { "epoch": 0.16, "learning_rate": 0.0019065304108299556, "loss": 2.3144, "step": 6124 }, { "epoch": 0.16, "learning_rate": 0.0019064936646261536, "loss": 2.6744, "step": 6125 }, { "epoch": 0.16, "learning_rate": 0.0019064569115549174, "loss": 2.424, "step": 6126 }, { "epoch": 0.16, "learning_rate": 0.0019064201516165262, "loss": 2.8343, "step": 6127 }, { "epoch": 0.16, "learning_rate": 0.001906383384811258, "loss": 2.5395, "step": 6128 }, { "epoch": 0.16, "learning_rate": 0.001906346611139391, "loss": 2.5847, "step": 6129 }, { "epoch": 0.16, "learning_rate": 0.0019063098306012043, "loss": 2.5886, "step": 6130 }, { "epoch": 0.16, "learning_rate": 0.0019062730431969764, "loss": 2.736, "step": 6131 }, { "epoch": 0.16, "learning_rate": 0.0019062362489269857, "loss": 2.7677, "step": 6132 }, { "epoch": 0.16, "learning_rate": 0.0019061994477915115, "loss": 2.5921, "step": 6133 }, { "epoch": 0.16, "learning_rate": 0.001906162639790832, "loss": 2.2403, "step": 6134 }, { "epoch": 0.16, "learning_rate": 0.0019061258249252267, "loss": 2.5864, "step": 6135 }, { "epoch": 0.16, "learning_rate": 0.0019060890031949737, "loss": 2.9267, "step": 6136 }, { "epoch": 0.16, "learning_rate": 0.001906052174600353, "loss": 2.5568, "step": 6137 }, { "epoch": 0.16, "learning_rate": 0.0019060153391416426, "loss": 2.6449, "step": 6138 }, { "epoch": 0.16, "learning_rate": 0.001905978496819122, "loss": 2.5304, "step": 6139 }, { "epoch": 0.17, "learning_rate": 0.0019059416476330704, "loss": 2.366, "step": 6140 }, { "epoch": 0.17, "learning_rate": 0.0019059047915837666, "loss": 3.0973, "step": 6141 }, { "epoch": 0.17, "learning_rate": 0.0019058679286714903, "loss": 3.0937, "step": 6142 }, { "epoch": 0.17, "learning_rate": 0.0019058310588965207, "loss": 2.8358, "step": 6143 }, { "epoch": 0.17, "learning_rate": 0.0019057941822591365, "loss": 2.9836, "step": 6144 }, { "epoch": 0.17, "learning_rate": 0.0019057572987596179, "loss": 2.616, "step": 6145 }, { "epoch": 0.17, "learning_rate": 0.001905720408398244, "loss": 2.683, "step": 6146 }, { "epoch": 0.17, "learning_rate": 0.0019056835111752937, "loss": 2.7771, "step": 6147 }, { "epoch": 0.17, "learning_rate": 0.0019056466070910471, "loss": 2.7955, "step": 6148 }, { "epoch": 0.17, "learning_rate": 0.0019056096961457842, "loss": 2.8221, "step": 6149 }, { "epoch": 0.17, "learning_rate": 0.001905572778339784, "loss": 2.5822, "step": 6150 }, { "epoch": 0.17, "learning_rate": 0.0019055358536733261, "loss": 2.488, "step": 6151 }, { "epoch": 0.17, "learning_rate": 0.0019054989221466906, "loss": 2.7696, "step": 6152 }, { "epoch": 0.17, "learning_rate": 0.0019054619837601573, "loss": 2.7868, "step": 6153 }, { "epoch": 0.17, "learning_rate": 0.0019054250385140054, "loss": 3.1953, "step": 6154 }, { "epoch": 0.17, "learning_rate": 0.0019053880864085158, "loss": 2.8898, "step": 6155 }, { "epoch": 0.17, "learning_rate": 0.001905351127443968, "loss": 2.993, "step": 6156 }, { "epoch": 0.17, "learning_rate": 0.0019053141616206415, "loss": 2.8613, "step": 6157 }, { "epoch": 0.17, "learning_rate": 0.001905277188938817, "loss": 2.5704, "step": 6158 }, { "epoch": 0.17, "learning_rate": 0.0019052402093987742, "loss": 2.8718, "step": 6159 }, { "epoch": 0.17, "learning_rate": 0.0019052032230007937, "loss": 2.8266, "step": 6160 }, { "epoch": 0.17, "learning_rate": 0.001905166229745155, "loss": 2.9151, "step": 6161 }, { "epoch": 0.17, "learning_rate": 0.0019051292296321392, "loss": 2.8152, "step": 6162 }, { "epoch": 0.17, "learning_rate": 0.001905092222662026, "loss": 2.8814, "step": 6163 }, { "epoch": 0.17, "learning_rate": 0.0019050552088350958, "loss": 2.4516, "step": 6164 }, { "epoch": 0.17, "learning_rate": 0.0019050181881516291, "loss": 2.6744, "step": 6165 }, { "epoch": 0.17, "learning_rate": 0.0019049811606119068, "loss": 2.7663, "step": 6166 }, { "epoch": 0.17, "learning_rate": 0.0019049441262162087, "loss": 2.5712, "step": 6167 }, { "epoch": 0.17, "learning_rate": 0.0019049070849648157, "loss": 2.4852, "step": 6168 }, { "epoch": 0.17, "learning_rate": 0.0019048700368580085, "loss": 2.6153, "step": 6169 }, { "epoch": 0.17, "learning_rate": 0.0019048329818960679, "loss": 3.0482, "step": 6170 }, { "epoch": 0.17, "learning_rate": 0.0019047959200792742, "loss": 2.6247, "step": 6171 }, { "epoch": 0.17, "learning_rate": 0.0019047588514079083, "loss": 2.8594, "step": 6172 }, { "epoch": 0.17, "learning_rate": 0.001904721775882251, "loss": 2.5496, "step": 6173 }, { "epoch": 0.17, "learning_rate": 0.0019046846935025835, "loss": 2.8358, "step": 6174 }, { "epoch": 0.17, "learning_rate": 0.0019046476042691865, "loss": 2.8264, "step": 6175 }, { "epoch": 0.17, "learning_rate": 0.0019046105081823405, "loss": 2.4355, "step": 6176 }, { "epoch": 0.17, "learning_rate": 0.0019045734052423279, "loss": 3.1158, "step": 6177 }, { "epoch": 0.17, "learning_rate": 0.0019045362954494282, "loss": 2.7766, "step": 6178 }, { "epoch": 0.17, "learning_rate": 0.0019044991788039235, "loss": 2.5742, "step": 6179 }, { "epoch": 0.17, "learning_rate": 0.0019044620553060946, "loss": 2.3347, "step": 6180 }, { "epoch": 0.17, "learning_rate": 0.001904424924956223, "loss": 2.7795, "step": 6181 }, { "epoch": 0.17, "learning_rate": 0.0019043877877545899, "loss": 2.5879, "step": 6182 }, { "epoch": 0.17, "learning_rate": 0.0019043506437014766, "loss": 3.09, "step": 6183 }, { "epoch": 0.17, "learning_rate": 0.0019043134927971643, "loss": 2.6043, "step": 6184 }, { "epoch": 0.17, "learning_rate": 0.001904276335041935, "loss": 2.0366, "step": 6185 }, { "epoch": 0.17, "learning_rate": 0.0019042391704360696, "loss": 2.589, "step": 6186 }, { "epoch": 0.17, "learning_rate": 0.0019042019989798501, "loss": 2.797, "step": 6187 }, { "epoch": 0.17, "learning_rate": 0.0019041648206735576, "loss": 2.7038, "step": 6188 }, { "epoch": 0.17, "learning_rate": 0.0019041276355174742, "loss": 3.0143, "step": 6189 }, { "epoch": 0.17, "learning_rate": 0.0019040904435118815, "loss": 2.8124, "step": 6190 }, { "epoch": 0.17, "learning_rate": 0.0019040532446570613, "loss": 2.693, "step": 6191 }, { "epoch": 0.17, "learning_rate": 0.0019040160389532951, "loss": 2.8191, "step": 6192 }, { "epoch": 0.17, "learning_rate": 0.0019039788264008655, "loss": 2.6325, "step": 6193 }, { "epoch": 0.17, "learning_rate": 0.0019039416070000534, "loss": 2.7956, "step": 6194 }, { "epoch": 0.17, "learning_rate": 0.0019039043807511419, "loss": 2.8487, "step": 6195 }, { "epoch": 0.17, "learning_rate": 0.0019038671476544118, "loss": 2.6498, "step": 6196 }, { "epoch": 0.17, "learning_rate": 0.001903829907710146, "loss": 2.478, "step": 6197 }, { "epoch": 0.17, "learning_rate": 0.0019037926609186268, "loss": 3.0501, "step": 6198 }, { "epoch": 0.17, "learning_rate": 0.0019037554072801352, "loss": 2.3674, "step": 6199 }, { "epoch": 0.17, "learning_rate": 0.0019037181467949549, "loss": 2.5568, "step": 6200 }, { "epoch": 0.17, "learning_rate": 0.0019036808794633672, "loss": 2.6864, "step": 6201 }, { "epoch": 0.17, "learning_rate": 0.0019036436052856547, "loss": 2.4236, "step": 6202 }, { "epoch": 0.17, "learning_rate": 0.0019036063242620998, "loss": 2.5903, "step": 6203 }, { "epoch": 0.17, "learning_rate": 0.0019035690363929851, "loss": 2.7129, "step": 6204 }, { "epoch": 0.17, "learning_rate": 0.0019035317416785929, "loss": 2.499, "step": 6205 }, { "epoch": 0.17, "learning_rate": 0.0019034944401192056, "loss": 2.7604, "step": 6206 }, { "epoch": 0.17, "learning_rate": 0.001903457131715106, "loss": 2.7195, "step": 6207 }, { "epoch": 0.17, "learning_rate": 0.0019034198164665768, "loss": 2.6579, "step": 6208 }, { "epoch": 0.17, "learning_rate": 0.0019033824943739007, "loss": 2.6279, "step": 6209 }, { "epoch": 0.17, "learning_rate": 0.0019033451654373599, "loss": 2.8872, "step": 6210 }, { "epoch": 0.17, "learning_rate": 0.001903307829657238, "loss": 3.092, "step": 6211 }, { "epoch": 0.17, "learning_rate": 0.0019032704870338172, "loss": 3.0648, "step": 6212 }, { "epoch": 0.17, "learning_rate": 0.0019032331375673807, "loss": 2.5782, "step": 6213 }, { "epoch": 0.17, "learning_rate": 0.0019031957812582117, "loss": 2.7546, "step": 6214 }, { "epoch": 0.17, "learning_rate": 0.0019031584181065928, "loss": 2.6271, "step": 6215 }, { "epoch": 0.17, "learning_rate": 0.0019031210481128072, "loss": 2.8214, "step": 6216 }, { "epoch": 0.17, "learning_rate": 0.001903083671277138, "loss": 2.7563, "step": 6217 }, { "epoch": 0.17, "learning_rate": 0.0019030462875998684, "loss": 2.4532, "step": 6218 }, { "epoch": 0.17, "learning_rate": 0.0019030088970812815, "loss": 2.5686, "step": 6219 }, { "epoch": 0.17, "learning_rate": 0.0019029714997216608, "loss": 2.6157, "step": 6220 }, { "epoch": 0.17, "learning_rate": 0.0019029340955212892, "loss": 2.5405, "step": 6221 }, { "epoch": 0.17, "learning_rate": 0.0019028966844804505, "loss": 2.4024, "step": 6222 }, { "epoch": 0.17, "learning_rate": 0.0019028592665994277, "loss": 2.6674, "step": 6223 }, { "epoch": 0.17, "learning_rate": 0.0019028218418785051, "loss": 2.5767, "step": 6224 }, { "epoch": 0.17, "learning_rate": 0.001902784410317965, "loss": 3.0974, "step": 6225 }, { "epoch": 0.17, "learning_rate": 0.0019027469719180919, "loss": 3.1069, "step": 6226 }, { "epoch": 0.17, "learning_rate": 0.001902709526679169, "loss": 2.771, "step": 6227 }, { "epoch": 0.17, "learning_rate": 0.0019026720746014804, "loss": 2.4437, "step": 6228 }, { "epoch": 0.17, "learning_rate": 0.0019026346156853094, "loss": 2.416, "step": 6229 }, { "epoch": 0.17, "learning_rate": 0.0019025971499309399, "loss": 2.8377, "step": 6230 }, { "epoch": 0.17, "learning_rate": 0.0019025596773386555, "loss": 2.6011, "step": 6231 }, { "epoch": 0.17, "learning_rate": 0.0019025221979087409, "loss": 2.4889, "step": 6232 }, { "epoch": 0.17, "learning_rate": 0.001902484711641479, "loss": 2.7783, "step": 6233 }, { "epoch": 0.17, "learning_rate": 0.0019024472185371543, "loss": 2.2835, "step": 6234 }, { "epoch": 0.17, "learning_rate": 0.0019024097185960512, "loss": 2.4072, "step": 6235 }, { "epoch": 0.17, "learning_rate": 0.001902372211818453, "loss": 2.447, "step": 6236 }, { "epoch": 0.17, "learning_rate": 0.0019023346982046446, "loss": 2.6932, "step": 6237 }, { "epoch": 0.17, "learning_rate": 0.0019022971777549094, "loss": 2.6846, "step": 6238 }, { "epoch": 0.17, "learning_rate": 0.0019022596504695325, "loss": 2.164, "step": 6239 }, { "epoch": 0.17, "learning_rate": 0.0019022221163487976, "loss": 2.5829, "step": 6240 }, { "epoch": 0.17, "learning_rate": 0.0019021845753929895, "loss": 2.8542, "step": 6241 }, { "epoch": 0.17, "learning_rate": 0.001902147027602392, "loss": 3.0483, "step": 6242 }, { "epoch": 0.17, "learning_rate": 0.00190210947297729, "loss": 2.6301, "step": 6243 }, { "epoch": 0.17, "learning_rate": 0.001902071911517968, "loss": 2.7486, "step": 6244 }, { "epoch": 0.17, "learning_rate": 0.0019020343432247105, "loss": 2.3123, "step": 6245 }, { "epoch": 0.17, "learning_rate": 0.0019019967680978021, "loss": 2.7878, "step": 6246 }, { "epoch": 0.17, "learning_rate": 0.0019019591861375274, "loss": 2.8218, "step": 6247 }, { "epoch": 0.17, "learning_rate": 0.001901921597344171, "loss": 2.3628, "step": 6248 }, { "epoch": 0.17, "learning_rate": 0.001901884001718018, "loss": 2.256, "step": 6249 }, { "epoch": 0.17, "learning_rate": 0.001901846399259353, "loss": 3.0754, "step": 6250 }, { "epoch": 0.17, "learning_rate": 0.001901808789968461, "loss": 2.6704, "step": 6251 }, { "epoch": 0.17, "learning_rate": 0.001901771173845627, "loss": 2.5911, "step": 6252 }, { "epoch": 0.17, "learning_rate": 0.0019017335508911353, "loss": 2.8494, "step": 6253 }, { "epoch": 0.17, "learning_rate": 0.0019016959211052718, "loss": 3.0661, "step": 6254 }, { "epoch": 0.17, "learning_rate": 0.0019016582844883212, "loss": 2.7527, "step": 6255 }, { "epoch": 0.17, "learning_rate": 0.0019016206410405686, "loss": 2.9121, "step": 6256 }, { "epoch": 0.17, "learning_rate": 0.001901582990762299, "loss": 2.5854, "step": 6257 }, { "epoch": 0.17, "learning_rate": 0.001901545333653798, "loss": 2.805, "step": 6258 }, { "epoch": 0.17, "learning_rate": 0.0019015076697153509, "loss": 2.7768, "step": 6259 }, { "epoch": 0.17, "learning_rate": 0.0019014699989472427, "loss": 2.5676, "step": 6260 }, { "epoch": 0.17, "learning_rate": 0.001901432321349759, "loss": 2.7666, "step": 6261 }, { "epoch": 0.17, "learning_rate": 0.0019013946369231852, "loss": 2.8757, "step": 6262 }, { "epoch": 0.17, "learning_rate": 0.0019013569456678065, "loss": 2.5246, "step": 6263 }, { "epoch": 0.17, "learning_rate": 0.0019013192475839092, "loss": 2.7399, "step": 6264 }, { "epoch": 0.17, "learning_rate": 0.0019012815426717783, "loss": 2.0803, "step": 6265 }, { "epoch": 0.17, "learning_rate": 0.0019012438309316995, "loss": 2.9147, "step": 6266 }, { "epoch": 0.17, "learning_rate": 0.0019012061123639583, "loss": 2.56, "step": 6267 }, { "epoch": 0.17, "learning_rate": 0.0019011683869688413, "loss": 2.3887, "step": 6268 }, { "epoch": 0.17, "learning_rate": 0.0019011306547466332, "loss": 2.896, "step": 6269 }, { "epoch": 0.17, "learning_rate": 0.0019010929156976204, "loss": 2.5883, "step": 6270 }, { "epoch": 0.17, "learning_rate": 0.0019010551698220891, "loss": 2.539, "step": 6271 }, { "epoch": 0.17, "learning_rate": 0.0019010174171203245, "loss": 2.7849, "step": 6272 }, { "epoch": 0.17, "learning_rate": 0.0019009796575926133, "loss": 2.9057, "step": 6273 }, { "epoch": 0.17, "learning_rate": 0.0019009418912392412, "loss": 2.6338, "step": 6274 }, { "epoch": 0.17, "learning_rate": 0.0019009041180604947, "loss": 2.3403, "step": 6275 }, { "epoch": 0.17, "learning_rate": 0.0019008663380566592, "loss": 2.418, "step": 6276 }, { "epoch": 0.17, "learning_rate": 0.0019008285512280216, "loss": 2.5167, "step": 6277 }, { "epoch": 0.17, "learning_rate": 0.0019007907575748681, "loss": 2.7096, "step": 6278 }, { "epoch": 0.17, "learning_rate": 0.001900752957097485, "loss": 2.8602, "step": 6279 }, { "epoch": 0.17, "learning_rate": 0.0019007151497961582, "loss": 2.4613, "step": 6280 }, { "epoch": 0.17, "learning_rate": 0.0019006773356711744, "loss": 2.7953, "step": 6281 }, { "epoch": 0.17, "learning_rate": 0.0019006395147228203, "loss": 2.2813, "step": 6282 }, { "epoch": 0.17, "learning_rate": 0.0019006016869513823, "loss": 2.7174, "step": 6283 }, { "epoch": 0.17, "learning_rate": 0.0019005638523571467, "loss": 2.2909, "step": 6284 }, { "epoch": 0.17, "learning_rate": 0.0019005260109404005, "loss": 2.4958, "step": 6285 }, { "epoch": 0.17, "learning_rate": 0.0019004881627014303, "loss": 2.9608, "step": 6286 }, { "epoch": 0.17, "learning_rate": 0.0019004503076405226, "loss": 2.5599, "step": 6287 }, { "epoch": 0.17, "learning_rate": 0.0019004124457579646, "loss": 2.3581, "step": 6288 }, { "epoch": 0.17, "learning_rate": 0.0019003745770540428, "loss": 2.698, "step": 6289 }, { "epoch": 0.17, "learning_rate": 0.0019003367015290441, "loss": 2.6856, "step": 6290 }, { "epoch": 0.17, "learning_rate": 0.0019002988191832554, "loss": 2.5272, "step": 6291 }, { "epoch": 0.17, "learning_rate": 0.0019002609300169642, "loss": 2.998, "step": 6292 }, { "epoch": 0.17, "learning_rate": 0.0019002230340304568, "loss": 2.239, "step": 6293 }, { "epoch": 0.17, "learning_rate": 0.0019001851312240208, "loss": 2.6926, "step": 6294 }, { "epoch": 0.17, "learning_rate": 0.0019001472215979432, "loss": 2.7552, "step": 6295 }, { "epoch": 0.17, "learning_rate": 0.001900109305152511, "loss": 2.2881, "step": 6296 }, { "epoch": 0.17, "learning_rate": 0.0019000713818880118, "loss": 2.3688, "step": 6297 }, { "epoch": 0.17, "learning_rate": 0.0019000334518047327, "loss": 2.9154, "step": 6298 }, { "epoch": 0.17, "learning_rate": 0.0018999955149029608, "loss": 2.8845, "step": 6299 }, { "epoch": 0.17, "learning_rate": 0.0018999575711829842, "loss": 3.2036, "step": 6300 }, { "epoch": 0.17, "learning_rate": 0.0018999196206450897, "loss": 2.2265, "step": 6301 }, { "epoch": 0.17, "learning_rate": 0.0018998816632895652, "loss": 2.541, "step": 6302 }, { "epoch": 0.17, "learning_rate": 0.0018998436991166981, "loss": 2.3523, "step": 6303 }, { "epoch": 0.17, "learning_rate": 0.001899805728126776, "loss": 2.5912, "step": 6304 }, { "epoch": 0.17, "learning_rate": 0.0018997677503200863, "loss": 2.3798, "step": 6305 }, { "epoch": 0.17, "learning_rate": 0.0018997297656969173, "loss": 2.227, "step": 6306 }, { "epoch": 0.17, "learning_rate": 0.0018996917742575563, "loss": 2.7315, "step": 6307 }, { "epoch": 0.17, "learning_rate": 0.0018996537760022913, "loss": 2.6115, "step": 6308 }, { "epoch": 0.17, "learning_rate": 0.0018996157709314102, "loss": 2.6848, "step": 6309 }, { "epoch": 0.17, "learning_rate": 0.0018995777590452008, "loss": 2.8197, "step": 6310 }, { "epoch": 0.17, "learning_rate": 0.0018995397403439509, "loss": 2.7727, "step": 6311 }, { "epoch": 0.17, "learning_rate": 0.0018995017148279493, "loss": 2.8771, "step": 6312 }, { "epoch": 0.17, "learning_rate": 0.0018994636824974831, "loss": 2.7307, "step": 6313 }, { "epoch": 0.17, "learning_rate": 0.001899425643352841, "loss": 2.6777, "step": 6314 }, { "epoch": 0.17, "learning_rate": 0.0018993875973943109, "loss": 2.5042, "step": 6315 }, { "epoch": 0.17, "learning_rate": 0.0018993495446221812, "loss": 2.571, "step": 6316 }, { "epoch": 0.17, "learning_rate": 0.00189931148503674, "loss": 2.5453, "step": 6317 }, { "epoch": 0.17, "learning_rate": 0.001899273418638276, "loss": 2.6603, "step": 6318 }, { "epoch": 0.17, "learning_rate": 0.0018992353454270773, "loss": 2.9272, "step": 6319 }, { "epoch": 0.17, "learning_rate": 0.0018991972654034326, "loss": 2.4112, "step": 6320 }, { "epoch": 0.17, "learning_rate": 0.0018991591785676302, "loss": 2.4569, "step": 6321 }, { "epoch": 0.17, "learning_rate": 0.0018991210849199584, "loss": 2.7511, "step": 6322 }, { "epoch": 0.17, "learning_rate": 0.0018990829844607057, "loss": 2.5827, "step": 6323 }, { "epoch": 0.17, "learning_rate": 0.0018990448771901613, "loss": 2.5761, "step": 6324 }, { "epoch": 0.17, "learning_rate": 0.0018990067631086136, "loss": 2.9881, "step": 6325 }, { "epoch": 0.17, "learning_rate": 0.0018989686422163517, "loss": 2.5689, "step": 6326 }, { "epoch": 0.17, "learning_rate": 0.0018989305145136637, "loss": 2.9571, "step": 6327 }, { "epoch": 0.17, "learning_rate": 0.0018988923800008393, "loss": 2.5916, "step": 6328 }, { "epoch": 0.17, "learning_rate": 0.0018988542386781666, "loss": 2.7117, "step": 6329 }, { "epoch": 0.17, "learning_rate": 0.001898816090545935, "loss": 2.2049, "step": 6330 }, { "epoch": 0.17, "learning_rate": 0.001898777935604433, "loss": 2.6001, "step": 6331 }, { "epoch": 0.17, "learning_rate": 0.0018987397738539507, "loss": 2.7002, "step": 6332 }, { "epoch": 0.17, "learning_rate": 0.0018987016052947761, "loss": 2.9977, "step": 6333 }, { "epoch": 0.17, "learning_rate": 0.0018986634299271987, "loss": 2.4136, "step": 6334 }, { "epoch": 0.17, "learning_rate": 0.0018986252477515082, "loss": 2.4591, "step": 6335 }, { "epoch": 0.17, "learning_rate": 0.0018985870587679935, "loss": 2.5286, "step": 6336 }, { "epoch": 0.17, "learning_rate": 0.0018985488629769437, "loss": 2.4263, "step": 6337 }, { "epoch": 0.17, "learning_rate": 0.0018985106603786482, "loss": 2.4676, "step": 6338 }, { "epoch": 0.17, "learning_rate": 0.0018984724509733969, "loss": 2.611, "step": 6339 }, { "epoch": 0.17, "learning_rate": 0.0018984342347614788, "loss": 2.7527, "step": 6340 }, { "epoch": 0.17, "learning_rate": 0.0018983960117431836, "loss": 2.275, "step": 6341 }, { "epoch": 0.17, "learning_rate": 0.0018983577819188008, "loss": 2.7133, "step": 6342 }, { "epoch": 0.17, "learning_rate": 0.00189831954528862, "loss": 2.7295, "step": 6343 }, { "epoch": 0.17, "learning_rate": 0.001898281301852931, "loss": 2.6446, "step": 6344 }, { "epoch": 0.17, "learning_rate": 0.0018982430516120234, "loss": 2.8672, "step": 6345 }, { "epoch": 0.17, "learning_rate": 0.001898204794566187, "loss": 2.583, "step": 6346 }, { "epoch": 0.17, "learning_rate": 0.0018981665307157118, "loss": 2.5162, "step": 6347 }, { "epoch": 0.17, "learning_rate": 0.0018981282600608875, "loss": 2.6617, "step": 6348 }, { "epoch": 0.17, "learning_rate": 0.0018980899826020043, "loss": 2.5507, "step": 6349 }, { "epoch": 0.17, "learning_rate": 0.0018980516983393514, "loss": 2.5989, "step": 6350 }, { "epoch": 0.17, "learning_rate": 0.0018980134072732198, "loss": 2.8078, "step": 6351 }, { "epoch": 0.17, "learning_rate": 0.001897975109403899, "loss": 2.6796, "step": 6352 }, { "epoch": 0.17, "learning_rate": 0.0018979368047316795, "loss": 2.6783, "step": 6353 }, { "epoch": 0.17, "learning_rate": 0.001897898493256851, "loss": 2.6607, "step": 6354 }, { "epoch": 0.17, "learning_rate": 0.0018978601749797045, "loss": 2.4133, "step": 6355 }, { "epoch": 0.17, "learning_rate": 0.0018978218499005296, "loss": 2.8025, "step": 6356 }, { "epoch": 0.17, "learning_rate": 0.001897783518019617, "loss": 2.6863, "step": 6357 }, { "epoch": 0.17, "learning_rate": 0.0018977451793372566, "loss": 2.5686, "step": 6358 }, { "epoch": 0.17, "learning_rate": 0.0018977068338537394, "loss": 2.6492, "step": 6359 }, { "epoch": 0.17, "learning_rate": 0.001897668481569356, "loss": 2.573, "step": 6360 }, { "epoch": 0.17, "learning_rate": 0.0018976301224843963, "loss": 2.859, "step": 6361 }, { "epoch": 0.17, "learning_rate": 0.001897591756599151, "loss": 2.4384, "step": 6362 }, { "epoch": 0.17, "learning_rate": 0.001897553383913912, "loss": 2.5272, "step": 6363 }, { "epoch": 0.17, "learning_rate": 0.0018975150044289683, "loss": 2.8553, "step": 6364 }, { "epoch": 0.17, "learning_rate": 0.0018974766181446114, "loss": 2.6015, "step": 6365 }, { "epoch": 0.17, "learning_rate": 0.0018974382250611325, "loss": 3.0053, "step": 6366 }, { "epoch": 0.17, "learning_rate": 0.0018973998251788219, "loss": 2.8532, "step": 6367 }, { "epoch": 0.17, "learning_rate": 0.0018973614184979704, "loss": 2.7725, "step": 6368 }, { "epoch": 0.17, "learning_rate": 0.0018973230050188695, "loss": 2.4857, "step": 6369 }, { "epoch": 0.17, "learning_rate": 0.0018972845847418096, "loss": 2.6388, "step": 6370 }, { "epoch": 0.17, "learning_rate": 0.0018972461576670825, "loss": 2.4002, "step": 6371 }, { "epoch": 0.17, "learning_rate": 0.0018972077237949787, "loss": 2.7276, "step": 6372 }, { "epoch": 0.17, "learning_rate": 0.0018971692831257897, "loss": 2.9871, "step": 6373 }, { "epoch": 0.17, "learning_rate": 0.0018971308356598065, "loss": 3.1919, "step": 6374 }, { "epoch": 0.17, "learning_rate": 0.0018970923813973206, "loss": 2.8055, "step": 6375 }, { "epoch": 0.17, "learning_rate": 0.0018970539203386231, "loss": 2.6967, "step": 6376 }, { "epoch": 0.17, "learning_rate": 0.0018970154524840055, "loss": 2.7393, "step": 6377 }, { "epoch": 0.17, "learning_rate": 0.0018969769778337594, "loss": 2.7355, "step": 6378 }, { "epoch": 0.17, "learning_rate": 0.001896938496388176, "loss": 2.8468, "step": 6379 }, { "epoch": 0.17, "learning_rate": 0.0018969000081475466, "loss": 2.6398, "step": 6380 }, { "epoch": 0.17, "learning_rate": 0.0018968615131121633, "loss": 2.0528, "step": 6381 }, { "epoch": 0.17, "learning_rate": 0.0018968230112823177, "loss": 2.4603, "step": 6382 }, { "epoch": 0.17, "learning_rate": 0.0018967845026583012, "loss": 2.4654, "step": 6383 }, { "epoch": 0.17, "learning_rate": 0.0018967459872404056, "loss": 2.5135, "step": 6384 }, { "epoch": 0.17, "learning_rate": 0.0018967074650289226, "loss": 2.4252, "step": 6385 }, { "epoch": 0.17, "learning_rate": 0.0018966689360241443, "loss": 2.6097, "step": 6386 }, { "epoch": 0.17, "learning_rate": 0.0018966304002263623, "loss": 2.4942, "step": 6387 }, { "epoch": 0.17, "learning_rate": 0.001896591857635869, "loss": 2.9529, "step": 6388 }, { "epoch": 0.17, "learning_rate": 0.0018965533082529555, "loss": 3.027, "step": 6389 }, { "epoch": 0.17, "learning_rate": 0.0018965147520779149, "loss": 2.5944, "step": 6390 }, { "epoch": 0.17, "learning_rate": 0.0018964761891110387, "loss": 2.526, "step": 6391 }, { "epoch": 0.17, "learning_rate": 0.0018964376193526195, "loss": 2.5851, "step": 6392 }, { "epoch": 0.17, "learning_rate": 0.0018963990428029487, "loss": 2.6439, "step": 6393 }, { "epoch": 0.17, "learning_rate": 0.0018963604594623192, "loss": 2.569, "step": 6394 }, { "epoch": 0.17, "learning_rate": 0.001896321869331023, "loss": 2.9583, "step": 6395 }, { "epoch": 0.17, "learning_rate": 0.0018962832724093528, "loss": 2.3157, "step": 6396 }, { "epoch": 0.17, "learning_rate": 0.0018962446686976004, "loss": 2.3011, "step": 6397 }, { "epoch": 0.17, "learning_rate": 0.001896206058196059, "loss": 2.8818, "step": 6398 }, { "epoch": 0.17, "learning_rate": 0.0018961674409050206, "loss": 2.5329, "step": 6399 }, { "epoch": 0.17, "learning_rate": 0.0018961288168247777, "loss": 2.6712, "step": 6400 }, { "epoch": 0.17, "learning_rate": 0.0018960901859556235, "loss": 2.3616, "step": 6401 }, { "epoch": 0.17, "learning_rate": 0.0018960515482978498, "loss": 2.7614, "step": 6402 }, { "epoch": 0.17, "learning_rate": 0.0018960129038517503, "loss": 2.5522, "step": 6403 }, { "epoch": 0.17, "learning_rate": 0.0018959742526176164, "loss": 2.5798, "step": 6404 }, { "epoch": 0.17, "learning_rate": 0.0018959355945957425, "loss": 2.9832, "step": 6405 }, { "epoch": 0.17, "learning_rate": 0.0018958969297864204, "loss": 2.7364, "step": 6406 }, { "epoch": 0.17, "learning_rate": 0.0018958582581899434, "loss": 2.7113, "step": 6407 }, { "epoch": 0.17, "learning_rate": 0.0018958195798066044, "loss": 2.7562, "step": 6408 }, { "epoch": 0.17, "learning_rate": 0.0018957808946366967, "loss": 2.5825, "step": 6409 }, { "epoch": 0.17, "learning_rate": 0.0018957422026805127, "loss": 2.8111, "step": 6410 }, { "epoch": 0.17, "learning_rate": 0.0018957035039383458, "loss": 2.6705, "step": 6411 }, { "epoch": 0.17, "learning_rate": 0.0018956647984104899, "loss": 2.728, "step": 6412 }, { "epoch": 0.17, "learning_rate": 0.001895626086097237, "loss": 2.8537, "step": 6413 }, { "epoch": 0.17, "learning_rate": 0.0018955873669988812, "loss": 2.5477, "step": 6414 }, { "epoch": 0.17, "learning_rate": 0.0018955486411157158, "loss": 2.5104, "step": 6415 }, { "epoch": 0.17, "learning_rate": 0.001895509908448034, "loss": 2.5267, "step": 6416 }, { "epoch": 0.17, "learning_rate": 0.0018954711689961289, "loss": 2.8888, "step": 6417 }, { "epoch": 0.17, "learning_rate": 0.0018954324227602945, "loss": 2.4815, "step": 6418 }, { "epoch": 0.17, "learning_rate": 0.0018953936697408242, "loss": 3.0143, "step": 6419 }, { "epoch": 0.17, "learning_rate": 0.0018953549099380114, "loss": 2.5159, "step": 6420 }, { "epoch": 0.17, "learning_rate": 0.0018953161433521502, "loss": 2.7564, "step": 6421 }, { "epoch": 0.17, "learning_rate": 0.0018952773699835337, "loss": 2.906, "step": 6422 }, { "epoch": 0.17, "learning_rate": 0.001895238589832456, "loss": 2.931, "step": 6423 }, { "epoch": 0.17, "learning_rate": 0.0018951998028992106, "loss": 2.4866, "step": 6424 }, { "epoch": 0.17, "learning_rate": 0.0018951610091840919, "loss": 2.9974, "step": 6425 }, { "epoch": 0.17, "learning_rate": 0.001895122208687393, "loss": 2.4021, "step": 6426 }, { "epoch": 0.17, "learning_rate": 0.0018950834014094086, "loss": 2.4927, "step": 6427 }, { "epoch": 0.17, "learning_rate": 0.0018950445873504322, "loss": 2.601, "step": 6428 }, { "epoch": 0.17, "learning_rate": 0.0018950057665107582, "loss": 2.6078, "step": 6429 }, { "epoch": 0.17, "learning_rate": 0.0018949669388906806, "loss": 2.5223, "step": 6430 }, { "epoch": 0.17, "learning_rate": 0.0018949281044904934, "loss": 2.711, "step": 6431 }, { "epoch": 0.17, "learning_rate": 0.0018948892633104907, "loss": 2.4567, "step": 6432 }, { "epoch": 0.17, "learning_rate": 0.001894850415350967, "loss": 2.5942, "step": 6433 }, { "epoch": 0.17, "learning_rate": 0.0018948115606122165, "loss": 2.8986, "step": 6434 }, { "epoch": 0.17, "learning_rate": 0.0018947726990945339, "loss": 2.4471, "step": 6435 }, { "epoch": 0.17, "learning_rate": 0.001894733830798213, "loss": 2.5255, "step": 6436 }, { "epoch": 0.17, "learning_rate": 0.0018946949557235484, "loss": 2.5581, "step": 6437 }, { "epoch": 0.17, "learning_rate": 0.0018946560738708352, "loss": 2.4552, "step": 6438 }, { "epoch": 0.17, "learning_rate": 0.0018946171852403672, "loss": 3.0009, "step": 6439 }, { "epoch": 0.17, "learning_rate": 0.0018945782898324396, "loss": 2.3194, "step": 6440 }, { "epoch": 0.17, "learning_rate": 0.0018945393876473467, "loss": 2.5662, "step": 6441 }, { "epoch": 0.17, "learning_rate": 0.0018945004786853831, "loss": 2.327, "step": 6442 }, { "epoch": 0.17, "learning_rate": 0.001894461562946844, "loss": 2.7069, "step": 6443 }, { "epoch": 0.17, "learning_rate": 0.0018944226404320242, "loss": 2.6818, "step": 6444 }, { "epoch": 0.17, "learning_rate": 0.001894383711141218, "loss": 2.4898, "step": 6445 }, { "epoch": 0.17, "learning_rate": 0.001894344775074721, "loss": 2.3741, "step": 6446 }, { "epoch": 0.17, "learning_rate": 0.0018943058322328278, "loss": 2.5574, "step": 6447 }, { "epoch": 0.17, "learning_rate": 0.0018942668826158336, "loss": 2.2483, "step": 6448 }, { "epoch": 0.17, "learning_rate": 0.001894227926224033, "loss": 2.6627, "step": 6449 }, { "epoch": 0.17, "learning_rate": 0.001894188963057722, "loss": 2.4562, "step": 6450 }, { "epoch": 0.17, "learning_rate": 0.001894149993117195, "loss": 2.786, "step": 6451 }, { "epoch": 0.17, "learning_rate": 0.0018941110164027478, "loss": 2.68, "step": 6452 }, { "epoch": 0.17, "learning_rate": 0.001894072032914675, "loss": 2.7685, "step": 6453 }, { "epoch": 0.17, "learning_rate": 0.0018940330426532725, "loss": 2.8238, "step": 6454 }, { "epoch": 0.17, "learning_rate": 0.0018939940456188353, "loss": 2.7986, "step": 6455 }, { "epoch": 0.17, "learning_rate": 0.0018939550418116593, "loss": 2.5403, "step": 6456 }, { "epoch": 0.17, "learning_rate": 0.0018939160312320396, "loss": 2.653, "step": 6457 }, { "epoch": 0.17, "learning_rate": 0.001893877013880272, "loss": 2.746, "step": 6458 }, { "epoch": 0.17, "learning_rate": 0.0018938379897566518, "loss": 2.3881, "step": 6459 }, { "epoch": 0.17, "learning_rate": 0.001893798958861475, "loss": 2.8421, "step": 6460 }, { "epoch": 0.17, "learning_rate": 0.001893759921195037, "loss": 2.4947, "step": 6461 }, { "epoch": 0.17, "learning_rate": 0.0018937208767576335, "loss": 2.9101, "step": 6462 }, { "epoch": 0.17, "learning_rate": 0.0018936818255495605, "loss": 2.9533, "step": 6463 }, { "epoch": 0.17, "learning_rate": 0.001893642767571114, "loss": 2.3428, "step": 6464 }, { "epoch": 0.17, "learning_rate": 0.0018936037028225892, "loss": 2.6379, "step": 6465 }, { "epoch": 0.17, "learning_rate": 0.0018935646313042826, "loss": 2.4138, "step": 6466 }, { "epoch": 0.17, "learning_rate": 0.0018935255530164903, "loss": 2.8753, "step": 6467 }, { "epoch": 0.17, "learning_rate": 0.0018934864679595084, "loss": 2.2101, "step": 6468 }, { "epoch": 0.17, "learning_rate": 0.0018934473761336324, "loss": 2.8805, "step": 6469 }, { "epoch": 0.17, "learning_rate": 0.0018934082775391588, "loss": 2.6071, "step": 6470 }, { "epoch": 0.17, "learning_rate": 0.0018933691721763836, "loss": 2.6616, "step": 6471 }, { "epoch": 0.17, "learning_rate": 0.0018933300600456038, "loss": 2.881, "step": 6472 }, { "epoch": 0.17, "learning_rate": 0.0018932909411471148, "loss": 3.1613, "step": 6473 }, { "epoch": 0.17, "learning_rate": 0.0018932518154812135, "loss": 2.7312, "step": 6474 }, { "epoch": 0.17, "learning_rate": 0.0018932126830481961, "loss": 2.9917, "step": 6475 }, { "epoch": 0.17, "learning_rate": 0.0018931735438483593, "loss": 2.6812, "step": 6476 }, { "epoch": 0.17, "learning_rate": 0.0018931343978819994, "loss": 2.2313, "step": 6477 }, { "epoch": 0.17, "learning_rate": 0.0018930952451494125, "loss": 2.9914, "step": 6478 }, { "epoch": 0.17, "learning_rate": 0.0018930560856508963, "loss": 2.7137, "step": 6479 }, { "epoch": 0.17, "learning_rate": 0.0018930169193867464, "loss": 2.8763, "step": 6480 }, { "epoch": 0.17, "learning_rate": 0.0018929777463572602, "loss": 2.6352, "step": 6481 }, { "epoch": 0.17, "learning_rate": 0.001892938566562734, "loss": 2.2662, "step": 6482 }, { "epoch": 0.17, "learning_rate": 0.001892899380003465, "loss": 2.6502, "step": 6483 }, { "epoch": 0.17, "learning_rate": 0.0018928601866797501, "loss": 2.9554, "step": 6484 }, { "epoch": 0.17, "learning_rate": 0.001892820986591886, "loss": 2.6956, "step": 6485 }, { "epoch": 0.17, "learning_rate": 0.0018927817797401696, "loss": 2.6297, "step": 6486 }, { "epoch": 0.17, "learning_rate": 0.0018927425661248983, "loss": 3.0458, "step": 6487 }, { "epoch": 0.17, "learning_rate": 0.0018927033457463685, "loss": 2.5211, "step": 6488 }, { "epoch": 0.17, "learning_rate": 0.0018926641186048782, "loss": 2.4445, "step": 6489 }, { "epoch": 0.17, "learning_rate": 0.001892624884700724, "loss": 2.6275, "step": 6490 }, { "epoch": 0.17, "learning_rate": 0.001892585644034203, "loss": 3.3654, "step": 6491 }, { "epoch": 0.17, "learning_rate": 0.0018925463966056129, "loss": 2.7996, "step": 6492 }, { "epoch": 0.17, "learning_rate": 0.001892507142415251, "loss": 2.255, "step": 6493 }, { "epoch": 0.17, "learning_rate": 0.0018924678814634143, "loss": 2.4032, "step": 6494 }, { "epoch": 0.17, "learning_rate": 0.0018924286137504006, "loss": 2.5857, "step": 6495 }, { "epoch": 0.17, "learning_rate": 0.0018923893392765075, "loss": 2.5924, "step": 6496 }, { "epoch": 0.17, "learning_rate": 0.001892350058042032, "loss": 2.7223, "step": 6497 }, { "epoch": 0.17, "learning_rate": 0.0018923107700472722, "loss": 2.6339, "step": 6498 }, { "epoch": 0.17, "learning_rate": 0.0018922714752925254, "loss": 2.6793, "step": 6499 }, { "epoch": 0.17, "learning_rate": 0.0018922321737780893, "loss": 2.3883, "step": 6500 }, { "epoch": 0.17, "learning_rate": 0.0018921928655042622, "loss": 2.8759, "step": 6501 }, { "epoch": 0.17, "learning_rate": 0.001892153550471341, "loss": 2.6121, "step": 6502 }, { "epoch": 0.17, "learning_rate": 0.0018921142286796244, "loss": 2.5646, "step": 6503 }, { "epoch": 0.17, "learning_rate": 0.0018920749001294097, "loss": 2.5984, "step": 6504 }, { "epoch": 0.17, "learning_rate": 0.0018920355648209951, "loss": 2.9793, "step": 6505 }, { "epoch": 0.17, "learning_rate": 0.0018919962227546786, "loss": 2.7844, "step": 6506 }, { "epoch": 0.17, "learning_rate": 0.001891956873930758, "loss": 2.6007, "step": 6507 }, { "epoch": 0.17, "learning_rate": 0.0018919175183495316, "loss": 2.9094, "step": 6508 }, { "epoch": 0.17, "learning_rate": 0.0018918781560112977, "loss": 2.9073, "step": 6509 }, { "epoch": 0.17, "learning_rate": 0.0018918387869163542, "loss": 2.6357, "step": 6510 }, { "epoch": 0.17, "learning_rate": 0.0018917994110649997, "loss": 2.423, "step": 6511 }, { "epoch": 0.18, "learning_rate": 0.001891760028457532, "loss": 2.4241, "step": 6512 }, { "epoch": 0.18, "learning_rate": 0.00189172063909425, "loss": 2.5053, "step": 6513 }, { "epoch": 0.18, "learning_rate": 0.0018916812429754515, "loss": 2.7204, "step": 6514 }, { "epoch": 0.18, "learning_rate": 0.0018916418401014358, "loss": 2.7522, "step": 6515 }, { "epoch": 0.18, "learning_rate": 0.0018916024304725006, "loss": 2.776, "step": 6516 }, { "epoch": 0.18, "learning_rate": 0.001891563014088945, "loss": 2.5194, "step": 6517 }, { "epoch": 0.18, "learning_rate": 0.0018915235909510674, "loss": 2.8882, "step": 6518 }, { "epoch": 0.18, "learning_rate": 0.0018914841610591661, "loss": 2.5496, "step": 6519 }, { "epoch": 0.18, "learning_rate": 0.0018914447244135406, "loss": 2.67, "step": 6520 }, { "epoch": 0.18, "learning_rate": 0.0018914052810144893, "loss": 2.5935, "step": 6521 }, { "epoch": 0.18, "learning_rate": 0.0018913658308623105, "loss": 2.2585, "step": 6522 }, { "epoch": 0.18, "learning_rate": 0.001891326373957304, "loss": 2.6712, "step": 6523 }, { "epoch": 0.18, "learning_rate": 0.0018912869102997681, "loss": 2.7316, "step": 6524 }, { "epoch": 0.18, "learning_rate": 0.0018912474398900018, "loss": 2.5331, "step": 6525 }, { "epoch": 0.18, "learning_rate": 0.0018912079627283044, "loss": 2.4396, "step": 6526 }, { "epoch": 0.18, "learning_rate": 0.0018911684788149744, "loss": 2.5605, "step": 6527 }, { "epoch": 0.18, "learning_rate": 0.0018911289881503117, "loss": 2.9264, "step": 6528 }, { "epoch": 0.18, "learning_rate": 0.0018910894907346151, "loss": 2.6465, "step": 6529 }, { "epoch": 0.18, "learning_rate": 0.0018910499865681838, "loss": 2.2776, "step": 6530 }, { "epoch": 0.18, "learning_rate": 0.0018910104756513172, "loss": 2.6663, "step": 6531 }, { "epoch": 0.18, "learning_rate": 0.0018909709579843141, "loss": 2.3528, "step": 6532 }, { "epoch": 0.18, "learning_rate": 0.0018909314335674744, "loss": 2.4727, "step": 6533 }, { "epoch": 0.18, "learning_rate": 0.001890891902401098, "loss": 2.6405, "step": 6534 }, { "epoch": 0.18, "learning_rate": 0.0018908523644854834, "loss": 3.0432, "step": 6535 }, { "epoch": 0.18, "learning_rate": 0.0018908128198209307, "loss": 3.0063, "step": 6536 }, { "epoch": 0.18, "learning_rate": 0.0018907732684077393, "loss": 2.4706, "step": 6537 }, { "epoch": 0.18, "learning_rate": 0.001890733710246209, "loss": 2.6629, "step": 6538 }, { "epoch": 0.18, "learning_rate": 0.001890694145336639, "loss": 2.581, "step": 6539 }, { "epoch": 0.18, "learning_rate": 0.0018906545736793296, "loss": 3.0872, "step": 6540 }, { "epoch": 0.18, "learning_rate": 0.0018906149952745803, "loss": 2.7233, "step": 6541 }, { "epoch": 0.18, "learning_rate": 0.0018905754101226913, "loss": 2.521, "step": 6542 }, { "epoch": 0.18, "learning_rate": 0.0018905358182239617, "loss": 2.6168, "step": 6543 }, { "epoch": 0.18, "learning_rate": 0.0018904962195786927, "loss": 2.9369, "step": 6544 }, { "epoch": 0.18, "learning_rate": 0.0018904566141871829, "loss": 3.0164, "step": 6545 }, { "epoch": 0.18, "learning_rate": 0.0018904170020497334, "loss": 2.7674, "step": 6546 }, { "epoch": 0.18, "learning_rate": 0.0018903773831666438, "loss": 2.5225, "step": 6547 }, { "epoch": 0.18, "learning_rate": 0.0018903377575382142, "loss": 2.6331, "step": 6548 }, { "epoch": 0.18, "learning_rate": 0.0018902981251647448, "loss": 2.9765, "step": 6549 }, { "epoch": 0.18, "learning_rate": 0.0018902584860465363, "loss": 2.8422, "step": 6550 }, { "epoch": 0.18, "learning_rate": 0.0018902188401838883, "loss": 2.4517, "step": 6551 }, { "epoch": 0.18, "learning_rate": 0.0018901791875771017, "loss": 2.7595, "step": 6552 }, { "epoch": 0.18, "learning_rate": 0.0018901395282264768, "loss": 2.7316, "step": 6553 }, { "epoch": 0.18, "learning_rate": 0.0018900998621323138, "loss": 3.2689, "step": 6554 }, { "epoch": 0.18, "learning_rate": 0.0018900601892949136, "loss": 2.6104, "step": 6555 }, { "epoch": 0.18, "learning_rate": 0.0018900205097145766, "loss": 2.5459, "step": 6556 }, { "epoch": 0.18, "learning_rate": 0.001889980823391603, "loss": 2.451, "step": 6557 }, { "epoch": 0.18, "learning_rate": 0.001889941130326294, "loss": 2.326, "step": 6558 }, { "epoch": 0.18, "learning_rate": 0.0018899014305189502, "loss": 2.8136, "step": 6559 }, { "epoch": 0.18, "learning_rate": 0.0018898617239698722, "loss": 2.7068, "step": 6560 }, { "epoch": 0.18, "learning_rate": 0.0018898220106793606, "loss": 2.7463, "step": 6561 }, { "epoch": 0.18, "learning_rate": 0.0018897822906477168, "loss": 2.4132, "step": 6562 }, { "epoch": 0.18, "learning_rate": 0.0018897425638752414, "loss": 2.6327, "step": 6563 }, { "epoch": 0.18, "learning_rate": 0.0018897028303622354, "loss": 2.7444, "step": 6564 }, { "epoch": 0.18, "learning_rate": 0.0018896630901089999, "loss": 2.8333, "step": 6565 }, { "epoch": 0.18, "learning_rate": 0.0018896233431158357, "loss": 2.7809, "step": 6566 }, { "epoch": 0.18, "learning_rate": 0.0018895835893830441, "loss": 2.7997, "step": 6567 }, { "epoch": 0.18, "learning_rate": 0.0018895438289109263, "loss": 2.9459, "step": 6568 }, { "epoch": 0.18, "learning_rate": 0.0018895040616997837, "loss": 2.4956, "step": 6569 }, { "epoch": 0.18, "learning_rate": 0.0018894642877499172, "loss": 2.663, "step": 6570 }, { "epoch": 0.18, "learning_rate": 0.0018894245070616284, "loss": 2.2902, "step": 6571 }, { "epoch": 0.18, "learning_rate": 0.0018893847196352182, "loss": 2.6759, "step": 6572 }, { "epoch": 0.18, "learning_rate": 0.0018893449254709887, "loss": 2.4025, "step": 6573 }, { "epoch": 0.18, "learning_rate": 0.001889305124569241, "loss": 3.0347, "step": 6574 }, { "epoch": 0.18, "learning_rate": 0.0018892653169302767, "loss": 2.5294, "step": 6575 }, { "epoch": 0.18, "learning_rate": 0.0018892255025543974, "loss": 2.5108, "step": 6576 }, { "epoch": 0.18, "learning_rate": 0.0018891856814419047, "loss": 2.4818, "step": 6577 }, { "epoch": 0.18, "learning_rate": 0.0018891458535931, "loss": 2.9287, "step": 6578 }, { "epoch": 0.18, "learning_rate": 0.0018891060190082852, "loss": 2.4505, "step": 6579 }, { "epoch": 0.18, "learning_rate": 0.0018890661776877625, "loss": 2.3715, "step": 6580 }, { "epoch": 0.18, "learning_rate": 0.0018890263296318331, "loss": 2.6938, "step": 6581 }, { "epoch": 0.18, "learning_rate": 0.0018889864748407993, "loss": 2.9328, "step": 6582 }, { "epoch": 0.18, "learning_rate": 0.001888946613314963, "loss": 2.5238, "step": 6583 }, { "epoch": 0.18, "learning_rate": 0.0018889067450546257, "loss": 2.9243, "step": 6584 }, { "epoch": 0.18, "learning_rate": 0.0018888668700600905, "loss": 2.7883, "step": 6585 }, { "epoch": 0.18, "learning_rate": 0.0018888269883316582, "loss": 2.445, "step": 6586 }, { "epoch": 0.18, "learning_rate": 0.0018887870998696317, "loss": 2.5922, "step": 6587 }, { "epoch": 0.18, "learning_rate": 0.001888747204674313, "loss": 2.4522, "step": 6588 }, { "epoch": 0.18, "learning_rate": 0.0018887073027460044, "loss": 2.6676, "step": 6589 }, { "epoch": 0.18, "learning_rate": 0.0018886673940850082, "loss": 2.9637, "step": 6590 }, { "epoch": 0.18, "learning_rate": 0.0018886274786916268, "loss": 2.9066, "step": 6591 }, { "epoch": 0.18, "learning_rate": 0.0018885875565661622, "loss": 2.4292, "step": 6592 }, { "epoch": 0.18, "learning_rate": 0.0018885476277089176, "loss": 2.8515, "step": 6593 }, { "epoch": 0.18, "learning_rate": 0.0018885076921201947, "loss": 2.6942, "step": 6594 }, { "epoch": 0.18, "learning_rate": 0.0018884677498002965, "loss": 3.0252, "step": 6595 }, { "epoch": 0.18, "learning_rate": 0.0018884278007495255, "loss": 2.5634, "step": 6596 }, { "epoch": 0.18, "learning_rate": 0.0018883878449681842, "loss": 3.0441, "step": 6597 }, { "epoch": 0.18, "learning_rate": 0.0018883478824565753, "loss": 2.5101, "step": 6598 }, { "epoch": 0.18, "learning_rate": 0.0018883079132150018, "loss": 2.3998, "step": 6599 }, { "epoch": 0.18, "learning_rate": 0.0018882679372437667, "loss": 2.5963, "step": 6600 }, { "epoch": 0.18, "learning_rate": 0.001888227954543172, "loss": 2.8803, "step": 6601 }, { "epoch": 0.18, "learning_rate": 0.0018881879651135214, "loss": 2.4835, "step": 6602 }, { "epoch": 0.18, "learning_rate": 0.0018881479689551173, "loss": 2.7557, "step": 6603 }, { "epoch": 0.18, "learning_rate": 0.0018881079660682631, "loss": 2.363, "step": 6604 }, { "epoch": 0.18, "learning_rate": 0.0018880679564532619, "loss": 2.9871, "step": 6605 }, { "epoch": 0.18, "learning_rate": 0.0018880279401104166, "loss": 2.6394, "step": 6606 }, { "epoch": 0.18, "learning_rate": 0.0018879879170400303, "loss": 2.5233, "step": 6607 }, { "epoch": 0.18, "learning_rate": 0.0018879478872424063, "loss": 2.7034, "step": 6608 }, { "epoch": 0.18, "learning_rate": 0.0018879078507178478, "loss": 2.9976, "step": 6609 }, { "epoch": 0.18, "learning_rate": 0.0018878678074666583, "loss": 2.6896, "step": 6610 }, { "epoch": 0.18, "learning_rate": 0.001887827757489141, "loss": 2.9217, "step": 6611 }, { "epoch": 0.18, "learning_rate": 0.0018877877007855992, "loss": 2.5031, "step": 6612 }, { "epoch": 0.18, "learning_rate": 0.0018877476373563365, "loss": 2.6363, "step": 6613 }, { "epoch": 0.18, "learning_rate": 0.0018877075672016565, "loss": 2.7005, "step": 6614 }, { "epoch": 0.18, "learning_rate": 0.0018876674903218627, "loss": 2.3694, "step": 6615 }, { "epoch": 0.18, "learning_rate": 0.0018876274067172588, "loss": 2.6761, "step": 6616 }, { "epoch": 0.18, "learning_rate": 0.0018875873163881481, "loss": 2.6051, "step": 6617 }, { "epoch": 0.18, "learning_rate": 0.0018875472193348349, "loss": 2.5017, "step": 6618 }, { "epoch": 0.18, "learning_rate": 0.0018875071155576224, "loss": 2.5585, "step": 6619 }, { "epoch": 0.18, "learning_rate": 0.0018874670050568147, "loss": 2.894, "step": 6620 }, { "epoch": 0.18, "learning_rate": 0.0018874268878327155, "loss": 2.6479, "step": 6621 }, { "epoch": 0.18, "learning_rate": 0.0018873867638856292, "loss": 2.5312, "step": 6622 }, { "epoch": 0.18, "learning_rate": 0.0018873466332158591, "loss": 2.7488, "step": 6623 }, { "epoch": 0.18, "learning_rate": 0.0018873064958237098, "loss": 2.8786, "step": 6624 }, { "epoch": 0.18, "learning_rate": 0.001887266351709485, "loss": 2.7842, "step": 6625 }, { "epoch": 0.18, "learning_rate": 0.001887226200873489, "loss": 2.7409, "step": 6626 }, { "epoch": 0.18, "learning_rate": 0.0018871860433160258, "loss": 2.5255, "step": 6627 }, { "epoch": 0.18, "learning_rate": 0.0018871458790373997, "loss": 2.6566, "step": 6628 }, { "epoch": 0.18, "learning_rate": 0.0018871057080379152, "loss": 2.4974, "step": 6629 }, { "epoch": 0.18, "learning_rate": 0.0018870655303178765, "loss": 2.825, "step": 6630 }, { "epoch": 0.18, "learning_rate": 0.001887025345877588, "loss": 2.4447, "step": 6631 }, { "epoch": 0.18, "learning_rate": 0.0018869851547173538, "loss": 2.8088, "step": 6632 }, { "epoch": 0.18, "learning_rate": 0.0018869449568374788, "loss": 2.6663, "step": 6633 }, { "epoch": 0.18, "learning_rate": 0.0018869047522382671, "loss": 2.9802, "step": 6634 }, { "epoch": 0.18, "learning_rate": 0.001886864540920024, "loss": 2.5434, "step": 6635 }, { "epoch": 0.18, "learning_rate": 0.0018868243228830532, "loss": 2.4149, "step": 6636 }, { "epoch": 0.18, "learning_rate": 0.0018867840981276604, "loss": 2.4128, "step": 6637 }, { "epoch": 0.18, "learning_rate": 0.0018867438666541495, "loss": 2.5979, "step": 6638 }, { "epoch": 0.18, "learning_rate": 0.0018867036284628256, "loss": 2.7891, "step": 6639 }, { "epoch": 0.18, "learning_rate": 0.0018866633835539937, "loss": 2.3151, "step": 6640 }, { "epoch": 0.18, "learning_rate": 0.0018866231319279586, "loss": 2.5895, "step": 6641 }, { "epoch": 0.18, "learning_rate": 0.001886582873585025, "loss": 2.7908, "step": 6642 }, { "epoch": 0.18, "learning_rate": 0.001886542608525498, "loss": 2.3435, "step": 6643 }, { "epoch": 0.18, "learning_rate": 0.0018865023367496828, "loss": 2.6888, "step": 6644 }, { "epoch": 0.18, "learning_rate": 0.0018864620582578842, "loss": 2.7105, "step": 6645 }, { "epoch": 0.18, "learning_rate": 0.0018864217730504076, "loss": 2.3446, "step": 6646 }, { "epoch": 0.18, "learning_rate": 0.0018863814811275583, "loss": 2.3428, "step": 6647 }, { "epoch": 0.18, "learning_rate": 0.0018863411824896414, "loss": 2.5587, "step": 6648 }, { "epoch": 0.18, "learning_rate": 0.001886300877136962, "loss": 2.6173, "step": 6649 }, { "epoch": 0.18, "learning_rate": 0.0018862605650698256, "loss": 2.4976, "step": 6650 }, { "epoch": 0.18, "learning_rate": 0.0018862202462885378, "loss": 2.5261, "step": 6651 }, { "epoch": 0.18, "learning_rate": 0.0018861799207934035, "loss": 2.889, "step": 6652 }, { "epoch": 0.18, "learning_rate": 0.001886139588584729, "loss": 2.6314, "step": 6653 }, { "epoch": 0.18, "learning_rate": 0.001886099249662819, "loss": 2.7109, "step": 6654 }, { "epoch": 0.18, "learning_rate": 0.0018860589040279798, "loss": 2.5455, "step": 6655 }, { "epoch": 0.18, "learning_rate": 0.0018860185516805165, "loss": 2.4049, "step": 6656 }, { "epoch": 0.18, "learning_rate": 0.0018859781926207353, "loss": 2.3532, "step": 6657 }, { "epoch": 0.18, "learning_rate": 0.0018859378268489416, "loss": 2.649, "step": 6658 }, { "epoch": 0.18, "learning_rate": 0.0018858974543654412, "loss": 2.4204, "step": 6659 }, { "epoch": 0.18, "learning_rate": 0.0018858570751705405, "loss": 2.3255, "step": 6660 }, { "epoch": 0.18, "learning_rate": 0.0018858166892645445, "loss": 2.8637, "step": 6661 }, { "epoch": 0.18, "learning_rate": 0.0018857762966477598, "loss": 2.6358, "step": 6662 }, { "epoch": 0.18, "learning_rate": 0.0018857358973204921, "loss": 2.5424, "step": 6663 }, { "epoch": 0.18, "learning_rate": 0.0018856954912830478, "loss": 2.1581, "step": 6664 }, { "epoch": 0.18, "learning_rate": 0.001885655078535733, "loss": 2.4379, "step": 6665 }, { "epoch": 0.18, "learning_rate": 0.0018856146590788532, "loss": 2.6095, "step": 6666 }, { "epoch": 0.18, "learning_rate": 0.0018855742329127155, "loss": 2.4615, "step": 6667 }, { "epoch": 0.18, "learning_rate": 0.0018855338000376251, "loss": 2.5773, "step": 6668 }, { "epoch": 0.18, "learning_rate": 0.0018854933604538896, "loss": 2.5209, "step": 6669 }, { "epoch": 0.18, "learning_rate": 0.0018854529141618147, "loss": 2.6946, "step": 6670 }, { "epoch": 0.18, "learning_rate": 0.0018854124611617062, "loss": 2.5861, "step": 6671 }, { "epoch": 0.18, "learning_rate": 0.0018853720014538717, "loss": 2.5852, "step": 6672 }, { "epoch": 0.18, "learning_rate": 0.0018853315350386172, "loss": 2.3133, "step": 6673 }, { "epoch": 0.18, "learning_rate": 0.0018852910619162491, "loss": 2.7571, "step": 6674 }, { "epoch": 0.18, "learning_rate": 0.0018852505820870743, "loss": 2.6131, "step": 6675 }, { "epoch": 0.18, "learning_rate": 0.0018852100955513993, "loss": 2.6559, "step": 6676 }, { "epoch": 0.18, "learning_rate": 0.0018851696023095312, "loss": 2.3956, "step": 6677 }, { "epoch": 0.18, "learning_rate": 0.001885129102361776, "loss": 2.7202, "step": 6678 }, { "epoch": 0.18, "learning_rate": 0.001885088595708441, "loss": 3.0837, "step": 6679 }, { "epoch": 0.18, "learning_rate": 0.001885048082349833, "loss": 2.5726, "step": 6680 }, { "epoch": 0.18, "learning_rate": 0.0018850075622862592, "loss": 2.7221, "step": 6681 }, { "epoch": 0.18, "learning_rate": 0.0018849670355180264, "loss": 2.7386, "step": 6682 }, { "epoch": 0.18, "learning_rate": 0.0018849265020454413, "loss": 2.3025, "step": 6683 }, { "epoch": 0.18, "learning_rate": 0.0018848859618688114, "loss": 2.9537, "step": 6684 }, { "epoch": 0.18, "learning_rate": 0.0018848454149884436, "loss": 2.9552, "step": 6685 }, { "epoch": 0.18, "learning_rate": 0.0018848048614046452, "loss": 2.8243, "step": 6686 }, { "epoch": 0.18, "learning_rate": 0.0018847643011177231, "loss": 2.7842, "step": 6687 }, { "epoch": 0.18, "learning_rate": 0.001884723734127985, "loss": 2.9016, "step": 6688 }, { "epoch": 0.18, "learning_rate": 0.0018846831604357379, "loss": 2.7153, "step": 6689 }, { "epoch": 0.18, "learning_rate": 0.0018846425800412897, "loss": 2.5775, "step": 6690 }, { "epoch": 0.18, "learning_rate": 0.0018846019929449475, "loss": 2.8252, "step": 6691 }, { "epoch": 0.18, "learning_rate": 0.0018845613991470183, "loss": 2.7582, "step": 6692 }, { "epoch": 0.18, "learning_rate": 0.0018845207986478104, "loss": 2.3841, "step": 6693 }, { "epoch": 0.18, "learning_rate": 0.001884480191447631, "loss": 2.6929, "step": 6694 }, { "epoch": 0.18, "learning_rate": 0.0018844395775467876, "loss": 2.7271, "step": 6695 }, { "epoch": 0.18, "learning_rate": 0.0018843989569455885, "loss": 2.5585, "step": 6696 }, { "epoch": 0.18, "learning_rate": 0.0018843583296443407, "loss": 2.2283, "step": 6697 }, { "epoch": 0.18, "learning_rate": 0.0018843176956433525, "loss": 2.9191, "step": 6698 }, { "epoch": 0.18, "learning_rate": 0.0018842770549429315, "loss": 2.5779, "step": 6699 }, { "epoch": 0.18, "learning_rate": 0.0018842364075433854, "loss": 2.8683, "step": 6700 }, { "epoch": 0.18, "learning_rate": 0.0018841957534450225, "loss": 2.6974, "step": 6701 }, { "epoch": 0.18, "learning_rate": 0.0018841550926481509, "loss": 2.8215, "step": 6702 }, { "epoch": 0.18, "learning_rate": 0.001884114425153078, "loss": 2.6568, "step": 6703 }, { "epoch": 0.18, "learning_rate": 0.0018840737509601125, "loss": 2.3292, "step": 6704 }, { "epoch": 0.18, "learning_rate": 0.0018840330700695624, "loss": 2.6399, "step": 6705 }, { "epoch": 0.18, "learning_rate": 0.0018839923824817357, "loss": 3.0723, "step": 6706 }, { "epoch": 0.18, "learning_rate": 0.0018839516881969404, "loss": 2.6976, "step": 6707 }, { "epoch": 0.18, "learning_rate": 0.0018839109872154855, "loss": 2.5905, "step": 6708 }, { "epoch": 0.18, "learning_rate": 0.0018838702795376792, "loss": 2.8004, "step": 6709 }, { "epoch": 0.18, "learning_rate": 0.0018838295651638294, "loss": 2.3668, "step": 6710 }, { "epoch": 0.18, "learning_rate": 0.0018837888440942448, "loss": 2.5812, "step": 6711 }, { "epoch": 0.18, "learning_rate": 0.001883748116329234, "loss": 2.4255, "step": 6712 }, { "epoch": 0.18, "learning_rate": 0.0018837073818691054, "loss": 2.6716, "step": 6713 }, { "epoch": 0.18, "learning_rate": 0.001883666640714168, "loss": 2.4661, "step": 6714 }, { "epoch": 0.18, "learning_rate": 0.00188362589286473, "loss": 2.739, "step": 6715 }, { "epoch": 0.18, "learning_rate": 0.0018835851383211, "loss": 2.7043, "step": 6716 }, { "epoch": 0.18, "learning_rate": 0.001883544377083587, "loss": 2.9212, "step": 6717 }, { "epoch": 0.18, "learning_rate": 0.0018835036091524998, "loss": 2.5837, "step": 6718 }, { "epoch": 0.18, "learning_rate": 0.0018834628345281474, "loss": 2.673, "step": 6719 }, { "epoch": 0.18, "learning_rate": 0.001883422053210838, "loss": 2.6295, "step": 6720 }, { "epoch": 0.18, "learning_rate": 0.0018833812652008814, "loss": 2.3617, "step": 6721 }, { "epoch": 0.18, "learning_rate": 0.0018833404704985863, "loss": 2.3476, "step": 6722 }, { "epoch": 0.18, "learning_rate": 0.0018832996691042618, "loss": 2.638, "step": 6723 }, { "epoch": 0.18, "learning_rate": 0.0018832588610182166, "loss": 2.8384, "step": 6724 }, { "epoch": 0.18, "learning_rate": 0.0018832180462407604, "loss": 2.579, "step": 6725 }, { "epoch": 0.18, "learning_rate": 0.0018831772247722021, "loss": 2.935, "step": 6726 }, { "epoch": 0.18, "learning_rate": 0.0018831363966128514, "loss": 2.5106, "step": 6727 }, { "epoch": 0.18, "learning_rate": 0.0018830955617630167, "loss": 2.6666, "step": 6728 }, { "epoch": 0.18, "learning_rate": 0.0018830547202230083, "loss": 2.5879, "step": 6729 }, { "epoch": 0.18, "learning_rate": 0.001883013871993135, "loss": 2.7781, "step": 6730 }, { "epoch": 0.18, "learning_rate": 0.0018829730170737066, "loss": 2.6771, "step": 6731 }, { "epoch": 0.18, "learning_rate": 0.0018829321554650325, "loss": 2.7091, "step": 6732 }, { "epoch": 0.18, "learning_rate": 0.0018828912871674223, "loss": 3.0644, "step": 6733 }, { "epoch": 0.18, "learning_rate": 0.0018828504121811854, "loss": 2.8221, "step": 6734 }, { "epoch": 0.18, "learning_rate": 0.0018828095305066315, "loss": 2.94, "step": 6735 }, { "epoch": 0.18, "learning_rate": 0.0018827686421440707, "loss": 2.7983, "step": 6736 }, { "epoch": 0.18, "learning_rate": 0.0018827277470938122, "loss": 2.4171, "step": 6737 }, { "epoch": 0.18, "learning_rate": 0.0018826868453561665, "loss": 2.3199, "step": 6738 }, { "epoch": 0.18, "learning_rate": 0.0018826459369314429, "loss": 2.7091, "step": 6739 }, { "epoch": 0.18, "learning_rate": 0.0018826050218199513, "loss": 2.857, "step": 6740 }, { "epoch": 0.18, "learning_rate": 0.001882564100022002, "loss": 2.6262, "step": 6741 }, { "epoch": 0.18, "learning_rate": 0.0018825231715379049, "loss": 2.653, "step": 6742 }, { "epoch": 0.18, "learning_rate": 0.00188248223636797, "loss": 2.5917, "step": 6743 }, { "epoch": 0.18, "learning_rate": 0.0018824412945125074, "loss": 2.6451, "step": 6744 }, { "epoch": 0.18, "learning_rate": 0.0018824003459718274, "loss": 2.7077, "step": 6745 }, { "epoch": 0.18, "learning_rate": 0.00188235939074624, "loss": 2.7883, "step": 6746 }, { "epoch": 0.18, "learning_rate": 0.0018823184288360557, "loss": 2.7172, "step": 6747 }, { "epoch": 0.18, "learning_rate": 0.0018822774602415846, "loss": 2.8413, "step": 6748 }, { "epoch": 0.18, "learning_rate": 0.0018822364849631374, "loss": 2.8139, "step": 6749 }, { "epoch": 0.18, "learning_rate": 0.0018821955030010242, "loss": 2.6117, "step": 6750 }, { "epoch": 0.18, "learning_rate": 0.0018821545143555558, "loss": 2.8889, "step": 6751 }, { "epoch": 0.18, "learning_rate": 0.0018821135190270422, "loss": 3.0106, "step": 6752 }, { "epoch": 0.18, "learning_rate": 0.0018820725170157946, "loss": 2.6099, "step": 6753 }, { "epoch": 0.18, "learning_rate": 0.001882031508322123, "loss": 2.8437, "step": 6754 }, { "epoch": 0.18, "learning_rate": 0.0018819904929463385, "loss": 2.5204, "step": 6755 }, { "epoch": 0.18, "learning_rate": 0.0018819494708887518, "loss": 2.37, "step": 6756 }, { "epoch": 0.18, "learning_rate": 0.0018819084421496735, "loss": 2.3557, "step": 6757 }, { "epoch": 0.18, "learning_rate": 0.0018818674067294146, "loss": 2.7086, "step": 6758 }, { "epoch": 0.18, "learning_rate": 0.0018818263646282858, "loss": 2.6137, "step": 6759 }, { "epoch": 0.18, "learning_rate": 0.001881785315846598, "loss": 2.6516, "step": 6760 }, { "epoch": 0.18, "learning_rate": 0.0018817442603846627, "loss": 2.744, "step": 6761 }, { "epoch": 0.18, "learning_rate": 0.0018817031982427902, "loss": 2.8446, "step": 6762 }, { "epoch": 0.18, "learning_rate": 0.001881662129421292, "loss": 2.92, "step": 6763 }, { "epoch": 0.18, "learning_rate": 0.0018816210539204792, "loss": 2.481, "step": 6764 }, { "epoch": 0.18, "learning_rate": 0.0018815799717406625, "loss": 2.7385, "step": 6765 }, { "epoch": 0.18, "learning_rate": 0.001881538882882154, "loss": 2.8369, "step": 6766 }, { "epoch": 0.18, "learning_rate": 0.0018814977873452645, "loss": 2.6994, "step": 6767 }, { "epoch": 0.18, "learning_rate": 0.0018814566851303052, "loss": 2.8683, "step": 6768 }, { "epoch": 0.18, "learning_rate": 0.0018814155762375876, "loss": 2.5131, "step": 6769 }, { "epoch": 0.18, "learning_rate": 0.0018813744606674234, "loss": 2.5867, "step": 6770 }, { "epoch": 0.18, "learning_rate": 0.0018813333384201237, "loss": 2.5482, "step": 6771 }, { "epoch": 0.18, "learning_rate": 0.0018812922094960003, "loss": 2.335, "step": 6772 }, { "epoch": 0.18, "learning_rate": 0.0018812510738953645, "loss": 2.6887, "step": 6773 }, { "epoch": 0.18, "learning_rate": 0.0018812099316185282, "loss": 2.9911, "step": 6774 }, { "epoch": 0.18, "learning_rate": 0.001881168782665803, "loss": 3.0041, "step": 6775 }, { "epoch": 0.18, "learning_rate": 0.001881127627037501, "loss": 2.6409, "step": 6776 }, { "epoch": 0.18, "learning_rate": 0.0018810864647339329, "loss": 2.8037, "step": 6777 }, { "epoch": 0.18, "learning_rate": 0.001881045295755412, "loss": 2.6719, "step": 6778 }, { "epoch": 0.18, "learning_rate": 0.001881004120102249, "loss": 2.4245, "step": 6779 }, { "epoch": 0.18, "learning_rate": 0.0018809629377747564, "loss": 2.498, "step": 6780 }, { "epoch": 0.18, "learning_rate": 0.001880921748773246, "loss": 2.6436, "step": 6781 }, { "epoch": 0.18, "learning_rate": 0.00188088055309803, "loss": 2.7847, "step": 6782 }, { "epoch": 0.18, "learning_rate": 0.0018808393507494206, "loss": 2.7409, "step": 6783 }, { "epoch": 0.18, "learning_rate": 0.0018807981417277295, "loss": 2.643, "step": 6784 }, { "epoch": 0.18, "learning_rate": 0.0018807569260332693, "loss": 2.6803, "step": 6785 }, { "epoch": 0.18, "learning_rate": 0.001880715703666352, "loss": 2.8841, "step": 6786 }, { "epoch": 0.18, "learning_rate": 0.0018806744746272899, "loss": 2.9749, "step": 6787 }, { "epoch": 0.18, "learning_rate": 0.0018806332389163956, "loss": 2.863, "step": 6788 }, { "epoch": 0.18, "learning_rate": 0.0018805919965339815, "loss": 2.7544, "step": 6789 }, { "epoch": 0.18, "learning_rate": 0.0018805507474803597, "loss": 2.5637, "step": 6790 }, { "epoch": 0.18, "learning_rate": 0.0018805094917558427, "loss": 2.6712, "step": 6791 }, { "epoch": 0.18, "learning_rate": 0.0018804682293607434, "loss": 2.7725, "step": 6792 }, { "epoch": 0.18, "learning_rate": 0.0018804269602953742, "loss": 2.678, "step": 6793 }, { "epoch": 0.18, "learning_rate": 0.0018803856845600476, "loss": 2.0661, "step": 6794 }, { "epoch": 0.18, "learning_rate": 0.0018803444021550763, "loss": 2.9627, "step": 6795 }, { "epoch": 0.18, "learning_rate": 0.0018803031130807737, "loss": 2.7268, "step": 6796 }, { "epoch": 0.18, "learning_rate": 0.0018802618173374519, "loss": 2.6445, "step": 6797 }, { "epoch": 0.18, "learning_rate": 0.0018802205149254236, "loss": 2.4876, "step": 6798 }, { "epoch": 0.18, "learning_rate": 0.0018801792058450026, "loss": 2.5187, "step": 6799 }, { "epoch": 0.18, "learning_rate": 0.0018801378900965009, "loss": 2.742, "step": 6800 }, { "epoch": 0.18, "learning_rate": 0.0018800965676802322, "loss": 2.9233, "step": 6801 }, { "epoch": 0.18, "learning_rate": 0.001880055238596509, "loss": 2.5605, "step": 6802 }, { "epoch": 0.18, "learning_rate": 0.0018800139028456446, "loss": 2.7929, "step": 6803 }, { "epoch": 0.18, "learning_rate": 0.0018799725604279525, "loss": 2.6814, "step": 6804 }, { "epoch": 0.18, "learning_rate": 0.0018799312113437453, "loss": 2.4636, "step": 6805 }, { "epoch": 0.18, "learning_rate": 0.0018798898555933369, "loss": 2.5378, "step": 6806 }, { "epoch": 0.18, "learning_rate": 0.0018798484931770402, "loss": 2.436, "step": 6807 }, { "epoch": 0.18, "learning_rate": 0.0018798071240951682, "loss": 2.7567, "step": 6808 }, { "epoch": 0.18, "learning_rate": 0.001879765748348035, "loss": 2.7892, "step": 6809 }, { "epoch": 0.18, "learning_rate": 0.001879724365935954, "loss": 2.8989, "step": 6810 }, { "epoch": 0.18, "learning_rate": 0.001879682976859238, "loss": 2.7089, "step": 6811 }, { "epoch": 0.18, "learning_rate": 0.0018796415811182016, "loss": 2.5523, "step": 6812 }, { "epoch": 0.18, "learning_rate": 0.0018796001787131573, "loss": 2.8707, "step": 6813 }, { "epoch": 0.18, "learning_rate": 0.0018795587696444197, "loss": 2.6423, "step": 6814 }, { "epoch": 0.18, "learning_rate": 0.001879517353912302, "loss": 2.3504, "step": 6815 }, { "epoch": 0.18, "learning_rate": 0.001879475931517118, "loss": 2.6317, "step": 6816 }, { "epoch": 0.18, "learning_rate": 0.0018794345024591816, "loss": 2.7514, "step": 6817 }, { "epoch": 0.18, "learning_rate": 0.0018793930667388066, "loss": 2.9469, "step": 6818 }, { "epoch": 0.18, "learning_rate": 0.001879351624356307, "loss": 2.2932, "step": 6819 }, { "epoch": 0.18, "learning_rate": 0.0018793101753119968, "loss": 2.3488, "step": 6820 }, { "epoch": 0.18, "learning_rate": 0.0018792687196061897, "loss": 2.6881, "step": 6821 }, { "epoch": 0.18, "learning_rate": 0.0018792272572392002, "loss": 2.4095, "step": 6822 }, { "epoch": 0.18, "learning_rate": 0.0018791857882113421, "loss": 2.6385, "step": 6823 }, { "epoch": 0.18, "learning_rate": 0.0018791443125229295, "loss": 2.2754, "step": 6824 }, { "epoch": 0.18, "learning_rate": 0.0018791028301742769, "loss": 3.0667, "step": 6825 }, { "epoch": 0.18, "learning_rate": 0.0018790613411656986, "loss": 2.6545, "step": 6826 }, { "epoch": 0.18, "learning_rate": 0.0018790198454975084, "loss": 2.782, "step": 6827 }, { "epoch": 0.18, "learning_rate": 0.0018789783431700214, "loss": 2.2751, "step": 6828 }, { "epoch": 0.18, "learning_rate": 0.0018789368341835515, "loss": 2.4922, "step": 6829 }, { "epoch": 0.18, "learning_rate": 0.001878895318538413, "loss": 2.8352, "step": 6830 }, { "epoch": 0.18, "learning_rate": 0.001878853796234921, "loss": 2.6692, "step": 6831 }, { "epoch": 0.18, "learning_rate": 0.0018788122672733895, "loss": 2.448, "step": 6832 }, { "epoch": 0.18, "learning_rate": 0.0018787707316541336, "loss": 2.842, "step": 6833 }, { "epoch": 0.18, "learning_rate": 0.001878729189377468, "loss": 2.5387, "step": 6834 }, { "epoch": 0.18, "learning_rate": 0.0018786876404437065, "loss": 2.7999, "step": 6835 }, { "epoch": 0.18, "learning_rate": 0.001878646084853165, "loss": 2.5661, "step": 6836 }, { "epoch": 0.18, "learning_rate": 0.0018786045226061576, "loss": 2.4895, "step": 6837 }, { "epoch": 0.18, "learning_rate": 0.0018785629537029999, "loss": 2.384, "step": 6838 }, { "epoch": 0.18, "learning_rate": 0.0018785213781440057, "loss": 2.8375, "step": 6839 }, { "epoch": 0.18, "learning_rate": 0.0018784797959294909, "loss": 2.5989, "step": 6840 }, { "epoch": 0.18, "learning_rate": 0.0018784382070597702, "loss": 2.4509, "step": 6841 }, { "epoch": 0.18, "learning_rate": 0.0018783966115351587, "loss": 2.6403, "step": 6842 }, { "epoch": 0.18, "learning_rate": 0.0018783550093559717, "loss": 2.6097, "step": 6843 }, { "epoch": 0.18, "learning_rate": 0.001878313400522524, "loss": 2.9929, "step": 6844 }, { "epoch": 0.18, "learning_rate": 0.001878271785035131, "loss": 2.6178, "step": 6845 }, { "epoch": 0.18, "learning_rate": 0.001878230162894108, "loss": 2.2617, "step": 6846 }, { "epoch": 0.18, "learning_rate": 0.0018781885340997699, "loss": 2.6706, "step": 6847 }, { "epoch": 0.18, "learning_rate": 0.001878146898652433, "loss": 2.4008, "step": 6848 }, { "epoch": 0.18, "learning_rate": 0.0018781052565524118, "loss": 2.8054, "step": 6849 }, { "epoch": 0.18, "learning_rate": 0.0018780636078000227, "loss": 2.7643, "step": 6850 }, { "epoch": 0.18, "learning_rate": 0.0018780219523955805, "loss": 2.7254, "step": 6851 }, { "epoch": 0.18, "learning_rate": 0.0018779802903394005, "loss": 2.5946, "step": 6852 }, { "epoch": 0.18, "learning_rate": 0.0018779386216317992, "loss": 2.1798, "step": 6853 }, { "epoch": 0.18, "learning_rate": 0.001877896946273092, "loss": 2.4493, "step": 6854 }, { "epoch": 0.18, "learning_rate": 0.0018778552642635944, "loss": 2.8037, "step": 6855 }, { "epoch": 0.18, "learning_rate": 0.001877813575603622, "loss": 2.4356, "step": 6856 }, { "epoch": 0.18, "learning_rate": 0.0018777718802934912, "loss": 2.8827, "step": 6857 }, { "epoch": 0.18, "learning_rate": 0.0018777301783335174, "loss": 2.9643, "step": 6858 }, { "epoch": 0.18, "learning_rate": 0.0018776884697240166, "loss": 2.5785, "step": 6859 }, { "epoch": 0.18, "learning_rate": 0.0018776467544653049, "loss": 3.0516, "step": 6860 }, { "epoch": 0.18, "learning_rate": 0.0018776050325576986, "loss": 2.6684, "step": 6861 }, { "epoch": 0.18, "learning_rate": 0.0018775633040015133, "loss": 2.2933, "step": 6862 }, { "epoch": 0.18, "learning_rate": 0.0018775215687970653, "loss": 2.6503, "step": 6863 }, { "epoch": 0.18, "learning_rate": 0.0018774798269446708, "loss": 2.9122, "step": 6864 }, { "epoch": 0.18, "learning_rate": 0.0018774380784446457, "loss": 2.4275, "step": 6865 }, { "epoch": 0.18, "learning_rate": 0.0018773963232973068, "loss": 3.0569, "step": 6866 }, { "epoch": 0.18, "learning_rate": 0.0018773545615029703, "loss": 2.7856, "step": 6867 }, { "epoch": 0.18, "learning_rate": 0.0018773127930619524, "loss": 2.7381, "step": 6868 }, { "epoch": 0.18, "learning_rate": 0.0018772710179745698, "loss": 2.5044, "step": 6869 }, { "epoch": 0.18, "learning_rate": 0.0018772292362411384, "loss": 3.1572, "step": 6870 }, { "epoch": 0.18, "learning_rate": 0.0018771874478619758, "loss": 2.7819, "step": 6871 }, { "epoch": 0.18, "learning_rate": 0.0018771456528373974, "loss": 2.6891, "step": 6872 }, { "epoch": 0.18, "learning_rate": 0.0018771038511677205, "loss": 2.6036, "step": 6873 }, { "epoch": 0.18, "learning_rate": 0.0018770620428532616, "loss": 2.7398, "step": 6874 }, { "epoch": 0.18, "learning_rate": 0.0018770202278943376, "loss": 2.7011, "step": 6875 }, { "epoch": 0.18, "learning_rate": 0.001876978406291265, "loss": 2.503, "step": 6876 }, { "epoch": 0.18, "learning_rate": 0.001876936578044361, "loss": 2.7661, "step": 6877 }, { "epoch": 0.18, "learning_rate": 0.001876894743153942, "loss": 2.6535, "step": 6878 }, { "epoch": 0.18, "learning_rate": 0.0018768529016203253, "loss": 2.6058, "step": 6879 }, { "epoch": 0.18, "learning_rate": 0.0018768110534438276, "loss": 2.7238, "step": 6880 }, { "epoch": 0.18, "learning_rate": 0.0018767691986247663, "loss": 2.3639, "step": 6881 }, { "epoch": 0.18, "learning_rate": 0.0018767273371634583, "loss": 2.5473, "step": 6882 }, { "epoch": 0.18, "learning_rate": 0.0018766854690602211, "loss": 2.5811, "step": 6883 }, { "epoch": 0.18, "learning_rate": 0.0018766435943153711, "loss": 2.9082, "step": 6884 }, { "epoch": 0.19, "learning_rate": 0.001876601712929226, "loss": 2.9244, "step": 6885 }, { "epoch": 0.19, "learning_rate": 0.0018765598249021029, "loss": 2.626, "step": 6886 }, { "epoch": 0.19, "learning_rate": 0.0018765179302343196, "loss": 2.2177, "step": 6887 }, { "epoch": 0.19, "learning_rate": 0.0018764760289261928, "loss": 2.5141, "step": 6888 }, { "epoch": 0.19, "learning_rate": 0.0018764341209780407, "loss": 2.9325, "step": 6889 }, { "epoch": 0.19, "learning_rate": 0.00187639220639018, "loss": 2.7548, "step": 6890 }, { "epoch": 0.19, "learning_rate": 0.001876350285162929, "loss": 2.982, "step": 6891 }, { "epoch": 0.19, "learning_rate": 0.0018763083572966046, "loss": 2.7495, "step": 6892 }, { "epoch": 0.19, "learning_rate": 0.0018762664227915252, "loss": 2.6873, "step": 6893 }, { "epoch": 0.19, "learning_rate": 0.0018762244816480078, "loss": 2.4716, "step": 6894 }, { "epoch": 0.19, "learning_rate": 0.0018761825338663703, "loss": 2.5317, "step": 6895 }, { "epoch": 0.19, "learning_rate": 0.0018761405794469306, "loss": 2.7686, "step": 6896 }, { "epoch": 0.19, "learning_rate": 0.0018760986183900066, "loss": 2.875, "step": 6897 }, { "epoch": 0.19, "learning_rate": 0.001876056650695916, "loss": 2.2528, "step": 6898 }, { "epoch": 0.19, "learning_rate": 0.0018760146763649767, "loss": 2.7665, "step": 6899 }, { "epoch": 0.19, "learning_rate": 0.0018759726953975072, "loss": 2.7558, "step": 6900 }, { "epoch": 0.19, "learning_rate": 0.001875930707793825, "loss": 2.8686, "step": 6901 }, { "epoch": 0.19, "learning_rate": 0.0018758887135542483, "loss": 2.7472, "step": 6902 }, { "epoch": 0.19, "learning_rate": 0.001875846712679095, "loss": 2.7761, "step": 6903 }, { "epoch": 0.19, "learning_rate": 0.0018758047051686839, "loss": 2.8896, "step": 6904 }, { "epoch": 0.19, "learning_rate": 0.0018757626910233332, "loss": 2.5877, "step": 6905 }, { "epoch": 0.19, "learning_rate": 0.0018757206702433606, "loss": 2.5834, "step": 6906 }, { "epoch": 0.19, "learning_rate": 0.0018756786428290849, "loss": 2.623, "step": 6907 }, { "epoch": 0.19, "learning_rate": 0.0018756366087808241, "loss": 2.4236, "step": 6908 }, { "epoch": 0.19, "learning_rate": 0.0018755945680988973, "loss": 2.8035, "step": 6909 }, { "epoch": 0.19, "learning_rate": 0.0018755525207836223, "loss": 2.8113, "step": 6910 }, { "epoch": 0.19, "learning_rate": 0.001875510466835318, "loss": 2.7431, "step": 6911 }, { "epoch": 0.19, "learning_rate": 0.001875468406254303, "loss": 2.6937, "step": 6912 }, { "epoch": 0.19, "learning_rate": 0.001875426339040896, "loss": 2.3386, "step": 6913 }, { "epoch": 0.19, "learning_rate": 0.0018753842651954152, "loss": 2.6763, "step": 6914 }, { "epoch": 0.19, "learning_rate": 0.0018753421847181797, "loss": 2.5802, "step": 6915 }, { "epoch": 0.19, "learning_rate": 0.0018753000976095087, "loss": 2.7215, "step": 6916 }, { "epoch": 0.19, "learning_rate": 0.0018752580038697204, "loss": 2.9097, "step": 6917 }, { "epoch": 0.19, "learning_rate": 0.001875215903499134, "loss": 2.7606, "step": 6918 }, { "epoch": 0.19, "learning_rate": 0.0018751737964980684, "loss": 2.9562, "step": 6919 }, { "epoch": 0.19, "learning_rate": 0.0018751316828668426, "loss": 2.4742, "step": 6920 }, { "epoch": 0.19, "learning_rate": 0.0018750895626057755, "loss": 2.4325, "step": 6921 }, { "epoch": 0.19, "learning_rate": 0.0018750474357151865, "loss": 2.8807, "step": 6922 }, { "epoch": 0.19, "learning_rate": 0.0018750053021953945, "loss": 2.6643, "step": 6923 }, { "epoch": 0.19, "learning_rate": 0.0018749631620467188, "loss": 2.6844, "step": 6924 }, { "epoch": 0.19, "learning_rate": 0.0018749210152694787, "loss": 2.839, "step": 6925 }, { "epoch": 0.19, "learning_rate": 0.0018748788618639931, "loss": 2.7283, "step": 6926 }, { "epoch": 0.19, "learning_rate": 0.0018748367018305819, "loss": 2.9349, "step": 6927 }, { "epoch": 0.19, "learning_rate": 0.0018747945351695644, "loss": 2.6845, "step": 6928 }, { "epoch": 0.19, "learning_rate": 0.0018747523618812597, "loss": 2.6141, "step": 6929 }, { "epoch": 0.19, "learning_rate": 0.0018747101819659873, "loss": 3.0167, "step": 6930 }, { "epoch": 0.19, "learning_rate": 0.0018746679954240674, "loss": 2.6592, "step": 6931 }, { "epoch": 0.19, "learning_rate": 0.0018746258022558186, "loss": 2.5915, "step": 6932 }, { "epoch": 0.19, "learning_rate": 0.0018745836024615615, "loss": 2.8359, "step": 6933 }, { "epoch": 0.19, "learning_rate": 0.001874541396041615, "loss": 2.4557, "step": 6934 }, { "epoch": 0.19, "learning_rate": 0.0018744991829962997, "loss": 2.6767, "step": 6935 }, { "epoch": 0.19, "learning_rate": 0.0018744569633259347, "loss": 2.441, "step": 6936 }, { "epoch": 0.19, "learning_rate": 0.0018744147370308402, "loss": 2.4732, "step": 6937 }, { "epoch": 0.19, "learning_rate": 0.001874372504111336, "loss": 2.6592, "step": 6938 }, { "epoch": 0.19, "learning_rate": 0.0018743302645677419, "loss": 2.642, "step": 6939 }, { "epoch": 0.19, "learning_rate": 0.0018742880184003778, "loss": 2.6069, "step": 6940 }, { "epoch": 0.19, "learning_rate": 0.0018742457656095643, "loss": 2.4993, "step": 6941 }, { "epoch": 0.19, "learning_rate": 0.001874203506195621, "loss": 2.8556, "step": 6942 }, { "epoch": 0.19, "learning_rate": 0.0018741612401588685, "loss": 2.8746, "step": 6943 }, { "epoch": 0.19, "learning_rate": 0.0018741189674996266, "loss": 2.6739, "step": 6944 }, { "epoch": 0.19, "learning_rate": 0.0018740766882182158, "loss": 2.8074, "step": 6945 }, { "epoch": 0.19, "learning_rate": 0.001874034402314956, "loss": 2.9218, "step": 6946 }, { "epoch": 0.19, "learning_rate": 0.001873992109790168, "loss": 2.6481, "step": 6947 }, { "epoch": 0.19, "learning_rate": 0.0018739498106441722, "loss": 2.9379, "step": 6948 }, { "epoch": 0.19, "learning_rate": 0.0018739075048772884, "loss": 2.5522, "step": 6949 }, { "epoch": 0.19, "learning_rate": 0.001873865192489838, "loss": 2.6716, "step": 6950 }, { "epoch": 0.19, "learning_rate": 0.001873822873482141, "loss": 2.3308, "step": 6951 }, { "epoch": 0.19, "learning_rate": 0.0018737805478545183, "loss": 2.6359, "step": 6952 }, { "epoch": 0.19, "learning_rate": 0.0018737382156072903, "loss": 2.198, "step": 6953 }, { "epoch": 0.19, "learning_rate": 0.0018736958767407775, "loss": 2.8573, "step": 6954 }, { "epoch": 0.19, "learning_rate": 0.0018736535312553011, "loss": 2.9541, "step": 6955 }, { "epoch": 0.19, "learning_rate": 0.0018736111791511818, "loss": 2.487, "step": 6956 }, { "epoch": 0.19, "learning_rate": 0.0018735688204287407, "loss": 2.6565, "step": 6957 }, { "epoch": 0.19, "learning_rate": 0.0018735264550882977, "loss": 2.7171, "step": 6958 }, { "epoch": 0.19, "learning_rate": 0.0018734840831301752, "loss": 2.7585, "step": 6959 }, { "epoch": 0.19, "learning_rate": 0.001873441704554693, "loss": 2.6477, "step": 6960 }, { "epoch": 0.19, "learning_rate": 0.0018733993193621725, "loss": 2.8524, "step": 6961 }, { "epoch": 0.19, "learning_rate": 0.0018733569275529351, "loss": 2.8541, "step": 6962 }, { "epoch": 0.19, "learning_rate": 0.0018733145291273017, "loss": 2.5541, "step": 6963 }, { "epoch": 0.19, "learning_rate": 0.0018732721240855938, "loss": 2.6713, "step": 6964 }, { "epoch": 0.19, "learning_rate": 0.0018732297124281322, "loss": 2.8027, "step": 6965 }, { "epoch": 0.19, "learning_rate": 0.0018731872941552385, "loss": 2.5334, "step": 6966 }, { "epoch": 0.19, "learning_rate": 0.0018731448692672337, "loss": 2.4491, "step": 6967 }, { "epoch": 0.19, "learning_rate": 0.00187310243776444, "loss": 2.8597, "step": 6968 }, { "epoch": 0.19, "learning_rate": 0.001873059999647178, "loss": 2.7658, "step": 6969 }, { "epoch": 0.19, "learning_rate": 0.0018730175549157694, "loss": 2.7471, "step": 6970 }, { "epoch": 0.19, "learning_rate": 0.001872975103570536, "loss": 2.7024, "step": 6971 }, { "epoch": 0.19, "learning_rate": 0.0018729326456117994, "loss": 2.9378, "step": 6972 }, { "epoch": 0.19, "learning_rate": 0.001872890181039881, "loss": 2.4865, "step": 6973 }, { "epoch": 0.19, "learning_rate": 0.0018728477098551028, "loss": 2.6474, "step": 6974 }, { "epoch": 0.19, "learning_rate": 0.0018728052320577864, "loss": 2.4656, "step": 6975 }, { "epoch": 0.19, "learning_rate": 0.0018727627476482535, "loss": 2.9532, "step": 6976 }, { "epoch": 0.19, "learning_rate": 0.001872720256626826, "loss": 2.5202, "step": 6977 }, { "epoch": 0.19, "learning_rate": 0.001872677758993826, "loss": 2.768, "step": 6978 }, { "epoch": 0.19, "learning_rate": 0.0018726352547495753, "loss": 2.8259, "step": 6979 }, { "epoch": 0.19, "learning_rate": 0.001872592743894396, "loss": 2.913, "step": 6980 }, { "epoch": 0.19, "learning_rate": 0.0018725502264286098, "loss": 2.6404, "step": 6981 }, { "epoch": 0.19, "learning_rate": 0.0018725077023525394, "loss": 2.7109, "step": 6982 }, { "epoch": 0.19, "learning_rate": 0.0018724651716665063, "loss": 2.8845, "step": 6983 }, { "epoch": 0.19, "learning_rate": 0.0018724226343708333, "loss": 2.6734, "step": 6984 }, { "epoch": 0.19, "learning_rate": 0.0018723800904658422, "loss": 2.7708, "step": 6985 }, { "epoch": 0.19, "learning_rate": 0.0018723375399518555, "loss": 2.4996, "step": 6986 }, { "epoch": 0.19, "learning_rate": 0.0018722949828291959, "loss": 2.9402, "step": 6987 }, { "epoch": 0.19, "learning_rate": 0.001872252419098185, "loss": 2.5894, "step": 6988 }, { "epoch": 0.19, "learning_rate": 0.0018722098487591462, "loss": 2.7694, "step": 6989 }, { "epoch": 0.19, "learning_rate": 0.0018721672718124012, "loss": 3.172, "step": 6990 }, { "epoch": 0.19, "learning_rate": 0.001872124688258273, "loss": 2.6344, "step": 6991 }, { "epoch": 0.19, "learning_rate": 0.001872082098097084, "loss": 2.5504, "step": 6992 }, { "epoch": 0.19, "learning_rate": 0.0018720395013291568, "loss": 2.7793, "step": 6993 }, { "epoch": 0.19, "learning_rate": 0.0018719968979548148, "loss": 2.5929, "step": 6994 }, { "epoch": 0.19, "learning_rate": 0.0018719542879743797, "loss": 2.6154, "step": 6995 }, { "epoch": 0.19, "learning_rate": 0.0018719116713881748, "loss": 2.7526, "step": 6996 }, { "epoch": 0.19, "learning_rate": 0.0018718690481965231, "loss": 2.5363, "step": 6997 }, { "epoch": 0.19, "learning_rate": 0.0018718264183997474, "loss": 2.9341, "step": 6998 }, { "epoch": 0.19, "learning_rate": 0.0018717837819981708, "loss": 2.8683, "step": 6999 }, { "epoch": 0.19, "learning_rate": 0.0018717411389921157, "loss": 2.4094, "step": 7000 }, { "epoch": 0.19, "learning_rate": 0.0018716984893819059, "loss": 2.6114, "step": 7001 }, { "epoch": 0.19, "learning_rate": 0.001871655833167864, "loss": 3.0339, "step": 7002 }, { "epoch": 0.19, "learning_rate": 0.0018716131703503133, "loss": 2.7076, "step": 7003 }, { "epoch": 0.19, "learning_rate": 0.0018715705009295772, "loss": 2.7841, "step": 7004 }, { "epoch": 0.19, "learning_rate": 0.0018715278249059788, "loss": 2.6395, "step": 7005 }, { "epoch": 0.19, "learning_rate": 0.0018714851422798415, "loss": 2.402, "step": 7006 }, { "epoch": 0.19, "learning_rate": 0.0018714424530514883, "loss": 2.6134, "step": 7007 }, { "epoch": 0.19, "learning_rate": 0.0018713997572212431, "loss": 2.5696, "step": 7008 }, { "epoch": 0.19, "learning_rate": 0.0018713570547894292, "loss": 2.5584, "step": 7009 }, { "epoch": 0.19, "learning_rate": 0.0018713143457563697, "loss": 2.6446, "step": 7010 }, { "epoch": 0.19, "learning_rate": 0.0018712716301223886, "loss": 2.8171, "step": 7011 }, { "epoch": 0.19, "learning_rate": 0.0018712289078878098, "loss": 2.4614, "step": 7012 }, { "epoch": 0.19, "learning_rate": 0.0018711861790529562, "loss": 2.4424, "step": 7013 }, { "epoch": 0.19, "learning_rate": 0.001871143443618152, "loss": 2.1095, "step": 7014 }, { "epoch": 0.19, "learning_rate": 0.0018711007015837207, "loss": 2.6359, "step": 7015 }, { "epoch": 0.19, "learning_rate": 0.001871057952949986, "loss": 1.8327, "step": 7016 }, { "epoch": 0.19, "learning_rate": 0.0018710151977172724, "loss": 2.5172, "step": 7017 }, { "epoch": 0.19, "learning_rate": 0.0018709724358859034, "loss": 2.6066, "step": 7018 }, { "epoch": 0.19, "learning_rate": 0.0018709296674562026, "loss": 2.8365, "step": 7019 }, { "epoch": 0.19, "learning_rate": 0.0018708868924284946, "loss": 2.8624, "step": 7020 }, { "epoch": 0.19, "learning_rate": 0.0018708441108031032, "loss": 2.7321, "step": 7021 }, { "epoch": 0.19, "learning_rate": 0.0018708013225803522, "loss": 2.6975, "step": 7022 }, { "epoch": 0.19, "learning_rate": 0.0018707585277605663, "loss": 2.6085, "step": 7023 }, { "epoch": 0.19, "learning_rate": 0.0018707157263440695, "loss": 2.4629, "step": 7024 }, { "epoch": 0.19, "learning_rate": 0.0018706729183311861, "loss": 2.6364, "step": 7025 }, { "epoch": 0.19, "learning_rate": 0.0018706301037222399, "loss": 2.8985, "step": 7026 }, { "epoch": 0.19, "learning_rate": 0.001870587282517556, "loss": 2.4605, "step": 7027 }, { "epoch": 0.19, "learning_rate": 0.0018705444547174586, "loss": 2.6618, "step": 7028 }, { "epoch": 0.19, "learning_rate": 0.001870501620322272, "loss": 2.5141, "step": 7029 }, { "epoch": 0.19, "learning_rate": 0.0018704587793323207, "loss": 2.6952, "step": 7030 }, { "epoch": 0.19, "learning_rate": 0.0018704159317479295, "loss": 2.1568, "step": 7031 }, { "epoch": 0.19, "learning_rate": 0.0018703730775694223, "loss": 2.9799, "step": 7032 }, { "epoch": 0.19, "learning_rate": 0.0018703302167971249, "loss": 2.5388, "step": 7033 }, { "epoch": 0.19, "learning_rate": 0.001870287349431361, "loss": 2.7955, "step": 7034 }, { "epoch": 0.19, "learning_rate": 0.0018702444754724558, "loss": 2.6976, "step": 7035 }, { "epoch": 0.19, "learning_rate": 0.001870201594920734, "loss": 2.8112, "step": 7036 }, { "epoch": 0.19, "learning_rate": 0.0018701587077765206, "loss": 2.3551, "step": 7037 }, { "epoch": 0.19, "learning_rate": 0.0018701158140401405, "loss": 2.6027, "step": 7038 }, { "epoch": 0.19, "learning_rate": 0.0018700729137119182, "loss": 2.5375, "step": 7039 }, { "epoch": 0.19, "learning_rate": 0.0018700300067921792, "loss": 2.8644, "step": 7040 }, { "epoch": 0.19, "learning_rate": 0.0018699870932812486, "loss": 2.8276, "step": 7041 }, { "epoch": 0.19, "learning_rate": 0.0018699441731794512, "loss": 2.339, "step": 7042 }, { "epoch": 0.19, "learning_rate": 0.0018699012464871122, "loss": 2.5273, "step": 7043 }, { "epoch": 0.19, "learning_rate": 0.0018698583132045568, "loss": 2.7791, "step": 7044 }, { "epoch": 0.19, "learning_rate": 0.0018698153733321106, "loss": 2.4865, "step": 7045 }, { "epoch": 0.19, "learning_rate": 0.0018697724268700985, "loss": 2.693, "step": 7046 }, { "epoch": 0.19, "learning_rate": 0.001869729473818846, "loss": 2.6732, "step": 7047 }, { "epoch": 0.19, "learning_rate": 0.0018696865141786785, "loss": 2.5925, "step": 7048 }, { "epoch": 0.19, "learning_rate": 0.0018696435479499214, "loss": 2.6236, "step": 7049 }, { "epoch": 0.19, "learning_rate": 0.0018696005751329006, "loss": 2.9054, "step": 7050 }, { "epoch": 0.19, "learning_rate": 0.001869557595727941, "loss": 2.8662, "step": 7051 }, { "epoch": 0.19, "learning_rate": 0.0018695146097353686, "loss": 2.4507, "step": 7052 }, { "epoch": 0.19, "learning_rate": 0.001869471617155509, "loss": 2.7597, "step": 7053 }, { "epoch": 0.19, "learning_rate": 0.0018694286179886876, "loss": 2.9228, "step": 7054 }, { "epoch": 0.19, "learning_rate": 0.001869385612235231, "loss": 2.5059, "step": 7055 }, { "epoch": 0.19, "learning_rate": 0.0018693425998954636, "loss": 2.6457, "step": 7056 }, { "epoch": 0.19, "learning_rate": 0.0018692995809697127, "loss": 2.8817, "step": 7057 }, { "epoch": 0.19, "learning_rate": 0.0018692565554583034, "loss": 2.9157, "step": 7058 }, { "epoch": 0.19, "learning_rate": 0.001869213523361562, "loss": 2.6161, "step": 7059 }, { "epoch": 0.19, "learning_rate": 0.0018691704846798142, "loss": 2.222, "step": 7060 }, { "epoch": 0.19, "learning_rate": 0.0018691274394133863, "loss": 2.3319, "step": 7061 }, { "epoch": 0.19, "learning_rate": 0.0018690843875626042, "loss": 2.885, "step": 7062 }, { "epoch": 0.19, "learning_rate": 0.0018690413291277941, "loss": 2.2993, "step": 7063 }, { "epoch": 0.19, "learning_rate": 0.0018689982641092824, "loss": 2.5582, "step": 7064 }, { "epoch": 0.19, "learning_rate": 0.0018689551925073953, "loss": 2.5266, "step": 7065 }, { "epoch": 0.19, "learning_rate": 0.001868912114322459, "loss": 2.8306, "step": 7066 }, { "epoch": 0.19, "learning_rate": 0.0018688690295547996, "loss": 1.9914, "step": 7067 }, { "epoch": 0.19, "learning_rate": 0.0018688259382047439, "loss": 2.7644, "step": 7068 }, { "epoch": 0.19, "learning_rate": 0.0018687828402726185, "loss": 2.6304, "step": 7069 }, { "epoch": 0.19, "learning_rate": 0.0018687397357587492, "loss": 2.5384, "step": 7070 }, { "epoch": 0.19, "learning_rate": 0.001868696624663463, "loss": 2.7942, "step": 7071 }, { "epoch": 0.19, "learning_rate": 0.0018686535069870867, "loss": 2.5136, "step": 7072 }, { "epoch": 0.19, "learning_rate": 0.0018686103827299468, "loss": 2.3932, "step": 7073 }, { "epoch": 0.19, "learning_rate": 0.0018685672518923698, "loss": 2.0363, "step": 7074 }, { "epoch": 0.19, "learning_rate": 0.0018685241144746824, "loss": 2.5464, "step": 7075 }, { "epoch": 0.19, "learning_rate": 0.0018684809704772119, "loss": 2.5934, "step": 7076 }, { "epoch": 0.19, "learning_rate": 0.0018684378199002847, "loss": 2.7303, "step": 7077 }, { "epoch": 0.19, "learning_rate": 0.0018683946627442278, "loss": 2.4375, "step": 7078 }, { "epoch": 0.19, "learning_rate": 0.0018683514990093684, "loss": 2.4271, "step": 7079 }, { "epoch": 0.19, "learning_rate": 0.0018683083286960332, "loss": 2.8031, "step": 7080 }, { "epoch": 0.19, "learning_rate": 0.0018682651518045492, "loss": 2.8564, "step": 7081 }, { "epoch": 0.19, "learning_rate": 0.0018682219683352438, "loss": 2.4501, "step": 7082 }, { "epoch": 0.19, "learning_rate": 0.0018681787782884437, "loss": 2.9111, "step": 7083 }, { "epoch": 0.19, "learning_rate": 0.0018681355816644767, "loss": 3.0675, "step": 7084 }, { "epoch": 0.19, "learning_rate": 0.0018680923784636697, "loss": 2.6192, "step": 7085 }, { "epoch": 0.19, "learning_rate": 0.00186804916868635, "loss": 2.7128, "step": 7086 }, { "epoch": 0.19, "learning_rate": 0.001868005952332845, "loss": 2.796, "step": 7087 }, { "epoch": 0.19, "learning_rate": 0.001867962729403482, "loss": 2.4929, "step": 7088 }, { "epoch": 0.19, "learning_rate": 0.0018679194998985887, "loss": 2.832, "step": 7089 }, { "epoch": 0.19, "learning_rate": 0.0018678762638184923, "loss": 2.9936, "step": 7090 }, { "epoch": 0.19, "learning_rate": 0.0018678330211635203, "loss": 2.6012, "step": 7091 }, { "epoch": 0.19, "learning_rate": 0.001867789771934001, "loss": 2.2868, "step": 7092 }, { "epoch": 0.19, "learning_rate": 0.0018677465161302611, "loss": 2.2458, "step": 7093 }, { "epoch": 0.19, "learning_rate": 0.0018677032537526288, "loss": 2.6683, "step": 7094 }, { "epoch": 0.19, "learning_rate": 0.001867659984801432, "loss": 2.6222, "step": 7095 }, { "epoch": 0.19, "learning_rate": 0.001867616709276998, "loss": 2.5861, "step": 7096 }, { "epoch": 0.19, "learning_rate": 0.0018675734271796553, "loss": 2.3016, "step": 7097 }, { "epoch": 0.19, "learning_rate": 0.001867530138509731, "loss": 2.3529, "step": 7098 }, { "epoch": 0.19, "learning_rate": 0.0018674868432675539, "loss": 2.4726, "step": 7099 }, { "epoch": 0.19, "learning_rate": 0.0018674435414534512, "loss": 2.7974, "step": 7100 }, { "epoch": 0.19, "learning_rate": 0.0018674002330677513, "loss": 2.5842, "step": 7101 }, { "epoch": 0.19, "learning_rate": 0.0018673569181107826, "loss": 2.9763, "step": 7102 }, { "epoch": 0.19, "learning_rate": 0.0018673135965828727, "loss": 2.7293, "step": 7103 }, { "epoch": 0.19, "learning_rate": 0.0018672702684843503, "loss": 2.8112, "step": 7104 }, { "epoch": 0.19, "learning_rate": 0.0018672269338155432, "loss": 2.2679, "step": 7105 }, { "epoch": 0.19, "learning_rate": 0.0018671835925767799, "loss": 2.8997, "step": 7106 }, { "epoch": 0.19, "learning_rate": 0.001867140244768389, "loss": 2.5057, "step": 7107 }, { "epoch": 0.19, "learning_rate": 0.0018670968903906982, "loss": 2.5329, "step": 7108 }, { "epoch": 0.19, "learning_rate": 0.0018670535294440368, "loss": 2.4515, "step": 7109 }, { "epoch": 0.19, "learning_rate": 0.0018670101619287327, "loss": 2.658, "step": 7110 }, { "epoch": 0.19, "learning_rate": 0.0018669667878451147, "loss": 2.9894, "step": 7111 }, { "epoch": 0.19, "learning_rate": 0.001866923407193511, "loss": 2.5355, "step": 7112 }, { "epoch": 0.19, "learning_rate": 0.0018668800199742508, "loss": 2.5869, "step": 7113 }, { "epoch": 0.19, "learning_rate": 0.0018668366261876627, "loss": 2.8374, "step": 7114 }, { "epoch": 0.19, "learning_rate": 0.001866793225834075, "loss": 2.6994, "step": 7115 }, { "epoch": 0.19, "learning_rate": 0.001866749818913817, "loss": 2.776, "step": 7116 }, { "epoch": 0.19, "learning_rate": 0.001866706405427217, "loss": 2.9094, "step": 7117 }, { "epoch": 0.19, "learning_rate": 0.0018666629853746047, "loss": 2.8936, "step": 7118 }, { "epoch": 0.19, "learning_rate": 0.0018666195587563085, "loss": 2.8216, "step": 7119 }, { "epoch": 0.19, "learning_rate": 0.001866576125572657, "loss": 2.6159, "step": 7120 }, { "epoch": 0.19, "learning_rate": 0.0018665326858239802, "loss": 2.3995, "step": 7121 }, { "epoch": 0.19, "learning_rate": 0.0018664892395106065, "loss": 2.4872, "step": 7122 }, { "epoch": 0.19, "learning_rate": 0.0018664457866328652, "loss": 2.9972, "step": 7123 }, { "epoch": 0.19, "learning_rate": 0.0018664023271910857, "loss": 2.5236, "step": 7124 }, { "epoch": 0.19, "learning_rate": 0.0018663588611855966, "loss": 2.5525, "step": 7125 }, { "epoch": 0.19, "learning_rate": 0.0018663153886167283, "loss": 2.0496, "step": 7126 }, { "epoch": 0.19, "learning_rate": 0.0018662719094848092, "loss": 2.679, "step": 7127 }, { "epoch": 0.19, "learning_rate": 0.0018662284237901687, "loss": 2.8293, "step": 7128 }, { "epoch": 0.19, "learning_rate": 0.001866184931533137, "loss": 2.6746, "step": 7129 }, { "epoch": 0.19, "learning_rate": 0.0018661414327140427, "loss": 2.9483, "step": 7130 }, { "epoch": 0.19, "learning_rate": 0.0018660979273332162, "loss": 2.0842, "step": 7131 }, { "epoch": 0.19, "learning_rate": 0.0018660544153909864, "loss": 2.4918, "step": 7132 }, { "epoch": 0.19, "learning_rate": 0.001866010896887683, "loss": 2.735, "step": 7133 }, { "epoch": 0.19, "learning_rate": 0.0018659673718236364, "loss": 2.2604, "step": 7134 }, { "epoch": 0.19, "learning_rate": 0.0018659238401991752, "loss": 2.6853, "step": 7135 }, { "epoch": 0.19, "learning_rate": 0.0018658803020146304, "loss": 2.6762, "step": 7136 }, { "epoch": 0.19, "learning_rate": 0.0018658367572703307, "loss": 2.5107, "step": 7137 }, { "epoch": 0.19, "learning_rate": 0.001865793205966607, "loss": 2.7588, "step": 7138 }, { "epoch": 0.19, "learning_rate": 0.0018657496481037884, "loss": 2.885, "step": 7139 }, { "epoch": 0.19, "learning_rate": 0.0018657060836822052, "loss": 3.2986, "step": 7140 }, { "epoch": 0.19, "learning_rate": 0.0018656625127021877, "loss": 2.6142, "step": 7141 }, { "epoch": 0.19, "learning_rate": 0.0018656189351640659, "loss": 2.6246, "step": 7142 }, { "epoch": 0.19, "learning_rate": 0.0018655753510681695, "loss": 2.3536, "step": 7143 }, { "epoch": 0.19, "learning_rate": 0.0018655317604148291, "loss": 2.6629, "step": 7144 }, { "epoch": 0.19, "learning_rate": 0.001865488163204375, "loss": 2.236, "step": 7145 }, { "epoch": 0.19, "learning_rate": 0.001865444559437137, "loss": 2.8301, "step": 7146 }, { "epoch": 0.19, "learning_rate": 0.0018654009491134457, "loss": 2.2456, "step": 7147 }, { "epoch": 0.19, "learning_rate": 0.0018653573322336319, "loss": 2.7096, "step": 7148 }, { "epoch": 0.19, "learning_rate": 0.0018653137087980257, "loss": 2.4368, "step": 7149 }, { "epoch": 0.19, "learning_rate": 0.0018652700788069573, "loss": 2.6233, "step": 7150 }, { "epoch": 0.19, "learning_rate": 0.0018652264422607573, "loss": 2.7457, "step": 7151 }, { "epoch": 0.19, "learning_rate": 0.0018651827991597568, "loss": 2.6295, "step": 7152 }, { "epoch": 0.19, "learning_rate": 0.001865139149504286, "loss": 2.74, "step": 7153 }, { "epoch": 0.19, "learning_rate": 0.0018650954932946755, "loss": 2.588, "step": 7154 }, { "epoch": 0.19, "learning_rate": 0.0018650518305312566, "loss": 2.2074, "step": 7155 }, { "epoch": 0.19, "learning_rate": 0.0018650081612143592, "loss": 3.0087, "step": 7156 }, { "epoch": 0.19, "learning_rate": 0.0018649644853443149, "loss": 2.6537, "step": 7157 }, { "epoch": 0.19, "learning_rate": 0.001864920802921454, "loss": 2.5418, "step": 7158 }, { "epoch": 0.19, "learning_rate": 0.0018648771139461082, "loss": 2.7806, "step": 7159 }, { "epoch": 0.19, "learning_rate": 0.0018648334184186077, "loss": 2.4809, "step": 7160 }, { "epoch": 0.19, "learning_rate": 0.001864789716339284, "loss": 2.6914, "step": 7161 }, { "epoch": 0.19, "learning_rate": 0.001864746007708468, "loss": 2.4471, "step": 7162 }, { "epoch": 0.19, "learning_rate": 0.0018647022925264909, "loss": 2.996, "step": 7163 }, { "epoch": 0.19, "learning_rate": 0.0018646585707936835, "loss": 2.326, "step": 7164 }, { "epoch": 0.19, "learning_rate": 0.0018646148425103778, "loss": 2.242, "step": 7165 }, { "epoch": 0.19, "learning_rate": 0.0018645711076769045, "loss": 2.5836, "step": 7166 }, { "epoch": 0.19, "learning_rate": 0.0018645273662935948, "loss": 2.734, "step": 7167 }, { "epoch": 0.19, "learning_rate": 0.0018644836183607804, "loss": 3.0842, "step": 7168 }, { "epoch": 0.19, "learning_rate": 0.001864439863878793, "loss": 2.4735, "step": 7169 }, { "epoch": 0.19, "learning_rate": 0.0018643961028479634, "loss": 2.5308, "step": 7170 }, { "epoch": 0.19, "learning_rate": 0.0018643523352686235, "loss": 2.6565, "step": 7171 }, { "epoch": 0.19, "learning_rate": 0.001864308561141105, "loss": 2.5326, "step": 7172 }, { "epoch": 0.19, "learning_rate": 0.0018642647804657394, "loss": 2.7251, "step": 7173 }, { "epoch": 0.19, "learning_rate": 0.0018642209932428582, "loss": 2.7409, "step": 7174 }, { "epoch": 0.19, "learning_rate": 0.0018641771994727932, "loss": 2.6472, "step": 7175 }, { "epoch": 0.19, "learning_rate": 0.0018641333991558761, "loss": 2.3577, "step": 7176 }, { "epoch": 0.19, "learning_rate": 0.0018640895922924395, "loss": 2.8379, "step": 7177 }, { "epoch": 0.19, "learning_rate": 0.001864045778882814, "loss": 2.4238, "step": 7178 }, { "epoch": 0.19, "learning_rate": 0.0018640019589273322, "loss": 2.7193, "step": 7179 }, { "epoch": 0.19, "learning_rate": 0.0018639581324263264, "loss": 2.8032, "step": 7180 }, { "epoch": 0.19, "learning_rate": 0.001863914299380128, "loss": 2.9356, "step": 7181 }, { "epoch": 0.19, "learning_rate": 0.0018638704597890693, "loss": 2.4463, "step": 7182 }, { "epoch": 0.19, "learning_rate": 0.0018638266136534827, "loss": 2.5305, "step": 7183 }, { "epoch": 0.19, "learning_rate": 0.0018637827609736999, "loss": 3.0429, "step": 7184 }, { "epoch": 0.19, "learning_rate": 0.0018637389017500535, "loss": 3.1152, "step": 7185 }, { "epoch": 0.19, "learning_rate": 0.0018636950359828752, "loss": 2.5773, "step": 7186 }, { "epoch": 0.19, "learning_rate": 0.001863651163672498, "loss": 2.6559, "step": 7187 }, { "epoch": 0.19, "learning_rate": 0.001863607284819254, "loss": 2.5946, "step": 7188 }, { "epoch": 0.19, "learning_rate": 0.0018635633994234758, "loss": 2.4739, "step": 7189 }, { "epoch": 0.19, "learning_rate": 0.0018635195074854951, "loss": 2.4577, "step": 7190 }, { "epoch": 0.19, "learning_rate": 0.0018634756090056455, "loss": 2.9541, "step": 7191 }, { "epoch": 0.19, "learning_rate": 0.001863431703984259, "loss": 3.203, "step": 7192 }, { "epoch": 0.19, "learning_rate": 0.0018633877924216682, "loss": 2.4498, "step": 7193 }, { "epoch": 0.19, "learning_rate": 0.0018633438743182059, "loss": 2.3043, "step": 7194 }, { "epoch": 0.19, "learning_rate": 0.0018632999496742046, "loss": 2.7737, "step": 7195 }, { "epoch": 0.19, "learning_rate": 0.0018632560184899973, "loss": 2.8688, "step": 7196 }, { "epoch": 0.19, "learning_rate": 0.0018632120807659167, "loss": 3.0481, "step": 7197 }, { "epoch": 0.19, "learning_rate": 0.0018631681365022957, "loss": 2.5526, "step": 7198 }, { "epoch": 0.19, "learning_rate": 0.0018631241856994674, "loss": 2.895, "step": 7199 }, { "epoch": 0.19, "learning_rate": 0.0018630802283577644, "loss": 2.3986, "step": 7200 }, { "epoch": 0.19, "learning_rate": 0.00186303626447752, "loss": 2.65, "step": 7201 }, { "epoch": 0.19, "learning_rate": 0.0018629922940590672, "loss": 3.1163, "step": 7202 }, { "epoch": 0.19, "learning_rate": 0.001862948317102739, "loss": 2.2459, "step": 7203 }, { "epoch": 0.19, "learning_rate": 0.0018629043336088685, "loss": 2.7851, "step": 7204 }, { "epoch": 0.19, "learning_rate": 0.0018628603435777893, "loss": 2.1595, "step": 7205 }, { "epoch": 0.19, "learning_rate": 0.0018628163470098343, "loss": 2.4984, "step": 7206 }, { "epoch": 0.19, "learning_rate": 0.0018627723439053369, "loss": 2.9556, "step": 7207 }, { "epoch": 0.19, "learning_rate": 0.0018627283342646304, "loss": 2.5147, "step": 7208 }, { "epoch": 0.19, "learning_rate": 0.0018626843180880482, "loss": 2.7633, "step": 7209 }, { "epoch": 0.19, "learning_rate": 0.001862640295375924, "loss": 2.7061, "step": 7210 }, { "epoch": 0.19, "learning_rate": 0.0018625962661285912, "loss": 2.9839, "step": 7211 }, { "epoch": 0.19, "learning_rate": 0.0018625522303463832, "loss": 2.5371, "step": 7212 }, { "epoch": 0.19, "learning_rate": 0.0018625081880296334, "loss": 2.5311, "step": 7213 }, { "epoch": 0.19, "learning_rate": 0.0018624641391786763, "loss": 2.8168, "step": 7214 }, { "epoch": 0.19, "learning_rate": 0.001862420083793845, "loss": 2.7664, "step": 7215 }, { "epoch": 0.19, "learning_rate": 0.001862376021875473, "loss": 2.4654, "step": 7216 }, { "epoch": 0.19, "learning_rate": 0.0018623319534238948, "loss": 2.402, "step": 7217 }, { "epoch": 0.19, "learning_rate": 0.0018622878784394436, "loss": 2.3809, "step": 7218 }, { "epoch": 0.19, "learning_rate": 0.0018622437969224538, "loss": 2.6657, "step": 7219 }, { "epoch": 0.19, "learning_rate": 0.0018621997088732588, "loss": 2.4471, "step": 7220 }, { "epoch": 0.19, "learning_rate": 0.0018621556142921936, "loss": 2.6122, "step": 7221 }, { "epoch": 0.19, "learning_rate": 0.001862111513179591, "loss": 3.2066, "step": 7222 }, { "epoch": 0.19, "learning_rate": 0.001862067405535786, "loss": 2.5204, "step": 7223 }, { "epoch": 0.19, "learning_rate": 0.0018620232913611123, "loss": 2.4177, "step": 7224 }, { "epoch": 0.19, "learning_rate": 0.0018619791706559045, "loss": 2.8561, "step": 7225 }, { "epoch": 0.19, "learning_rate": 0.0018619350434204965, "loss": 2.6668, "step": 7226 }, { "epoch": 0.19, "learning_rate": 0.0018618909096552226, "loss": 2.6153, "step": 7227 }, { "epoch": 0.19, "learning_rate": 0.0018618467693604175, "loss": 2.6186, "step": 7228 }, { "epoch": 0.19, "learning_rate": 0.001861802622536415, "loss": 2.5666, "step": 7229 }, { "epoch": 0.19, "learning_rate": 0.0018617584691835503, "loss": 2.8108, "step": 7230 }, { "epoch": 0.19, "learning_rate": 0.0018617143093021574, "loss": 2.4296, "step": 7231 }, { "epoch": 0.19, "learning_rate": 0.0018616701428925706, "loss": 2.3546, "step": 7232 }, { "epoch": 0.19, "learning_rate": 0.0018616259699551253, "loss": 2.6424, "step": 7233 }, { "epoch": 0.19, "learning_rate": 0.0018615817904901553, "loss": 2.5572, "step": 7234 }, { "epoch": 0.19, "learning_rate": 0.0018615376044979958, "loss": 2.9517, "step": 7235 }, { "epoch": 0.19, "learning_rate": 0.0018614934119789816, "loss": 2.9366, "step": 7236 }, { "epoch": 0.19, "learning_rate": 0.0018614492129334472, "loss": 2.5532, "step": 7237 }, { "epoch": 0.19, "learning_rate": 0.0018614050073617278, "loss": 2.6842, "step": 7238 }, { "epoch": 0.19, "learning_rate": 0.001861360795264158, "loss": 2.4388, "step": 7239 }, { "epoch": 0.19, "learning_rate": 0.0018613165766410726, "loss": 3.0378, "step": 7240 }, { "epoch": 0.19, "learning_rate": 0.0018612723514928068, "loss": 2.8929, "step": 7241 }, { "epoch": 0.19, "learning_rate": 0.0018612281198196962, "loss": 2.967, "step": 7242 }, { "epoch": 0.19, "learning_rate": 0.0018611838816220748, "loss": 2.4513, "step": 7243 }, { "epoch": 0.19, "learning_rate": 0.0018611396369002783, "loss": 2.3505, "step": 7244 }, { "epoch": 0.19, "learning_rate": 0.001861095385654642, "loss": 2.7352, "step": 7245 }, { "epoch": 0.19, "learning_rate": 0.0018610511278855009, "loss": 2.3047, "step": 7246 }, { "epoch": 0.19, "learning_rate": 0.0018610068635931906, "loss": 2.5177, "step": 7247 }, { "epoch": 0.19, "learning_rate": 0.0018609625927780461, "loss": 2.8295, "step": 7248 }, { "epoch": 0.19, "learning_rate": 0.001860918315440403, "loss": 2.5124, "step": 7249 }, { "epoch": 0.19, "learning_rate": 0.0018608740315805964, "loss": 2.7123, "step": 7250 }, { "epoch": 0.19, "learning_rate": 0.0018608297411989623, "loss": 2.6082, "step": 7251 }, { "epoch": 0.19, "learning_rate": 0.0018607854442958358, "loss": 2.3252, "step": 7252 }, { "epoch": 0.19, "learning_rate": 0.0018607411408715529, "loss": 2.5853, "step": 7253 }, { "epoch": 0.19, "learning_rate": 0.001860696830926449, "loss": 2.5114, "step": 7254 }, { "epoch": 0.19, "learning_rate": 0.0018606525144608595, "loss": 2.9335, "step": 7255 }, { "epoch": 0.19, "learning_rate": 0.0018606081914751206, "loss": 2.5722, "step": 7256 }, { "epoch": 0.2, "learning_rate": 0.0018605638619695677, "loss": 2.4851, "step": 7257 }, { "epoch": 0.2, "learning_rate": 0.0018605195259445374, "loss": 2.8148, "step": 7258 }, { "epoch": 0.2, "learning_rate": 0.0018604751834003644, "loss": 2.5521, "step": 7259 }, { "epoch": 0.2, "learning_rate": 0.0018604308343373854, "loss": 2.419, "step": 7260 }, { "epoch": 0.2, "learning_rate": 0.0018603864787559363, "loss": 3.1597, "step": 7261 }, { "epoch": 0.2, "learning_rate": 0.0018603421166563533, "loss": 2.8183, "step": 7262 }, { "epoch": 0.2, "learning_rate": 0.001860297748038972, "loss": 2.6565, "step": 7263 }, { "epoch": 0.2, "learning_rate": 0.0018602533729041289, "loss": 2.852, "step": 7264 }, { "epoch": 0.2, "learning_rate": 0.0018602089912521601, "loss": 2.6159, "step": 7265 }, { "epoch": 0.2, "learning_rate": 0.0018601646030834014, "loss": 2.7501, "step": 7266 }, { "epoch": 0.2, "learning_rate": 0.0018601202083981896, "loss": 2.7856, "step": 7267 }, { "epoch": 0.2, "learning_rate": 0.001860075807196861, "loss": 2.6049, "step": 7268 }, { "epoch": 0.2, "learning_rate": 0.0018600313994797518, "loss": 2.3009, "step": 7269 }, { "epoch": 0.2, "learning_rate": 0.0018599869852471984, "loss": 2.7838, "step": 7270 }, { "epoch": 0.2, "learning_rate": 0.0018599425644995377, "loss": 2.9652, "step": 7271 }, { "epoch": 0.2, "learning_rate": 0.0018598981372371054, "loss": 2.3167, "step": 7272 }, { "epoch": 0.2, "learning_rate": 0.0018598537034602387, "loss": 2.747, "step": 7273 }, { "epoch": 0.2, "learning_rate": 0.0018598092631692742, "loss": 2.6717, "step": 7274 }, { "epoch": 0.2, "learning_rate": 0.001859764816364548, "loss": 2.8264, "step": 7275 }, { "epoch": 0.2, "learning_rate": 0.0018597203630463979, "loss": 2.529, "step": 7276 }, { "epoch": 0.2, "learning_rate": 0.0018596759032151599, "loss": 2.7015, "step": 7277 }, { "epoch": 0.2, "learning_rate": 0.0018596314368711706, "loss": 2.5064, "step": 7278 }, { "epoch": 0.2, "learning_rate": 0.0018595869640147674, "loss": 2.1959, "step": 7279 }, { "epoch": 0.2, "learning_rate": 0.0018595424846462871, "loss": 2.4461, "step": 7280 }, { "epoch": 0.2, "learning_rate": 0.0018594979987660665, "loss": 2.4855, "step": 7281 }, { "epoch": 0.2, "learning_rate": 0.0018594535063744429, "loss": 2.6256, "step": 7282 }, { "epoch": 0.2, "learning_rate": 0.001859409007471753, "loss": 2.9134, "step": 7283 }, { "epoch": 0.2, "learning_rate": 0.0018593645020583342, "loss": 3.2655, "step": 7284 }, { "epoch": 0.2, "learning_rate": 0.0018593199901345238, "loss": 2.7023, "step": 7285 }, { "epoch": 0.2, "learning_rate": 0.0018592754717006584, "loss": 2.6166, "step": 7286 }, { "epoch": 0.2, "learning_rate": 0.0018592309467570759, "loss": 2.3426, "step": 7287 }, { "epoch": 0.2, "learning_rate": 0.0018591864153041132, "loss": 2.4475, "step": 7288 }, { "epoch": 0.2, "learning_rate": 0.001859141877342108, "loss": 2.601, "step": 7289 }, { "epoch": 0.2, "learning_rate": 0.0018590973328713974, "loss": 2.4366, "step": 7290 }, { "epoch": 0.2, "learning_rate": 0.001859052781892319, "loss": 2.8057, "step": 7291 }, { "epoch": 0.2, "learning_rate": 0.0018590082244052102, "loss": 2.6423, "step": 7292 }, { "epoch": 0.2, "learning_rate": 0.001858963660410409, "loss": 2.3907, "step": 7293 }, { "epoch": 0.2, "learning_rate": 0.0018589190899082524, "loss": 2.602, "step": 7294 }, { "epoch": 0.2, "learning_rate": 0.0018588745128990784, "loss": 2.6851, "step": 7295 }, { "epoch": 0.2, "learning_rate": 0.0018588299293832247, "loss": 2.5917, "step": 7296 }, { "epoch": 0.2, "learning_rate": 0.001858785339361029, "loss": 2.4717, "step": 7297 }, { "epoch": 0.2, "learning_rate": 0.001858740742832829, "loss": 2.6137, "step": 7298 }, { "epoch": 0.2, "learning_rate": 0.0018586961397989627, "loss": 2.9478, "step": 7299 }, { "epoch": 0.2, "learning_rate": 0.001858651530259768, "loss": 2.5683, "step": 7300 }, { "epoch": 0.2, "learning_rate": 0.0018586069142155829, "loss": 2.7304, "step": 7301 }, { "epoch": 0.2, "learning_rate": 0.001858562291666745, "loss": 2.6817, "step": 7302 }, { "epoch": 0.2, "learning_rate": 0.0018585176626135932, "loss": 2.148, "step": 7303 }, { "epoch": 0.2, "learning_rate": 0.0018584730270564647, "loss": 2.4229, "step": 7304 }, { "epoch": 0.2, "learning_rate": 0.001858428384995698, "loss": 2.5327, "step": 7305 }, { "epoch": 0.2, "learning_rate": 0.0018583837364316315, "loss": 2.4963, "step": 7306 }, { "epoch": 0.2, "learning_rate": 0.0018583390813646033, "loss": 2.4541, "step": 7307 }, { "epoch": 0.2, "learning_rate": 0.0018582944197949515, "loss": 2.2945, "step": 7308 }, { "epoch": 0.2, "learning_rate": 0.0018582497517230148, "loss": 2.8662, "step": 7309 }, { "epoch": 0.2, "learning_rate": 0.0018582050771491314, "loss": 2.6505, "step": 7310 }, { "epoch": 0.2, "learning_rate": 0.0018581603960736398, "loss": 2.6186, "step": 7311 }, { "epoch": 0.2, "learning_rate": 0.0018581157084968784, "loss": 2.8724, "step": 7312 }, { "epoch": 0.2, "learning_rate": 0.0018580710144191857, "loss": 2.615, "step": 7313 }, { "epoch": 0.2, "learning_rate": 0.0018580263138409004, "loss": 2.5406, "step": 7314 }, { "epoch": 0.2, "learning_rate": 0.0018579816067623614, "loss": 2.9314, "step": 7315 }, { "epoch": 0.2, "learning_rate": 0.001857936893183907, "loss": 2.4369, "step": 7316 }, { "epoch": 0.2, "learning_rate": 0.001857892173105876, "loss": 2.2771, "step": 7317 }, { "epoch": 0.2, "learning_rate": 0.001857847446528607, "loss": 2.5142, "step": 7318 }, { "epoch": 0.2, "learning_rate": 0.0018578027134524397, "loss": 2.5022, "step": 7319 }, { "epoch": 0.2, "learning_rate": 0.0018577579738777122, "loss": 2.6693, "step": 7320 }, { "epoch": 0.2, "learning_rate": 0.0018577132278047635, "loss": 2.8398, "step": 7321 }, { "epoch": 0.2, "learning_rate": 0.0018576684752339328, "loss": 2.3943, "step": 7322 }, { "epoch": 0.2, "learning_rate": 0.0018576237161655592, "loss": 2.5748, "step": 7323 }, { "epoch": 0.2, "learning_rate": 0.0018575789505999817, "loss": 2.8163, "step": 7324 }, { "epoch": 0.2, "learning_rate": 0.001857534178537539, "loss": 2.5379, "step": 7325 }, { "epoch": 0.2, "learning_rate": 0.0018574893999785708, "loss": 2.4129, "step": 7326 }, { "epoch": 0.2, "learning_rate": 0.0018574446149234164, "loss": 3.2646, "step": 7327 }, { "epoch": 0.2, "learning_rate": 0.0018573998233724148, "loss": 2.6319, "step": 7328 }, { "epoch": 0.2, "learning_rate": 0.0018573550253259054, "loss": 2.4309, "step": 7329 }, { "epoch": 0.2, "learning_rate": 0.0018573102207842277, "loss": 2.6686, "step": 7330 }, { "epoch": 0.2, "learning_rate": 0.001857265409747721, "loss": 2.4896, "step": 7331 }, { "epoch": 0.2, "learning_rate": 0.0018572205922167248, "loss": 2.6593, "step": 7332 }, { "epoch": 0.2, "learning_rate": 0.0018571757681915787, "loss": 2.4494, "step": 7333 }, { "epoch": 0.2, "learning_rate": 0.0018571309376726223, "loss": 2.5883, "step": 7334 }, { "epoch": 0.2, "learning_rate": 0.001857086100660195, "loss": 2.6647, "step": 7335 }, { "epoch": 0.2, "learning_rate": 0.0018570412571546364, "loss": 2.8696, "step": 7336 }, { "epoch": 0.2, "learning_rate": 0.001856996407156287, "loss": 2.5852, "step": 7337 }, { "epoch": 0.2, "learning_rate": 0.0018569515506654858, "loss": 2.5841, "step": 7338 }, { "epoch": 0.2, "learning_rate": 0.0018569066876825727, "loss": 2.2525, "step": 7339 }, { "epoch": 0.2, "learning_rate": 0.001856861818207888, "loss": 2.7493, "step": 7340 }, { "epoch": 0.2, "learning_rate": 0.0018568169422417712, "loss": 2.5522, "step": 7341 }, { "epoch": 0.2, "learning_rate": 0.0018567720597845625, "loss": 2.3847, "step": 7342 }, { "epoch": 0.2, "learning_rate": 0.0018567271708366017, "loss": 2.8257, "step": 7343 }, { "epoch": 0.2, "learning_rate": 0.0018566822753982293, "loss": 2.8239, "step": 7344 }, { "epoch": 0.2, "learning_rate": 0.001856637373469785, "loss": 2.8002, "step": 7345 }, { "epoch": 0.2, "learning_rate": 0.0018565924650516088, "loss": 2.7458, "step": 7346 }, { "epoch": 0.2, "learning_rate": 0.001856547550144042, "loss": 2.506, "step": 7347 }, { "epoch": 0.2, "learning_rate": 0.0018565026287474234, "loss": 2.7146, "step": 7348 }, { "epoch": 0.2, "learning_rate": 0.0018564577008620942, "loss": 2.5787, "step": 7349 }, { "epoch": 0.2, "learning_rate": 0.0018564127664883944, "loss": 2.4994, "step": 7350 }, { "epoch": 0.2, "learning_rate": 0.001856367825626665, "loss": 2.9422, "step": 7351 }, { "epoch": 0.2, "learning_rate": 0.001856322878277246, "loss": 2.5013, "step": 7352 }, { "epoch": 0.2, "learning_rate": 0.0018562779244404774, "loss": 2.3021, "step": 7353 }, { "epoch": 0.2, "learning_rate": 0.0018562329641167012, "loss": 2.4614, "step": 7354 }, { "epoch": 0.2, "learning_rate": 0.0018561879973062565, "loss": 2.4447, "step": 7355 }, { "epoch": 0.2, "learning_rate": 0.001856143024009485, "loss": 2.9202, "step": 7356 }, { "epoch": 0.2, "learning_rate": 0.0018560980442267265, "loss": 2.3766, "step": 7357 }, { "epoch": 0.2, "learning_rate": 0.001856053057958323, "loss": 2.9316, "step": 7358 }, { "epoch": 0.2, "learning_rate": 0.0018560080652046138, "loss": 2.6864, "step": 7359 }, { "epoch": 0.2, "learning_rate": 0.001855963065965941, "loss": 2.6682, "step": 7360 }, { "epoch": 0.2, "learning_rate": 0.001855918060242645, "loss": 2.5605, "step": 7361 }, { "epoch": 0.2, "learning_rate": 0.0018558730480350667, "loss": 2.6795, "step": 7362 }, { "epoch": 0.2, "learning_rate": 0.0018558280293435475, "loss": 2.2885, "step": 7363 }, { "epoch": 0.2, "learning_rate": 0.0018557830041684275, "loss": 2.7552, "step": 7364 }, { "epoch": 0.2, "learning_rate": 0.001855737972510049, "loss": 2.85, "step": 7365 }, { "epoch": 0.2, "learning_rate": 0.0018556929343687524, "loss": 2.3686, "step": 7366 }, { "epoch": 0.2, "learning_rate": 0.0018556478897448793, "loss": 2.7697, "step": 7367 }, { "epoch": 0.2, "learning_rate": 0.0018556028386387707, "loss": 2.4749, "step": 7368 }, { "epoch": 0.2, "learning_rate": 0.001855557781050768, "loss": 2.9861, "step": 7369 }, { "epoch": 0.2, "learning_rate": 0.0018555127169812122, "loss": 2.2943, "step": 7370 }, { "epoch": 0.2, "learning_rate": 0.0018554676464304456, "loss": 2.8932, "step": 7371 }, { "epoch": 0.2, "learning_rate": 0.0018554225693988085, "loss": 2.4116, "step": 7372 }, { "epoch": 0.2, "learning_rate": 0.0018553774858866433, "loss": 2.522, "step": 7373 }, { "epoch": 0.2, "learning_rate": 0.001855332395894291, "loss": 2.4021, "step": 7374 }, { "epoch": 0.2, "learning_rate": 0.0018552872994220934, "loss": 2.3668, "step": 7375 }, { "epoch": 0.2, "learning_rate": 0.001855242196470392, "loss": 2.567, "step": 7376 }, { "epoch": 0.2, "learning_rate": 0.0018551970870395288, "loss": 2.9803, "step": 7377 }, { "epoch": 0.2, "learning_rate": 0.0018551519711298454, "loss": 2.6331, "step": 7378 }, { "epoch": 0.2, "learning_rate": 0.0018551068487416835, "loss": 2.5192, "step": 7379 }, { "epoch": 0.2, "learning_rate": 0.0018550617198753853, "loss": 2.9228, "step": 7380 }, { "epoch": 0.2, "learning_rate": 0.0018550165845312918, "loss": 2.7652, "step": 7381 }, { "epoch": 0.2, "learning_rate": 0.0018549714427097458, "loss": 2.4122, "step": 7382 }, { "epoch": 0.2, "learning_rate": 0.0018549262944110893, "loss": 2.6783, "step": 7383 }, { "epoch": 0.2, "learning_rate": 0.0018548811396356636, "loss": 2.5798, "step": 7384 }, { "epoch": 0.2, "learning_rate": 0.0018548359783838115, "loss": 2.4822, "step": 7385 }, { "epoch": 0.2, "learning_rate": 0.0018547908106558745, "loss": 2.8606, "step": 7386 }, { "epoch": 0.2, "learning_rate": 0.0018547456364521953, "loss": 2.6401, "step": 7387 }, { "epoch": 0.2, "learning_rate": 0.001854700455773116, "loss": 2.7397, "step": 7388 }, { "epoch": 0.2, "learning_rate": 0.0018546552686189788, "loss": 2.7538, "step": 7389 }, { "epoch": 0.2, "learning_rate": 0.0018546100749901263, "loss": 2.5972, "step": 7390 }, { "epoch": 0.2, "learning_rate": 0.0018545648748869007, "loss": 2.4954, "step": 7391 }, { "epoch": 0.2, "learning_rate": 0.0018545196683096442, "loss": 2.7776, "step": 7392 }, { "epoch": 0.2, "learning_rate": 0.0018544744552586995, "loss": 2.4543, "step": 7393 }, { "epoch": 0.2, "learning_rate": 0.001854429235734409, "loss": 2.6623, "step": 7394 }, { "epoch": 0.2, "learning_rate": 0.0018543840097371153, "loss": 2.8705, "step": 7395 }, { "epoch": 0.2, "learning_rate": 0.0018543387772671613, "loss": 2.9028, "step": 7396 }, { "epoch": 0.2, "learning_rate": 0.0018542935383248894, "loss": 2.6707, "step": 7397 }, { "epoch": 0.2, "learning_rate": 0.0018542482929106425, "loss": 2.7046, "step": 7398 }, { "epoch": 0.2, "learning_rate": 0.0018542030410247632, "loss": 2.5324, "step": 7399 }, { "epoch": 0.2, "learning_rate": 0.001854157782667594, "loss": 2.8068, "step": 7400 }, { "epoch": 0.2, "learning_rate": 0.0018541125178394788, "loss": 2.9663, "step": 7401 }, { "epoch": 0.2, "learning_rate": 0.0018540672465407596, "loss": 2.4365, "step": 7402 }, { "epoch": 0.2, "learning_rate": 0.0018540219687717793, "loss": 2.7345, "step": 7403 }, { "epoch": 0.2, "learning_rate": 0.0018539766845328816, "loss": 2.4508, "step": 7404 }, { "epoch": 0.2, "learning_rate": 0.0018539313938244094, "loss": 2.6246, "step": 7405 }, { "epoch": 0.2, "learning_rate": 0.001853886096646705, "loss": 2.6856, "step": 7406 }, { "epoch": 0.2, "learning_rate": 0.0018538407930001127, "loss": 2.6767, "step": 7407 }, { "epoch": 0.2, "learning_rate": 0.001853795482884975, "loss": 2.9071, "step": 7408 }, { "epoch": 0.2, "learning_rate": 0.0018537501663016354, "loss": 2.9032, "step": 7409 }, { "epoch": 0.2, "learning_rate": 0.0018537048432504372, "loss": 2.6746, "step": 7410 }, { "epoch": 0.2, "learning_rate": 0.0018536595137317237, "loss": 2.5671, "step": 7411 }, { "epoch": 0.2, "learning_rate": 0.0018536141777458384, "loss": 2.5512, "step": 7412 }, { "epoch": 0.2, "learning_rate": 0.001853568835293125, "loss": 2.5945, "step": 7413 }, { "epoch": 0.2, "learning_rate": 0.001853523486373926, "loss": 2.7885, "step": 7414 }, { "epoch": 0.2, "learning_rate": 0.0018534781309885863, "loss": 3.0031, "step": 7415 }, { "epoch": 0.2, "learning_rate": 0.0018534327691374485, "loss": 2.5421, "step": 7416 }, { "epoch": 0.2, "learning_rate": 0.001853387400820857, "loss": 3.1892, "step": 7417 }, { "epoch": 0.2, "learning_rate": 0.001853342026039155, "loss": 3.0585, "step": 7418 }, { "epoch": 0.2, "learning_rate": 0.001853296644792686, "loss": 2.8686, "step": 7419 }, { "epoch": 0.2, "learning_rate": 0.0018532512570817944, "loss": 2.9142, "step": 7420 }, { "epoch": 0.2, "learning_rate": 0.0018532058629068238, "loss": 2.7342, "step": 7421 }, { "epoch": 0.2, "learning_rate": 0.0018531604622681183, "loss": 2.1919, "step": 7422 }, { "epoch": 0.2, "learning_rate": 0.0018531150551660215, "loss": 3.1722, "step": 7423 }, { "epoch": 0.2, "learning_rate": 0.0018530696416008774, "loss": 3.101, "step": 7424 }, { "epoch": 0.2, "learning_rate": 0.0018530242215730305, "loss": 2.5152, "step": 7425 }, { "epoch": 0.2, "learning_rate": 0.0018529787950828248, "loss": 2.6611, "step": 7426 }, { "epoch": 0.2, "learning_rate": 0.0018529333621306037, "loss": 2.8223, "step": 7427 }, { "epoch": 0.2, "learning_rate": 0.0018528879227167124, "loss": 3.0686, "step": 7428 }, { "epoch": 0.2, "learning_rate": 0.0018528424768414942, "loss": 2.4031, "step": 7429 }, { "epoch": 0.2, "learning_rate": 0.001852797024505294, "loss": 2.3826, "step": 7430 }, { "epoch": 0.2, "learning_rate": 0.0018527515657084563, "loss": 2.9996, "step": 7431 }, { "epoch": 0.2, "learning_rate": 0.001852706100451325, "loss": 2.5847, "step": 7432 }, { "epoch": 0.2, "learning_rate": 0.001852660628734245, "loss": 2.6042, "step": 7433 }, { "epoch": 0.2, "learning_rate": 0.0018526151505575603, "loss": 2.8262, "step": 7434 }, { "epoch": 0.2, "learning_rate": 0.0018525696659216157, "loss": 2.742, "step": 7435 }, { "epoch": 0.2, "learning_rate": 0.0018525241748267556, "loss": 2.6808, "step": 7436 }, { "epoch": 0.2, "learning_rate": 0.001852478677273325, "loss": 2.7714, "step": 7437 }, { "epoch": 0.2, "learning_rate": 0.0018524331732616682, "loss": 2.4081, "step": 7438 }, { "epoch": 0.2, "learning_rate": 0.0018523876627921298, "loss": 2.6589, "step": 7439 }, { "epoch": 0.2, "learning_rate": 0.0018523421458650554, "loss": 2.2823, "step": 7440 }, { "epoch": 0.2, "learning_rate": 0.001852296622480789, "loss": 3.057, "step": 7441 }, { "epoch": 0.2, "learning_rate": 0.0018522510926396757, "loss": 2.6355, "step": 7442 }, { "epoch": 0.2, "learning_rate": 0.0018522055563420605, "loss": 2.4331, "step": 7443 }, { "epoch": 0.2, "learning_rate": 0.0018521600135882885, "loss": 2.8701, "step": 7444 }, { "epoch": 0.2, "learning_rate": 0.0018521144643787047, "loss": 2.7054, "step": 7445 }, { "epoch": 0.2, "learning_rate": 0.0018520689087136537, "loss": 2.8536, "step": 7446 }, { "epoch": 0.2, "learning_rate": 0.0018520233465934813, "loss": 2.7631, "step": 7447 }, { "epoch": 0.2, "learning_rate": 0.001851977778018532, "loss": 2.6271, "step": 7448 }, { "epoch": 0.2, "learning_rate": 0.0018519322029891519, "loss": 2.7381, "step": 7449 }, { "epoch": 0.2, "learning_rate": 0.0018518866215056853, "loss": 2.7218, "step": 7450 }, { "epoch": 0.2, "learning_rate": 0.0018518410335684782, "loss": 2.8197, "step": 7451 }, { "epoch": 0.2, "learning_rate": 0.0018517954391778755, "loss": 2.8652, "step": 7452 }, { "epoch": 0.2, "learning_rate": 0.0018517498383342232, "loss": 2.587, "step": 7453 }, { "epoch": 0.2, "learning_rate": 0.001851704231037866, "loss": 2.6232, "step": 7454 }, { "epoch": 0.2, "learning_rate": 0.00185165861728915, "loss": 2.5425, "step": 7455 }, { "epoch": 0.2, "learning_rate": 0.0018516129970884206, "loss": 2.177, "step": 7456 }, { "epoch": 0.2, "learning_rate": 0.0018515673704360234, "loss": 2.3824, "step": 7457 }, { "epoch": 0.2, "learning_rate": 0.001851521737332304, "loss": 2.9437, "step": 7458 }, { "epoch": 0.2, "learning_rate": 0.0018514760977776082, "loss": 2.4877, "step": 7459 }, { "epoch": 0.2, "learning_rate": 0.0018514304517722815, "loss": 2.7758, "step": 7460 }, { "epoch": 0.2, "learning_rate": 0.0018513847993166703, "loss": 2.7551, "step": 7461 }, { "epoch": 0.2, "learning_rate": 0.00185133914041112, "loss": 2.6697, "step": 7462 }, { "epoch": 0.2, "learning_rate": 0.0018512934750559765, "loss": 2.6683, "step": 7463 }, { "epoch": 0.2, "learning_rate": 0.0018512478032515856, "loss": 2.7168, "step": 7464 }, { "epoch": 0.2, "learning_rate": 0.0018512021249982938, "loss": 2.0982, "step": 7465 }, { "epoch": 0.2, "learning_rate": 0.0018511564402964467, "loss": 2.534, "step": 7466 }, { "epoch": 0.2, "learning_rate": 0.0018511107491463905, "loss": 2.4339, "step": 7467 }, { "epoch": 0.2, "learning_rate": 0.0018510650515484717, "loss": 2.4459, "step": 7468 }, { "epoch": 0.2, "learning_rate": 0.001851019347503036, "loss": 2.4901, "step": 7469 }, { "epoch": 0.2, "learning_rate": 0.0018509736370104302, "loss": 2.2981, "step": 7470 }, { "epoch": 0.2, "learning_rate": 0.0018509279200710003, "loss": 2.8498, "step": 7471 }, { "epoch": 0.2, "learning_rate": 0.0018508821966850921, "loss": 2.6039, "step": 7472 }, { "epoch": 0.2, "learning_rate": 0.0018508364668530528, "loss": 2.5139, "step": 7473 }, { "epoch": 0.2, "learning_rate": 0.0018507907305752287, "loss": 2.4896, "step": 7474 }, { "epoch": 0.2, "learning_rate": 0.0018507449878519657, "loss": 2.073, "step": 7475 }, { "epoch": 0.2, "learning_rate": 0.0018506992386836112, "loss": 2.779, "step": 7476 }, { "epoch": 0.2, "learning_rate": 0.0018506534830705112, "loss": 2.6171, "step": 7477 }, { "epoch": 0.2, "learning_rate": 0.0018506077210130123, "loss": 2.9571, "step": 7478 }, { "epoch": 0.2, "learning_rate": 0.0018505619525114615, "loss": 2.5349, "step": 7479 }, { "epoch": 0.2, "learning_rate": 0.0018505161775662056, "loss": 2.5948, "step": 7480 }, { "epoch": 0.2, "learning_rate": 0.001850470396177591, "loss": 2.8213, "step": 7481 }, { "epoch": 0.2, "learning_rate": 0.001850424608345965, "loss": 2.5476, "step": 7482 }, { "epoch": 0.2, "learning_rate": 0.0018503788140716737, "loss": 2.5217, "step": 7483 }, { "epoch": 0.2, "learning_rate": 0.0018503330133550651, "loss": 2.4236, "step": 7484 }, { "epoch": 0.2, "learning_rate": 0.0018502872061964852, "loss": 2.7735, "step": 7485 }, { "epoch": 0.2, "learning_rate": 0.0018502413925962817, "loss": 2.7441, "step": 7486 }, { "epoch": 0.2, "learning_rate": 0.001850195572554801, "loss": 3.1923, "step": 7487 }, { "epoch": 0.2, "learning_rate": 0.0018501497460723913, "loss": 2.2716, "step": 7488 }, { "epoch": 0.2, "learning_rate": 0.0018501039131493986, "loss": 2.907, "step": 7489 }, { "epoch": 0.2, "learning_rate": 0.0018500580737861709, "loss": 2.5046, "step": 7490 }, { "epoch": 0.2, "learning_rate": 0.0018500122279830552, "loss": 2.7821, "step": 7491 }, { "epoch": 0.2, "learning_rate": 0.0018499663757403986, "loss": 2.5996, "step": 7492 }, { "epoch": 0.2, "learning_rate": 0.0018499205170585489, "loss": 2.0974, "step": 7493 }, { "epoch": 0.2, "learning_rate": 0.0018498746519378534, "loss": 2.6094, "step": 7494 }, { "epoch": 0.2, "learning_rate": 0.0018498287803786592, "loss": 2.4846, "step": 7495 }, { "epoch": 0.2, "learning_rate": 0.0018497829023813143, "loss": 2.5721, "step": 7496 }, { "epoch": 0.2, "learning_rate": 0.0018497370179461662, "loss": 2.6874, "step": 7497 }, { "epoch": 0.2, "learning_rate": 0.0018496911270735618, "loss": 2.8283, "step": 7498 }, { "epoch": 0.2, "learning_rate": 0.00184964522976385, "loss": 2.655, "step": 7499 }, { "epoch": 0.2, "learning_rate": 0.0018495993260173775, "loss": 2.8835, "step": 7500 }, { "epoch": 0.2, "learning_rate": 0.0018495534158344924, "loss": 2.5779, "step": 7501 }, { "epoch": 0.2, "learning_rate": 0.0018495074992155428, "loss": 2.9727, "step": 7502 }, { "epoch": 0.2, "learning_rate": 0.0018494615761608757, "loss": 2.3796, "step": 7503 }, { "epoch": 0.2, "learning_rate": 0.00184941564667084, "loss": 2.2766, "step": 7504 }, { "epoch": 0.2, "learning_rate": 0.001849369710745783, "loss": 2.4885, "step": 7505 }, { "epoch": 0.2, "learning_rate": 0.001849323768386053, "loss": 2.5581, "step": 7506 }, { "epoch": 0.2, "learning_rate": 0.001849277819591998, "loss": 2.6648, "step": 7507 }, { "epoch": 0.2, "learning_rate": 0.0018492318643639663, "loss": 2.5287, "step": 7508 }, { "epoch": 0.2, "learning_rate": 0.0018491859027023056, "loss": 2.6371, "step": 7509 }, { "epoch": 0.2, "learning_rate": 0.0018491399346073642, "loss": 2.6431, "step": 7510 }, { "epoch": 0.2, "learning_rate": 0.0018490939600794905, "loss": 2.8951, "step": 7511 }, { "epoch": 0.2, "learning_rate": 0.0018490479791190332, "loss": 2.7064, "step": 7512 }, { "epoch": 0.2, "learning_rate": 0.0018490019917263396, "loss": 2.3739, "step": 7513 }, { "epoch": 0.2, "learning_rate": 0.0018489559979017593, "loss": 2.7937, "step": 7514 }, { "epoch": 0.2, "learning_rate": 0.0018489099976456394, "loss": 2.9807, "step": 7515 }, { "epoch": 0.2, "learning_rate": 0.0018488639909583298, "loss": 2.4372, "step": 7516 }, { "epoch": 0.2, "learning_rate": 0.001848817977840178, "loss": 2.4511, "step": 7517 }, { "epoch": 0.2, "learning_rate": 0.001848771958291533, "loss": 3.5018, "step": 7518 }, { "epoch": 0.2, "learning_rate": 0.0018487259323127433, "loss": 2.3759, "step": 7519 }, { "epoch": 0.2, "learning_rate": 0.0018486798999041581, "loss": 2.7216, "step": 7520 }, { "epoch": 0.2, "learning_rate": 0.0018486338610661252, "loss": 2.4845, "step": 7521 }, { "epoch": 0.2, "learning_rate": 0.0018485878157989942, "loss": 2.6186, "step": 7522 }, { "epoch": 0.2, "learning_rate": 0.0018485417641031135, "loss": 2.7888, "step": 7523 }, { "epoch": 0.2, "learning_rate": 0.0018484957059788322, "loss": 2.5114, "step": 7524 }, { "epoch": 0.2, "learning_rate": 0.001848449641426499, "loss": 2.3975, "step": 7525 }, { "epoch": 0.2, "learning_rate": 0.001848403570446463, "loss": 2.2752, "step": 7526 }, { "epoch": 0.2, "learning_rate": 0.0018483574930390735, "loss": 2.6849, "step": 7527 }, { "epoch": 0.2, "learning_rate": 0.0018483114092046789, "loss": 2.5398, "step": 7528 }, { "epoch": 0.2, "learning_rate": 0.0018482653189436289, "loss": 2.98, "step": 7529 }, { "epoch": 0.2, "learning_rate": 0.0018482192222562725, "loss": 2.1982, "step": 7530 }, { "epoch": 0.2, "learning_rate": 0.0018481731191429592, "loss": 2.3635, "step": 7531 }, { "epoch": 0.2, "learning_rate": 0.0018481270096040376, "loss": 2.4484, "step": 7532 }, { "epoch": 0.2, "learning_rate": 0.0018480808936398576, "loss": 2.6693, "step": 7533 }, { "epoch": 0.2, "learning_rate": 0.0018480347712507682, "loss": 2.8952, "step": 7534 }, { "epoch": 0.2, "learning_rate": 0.001847988642437119, "loss": 2.5896, "step": 7535 }, { "epoch": 0.2, "learning_rate": 0.0018479425071992598, "loss": 2.4815, "step": 7536 }, { "epoch": 0.2, "learning_rate": 0.0018478963655375394, "loss": 2.516, "step": 7537 }, { "epoch": 0.2, "learning_rate": 0.001847850217452308, "loss": 2.5855, "step": 7538 }, { "epoch": 0.2, "learning_rate": 0.0018478040629439146, "loss": 2.8176, "step": 7539 }, { "epoch": 0.2, "learning_rate": 0.0018477579020127095, "loss": 2.7616, "step": 7540 }, { "epoch": 0.2, "learning_rate": 0.0018477117346590419, "loss": 2.4462, "step": 7541 }, { "epoch": 0.2, "learning_rate": 0.0018476655608832618, "loss": 2.5844, "step": 7542 }, { "epoch": 0.2, "learning_rate": 0.001847619380685719, "loss": 2.3874, "step": 7543 }, { "epoch": 0.2, "learning_rate": 0.0018475731940667632, "loss": 2.4604, "step": 7544 }, { "epoch": 0.2, "learning_rate": 0.0018475270010267447, "loss": 2.8105, "step": 7545 }, { "epoch": 0.2, "learning_rate": 0.0018474808015660129, "loss": 2.605, "step": 7546 }, { "epoch": 0.2, "learning_rate": 0.001847434595684918, "loss": 2.5545, "step": 7547 }, { "epoch": 0.2, "learning_rate": 0.0018473883833838105, "loss": 2.8914, "step": 7548 }, { "epoch": 0.2, "learning_rate": 0.0018473421646630398, "loss": 2.6361, "step": 7549 }, { "epoch": 0.2, "learning_rate": 0.0018472959395229563, "loss": 2.7606, "step": 7550 }, { "epoch": 0.2, "learning_rate": 0.0018472497079639104, "loss": 2.491, "step": 7551 }, { "epoch": 0.2, "learning_rate": 0.0018472034699862521, "loss": 2.7533, "step": 7552 }, { "epoch": 0.2, "learning_rate": 0.0018471572255903319, "loss": 3.0652, "step": 7553 }, { "epoch": 0.2, "learning_rate": 0.0018471109747764999, "loss": 2.65, "step": 7554 }, { "epoch": 0.2, "learning_rate": 0.0018470647175451065, "loss": 2.4834, "step": 7555 }, { "epoch": 0.2, "learning_rate": 0.0018470184538965024, "loss": 2.7867, "step": 7556 }, { "epoch": 0.2, "learning_rate": 0.001846972183831038, "loss": 2.9219, "step": 7557 }, { "epoch": 0.2, "learning_rate": 0.0018469259073490636, "loss": 2.2756, "step": 7558 }, { "epoch": 0.2, "learning_rate": 0.00184687962445093, "loss": 2.5403, "step": 7559 }, { "epoch": 0.2, "learning_rate": 0.0018468333351369878, "loss": 2.5493, "step": 7560 }, { "epoch": 0.2, "learning_rate": 0.0018467870394075876, "loss": 3.0286, "step": 7561 }, { "epoch": 0.2, "learning_rate": 0.0018467407372630802, "loss": 3.1112, "step": 7562 }, { "epoch": 0.2, "learning_rate": 0.0018466944287038162, "loss": 2.7905, "step": 7563 }, { "epoch": 0.2, "learning_rate": 0.001846648113730147, "loss": 2.6962, "step": 7564 }, { "epoch": 0.2, "learning_rate": 0.0018466017923424228, "loss": 2.8616, "step": 7565 }, { "epoch": 0.2, "learning_rate": 0.0018465554645409948, "loss": 2.8978, "step": 7566 }, { "epoch": 0.2, "learning_rate": 0.001846509130326214, "loss": 2.6202, "step": 7567 }, { "epoch": 0.2, "learning_rate": 0.001846462789698431, "loss": 2.9158, "step": 7568 }, { "epoch": 0.2, "learning_rate": 0.0018464164426579977, "loss": 2.4449, "step": 7569 }, { "epoch": 0.2, "learning_rate": 0.0018463700892052647, "loss": 2.3269, "step": 7570 }, { "epoch": 0.2, "learning_rate": 0.001846323729340583, "loss": 2.6956, "step": 7571 }, { "epoch": 0.2, "learning_rate": 0.0018462773630643042, "loss": 2.849, "step": 7572 }, { "epoch": 0.2, "learning_rate": 0.0018462309903767794, "loss": 2.7502, "step": 7573 }, { "epoch": 0.2, "learning_rate": 0.0018461846112783598, "loss": 2.4001, "step": 7574 }, { "epoch": 0.2, "learning_rate": 0.0018461382257693969, "loss": 2.3049, "step": 7575 }, { "epoch": 0.2, "learning_rate": 0.0018460918338502421, "loss": 2.6243, "step": 7576 }, { "epoch": 0.2, "learning_rate": 0.0018460454355212468, "loss": 2.7021, "step": 7577 }, { "epoch": 0.2, "learning_rate": 0.0018459990307827625, "loss": 2.4869, "step": 7578 }, { "epoch": 0.2, "learning_rate": 0.001845952619635141, "loss": 2.4787, "step": 7579 }, { "epoch": 0.2, "learning_rate": 0.0018459062020787335, "loss": 2.9271, "step": 7580 }, { "epoch": 0.2, "learning_rate": 0.001845859778113892, "loss": 2.4815, "step": 7581 }, { "epoch": 0.2, "learning_rate": 0.001845813347740968, "loss": 2.6383, "step": 7582 }, { "epoch": 0.2, "learning_rate": 0.0018457669109603132, "loss": 2.6175, "step": 7583 }, { "epoch": 0.2, "learning_rate": 0.0018457204677722796, "loss": 2.7892, "step": 7584 }, { "epoch": 0.2, "learning_rate": 0.001845674018177219, "loss": 2.4332, "step": 7585 }, { "epoch": 0.2, "learning_rate": 0.001845627562175483, "loss": 2.329, "step": 7586 }, { "epoch": 0.2, "learning_rate": 0.001845581099767424, "loss": 2.617, "step": 7587 }, { "epoch": 0.2, "learning_rate": 0.0018455346309533935, "loss": 2.6629, "step": 7588 }, { "epoch": 0.2, "learning_rate": 0.001845488155733744, "loss": 2.449, "step": 7589 }, { "epoch": 0.2, "learning_rate": 0.0018454416741088273, "loss": 2.8116, "step": 7590 }, { "epoch": 0.2, "learning_rate": 0.0018453951860789956, "loss": 2.4107, "step": 7591 }, { "epoch": 0.2, "learning_rate": 0.001845348691644601, "loss": 2.8905, "step": 7592 }, { "epoch": 0.2, "learning_rate": 0.0018453021908059963, "loss": 2.7617, "step": 7593 }, { "epoch": 0.2, "learning_rate": 0.001845255683563533, "loss": 2.3565, "step": 7594 }, { "epoch": 0.2, "learning_rate": 0.001845209169917564, "loss": 2.8001, "step": 7595 }, { "epoch": 0.2, "learning_rate": 0.001845162649868441, "loss": 2.1715, "step": 7596 }, { "epoch": 0.2, "learning_rate": 0.0018451161234165172, "loss": 2.8067, "step": 7597 }, { "epoch": 0.2, "learning_rate": 0.0018450695905621447, "loss": 2.6924, "step": 7598 }, { "epoch": 0.2, "learning_rate": 0.001845023051305676, "loss": 2.5535, "step": 7599 }, { "epoch": 0.2, "learning_rate": 0.001844976505647464, "loss": 2.6545, "step": 7600 }, { "epoch": 0.2, "learning_rate": 0.0018449299535878607, "loss": 2.5422, "step": 7601 }, { "epoch": 0.2, "learning_rate": 0.0018448833951272192, "loss": 2.3627, "step": 7602 }, { "epoch": 0.2, "learning_rate": 0.0018448368302658924, "loss": 2.3086, "step": 7603 }, { "epoch": 0.2, "learning_rate": 0.0018447902590042326, "loss": 2.2152, "step": 7604 }, { "epoch": 0.2, "learning_rate": 0.0018447436813425928, "loss": 2.7361, "step": 7605 }, { "epoch": 0.2, "learning_rate": 0.001844697097281326, "loss": 2.73, "step": 7606 }, { "epoch": 0.2, "learning_rate": 0.001844650506820785, "loss": 2.6743, "step": 7607 }, { "epoch": 0.2, "learning_rate": 0.0018446039099613227, "loss": 2.2551, "step": 7608 }, { "epoch": 0.2, "learning_rate": 0.0018445573067032922, "loss": 2.5273, "step": 7609 }, { "epoch": 0.2, "learning_rate": 0.0018445106970470465, "loss": 2.4378, "step": 7610 }, { "epoch": 0.2, "learning_rate": 0.001844464080992939, "loss": 3.031, "step": 7611 }, { "epoch": 0.2, "learning_rate": 0.0018444174585413222, "loss": 2.7856, "step": 7612 }, { "epoch": 0.2, "learning_rate": 0.0018443708296925498, "loss": 2.7557, "step": 7613 }, { "epoch": 0.2, "learning_rate": 0.001844324194446975, "loss": 2.6017, "step": 7614 }, { "epoch": 0.2, "learning_rate": 0.0018442775528049512, "loss": 2.4078, "step": 7615 }, { "epoch": 0.2, "learning_rate": 0.0018442309047668314, "loss": 3.1118, "step": 7616 }, { "epoch": 0.2, "learning_rate": 0.0018441842503329694, "loss": 2.808, "step": 7617 }, { "epoch": 0.2, "learning_rate": 0.0018441375895037184, "loss": 2.7262, "step": 7618 }, { "epoch": 0.2, "learning_rate": 0.001844090922279432, "loss": 2.4868, "step": 7619 }, { "epoch": 0.2, "learning_rate": 0.0018440442486604635, "loss": 2.931, "step": 7620 }, { "epoch": 0.2, "learning_rate": 0.0018439975686471667, "loss": 2.5223, "step": 7621 }, { "epoch": 0.2, "learning_rate": 0.0018439508822398953, "loss": 2.7194, "step": 7622 }, { "epoch": 0.2, "learning_rate": 0.001843904189439003, "loss": 2.5454, "step": 7623 }, { "epoch": 0.2, "learning_rate": 0.0018438574902448434, "loss": 2.6735, "step": 7624 }, { "epoch": 0.2, "learning_rate": 0.00184381078465777, "loss": 2.5062, "step": 7625 }, { "epoch": 0.2, "learning_rate": 0.001843764072678137, "loss": 2.9036, "step": 7626 }, { "epoch": 0.2, "learning_rate": 0.0018437173543062986, "loss": 2.6564, "step": 7627 }, { "epoch": 0.2, "learning_rate": 0.0018436706295426083, "loss": 2.8405, "step": 7628 }, { "epoch": 0.21, "learning_rate": 0.0018436238983874198, "loss": 3.0596, "step": 7629 }, { "epoch": 0.21, "learning_rate": 0.0018435771608410877, "loss": 2.6158, "step": 7630 }, { "epoch": 0.21, "learning_rate": 0.001843530416903966, "loss": 2.5121, "step": 7631 }, { "epoch": 0.21, "learning_rate": 0.0018434836665764084, "loss": 3.0886, "step": 7632 }, { "epoch": 0.21, "learning_rate": 0.0018434369098587694, "loss": 2.6261, "step": 7633 }, { "epoch": 0.21, "learning_rate": 0.0018433901467514034, "loss": 2.4672, "step": 7634 }, { "epoch": 0.21, "learning_rate": 0.001843343377254664, "loss": 2.4375, "step": 7635 }, { "epoch": 0.21, "learning_rate": 0.0018432966013689064, "loss": 2.801, "step": 7636 }, { "epoch": 0.21, "learning_rate": 0.0018432498190944842, "loss": 2.834, "step": 7637 }, { "epoch": 0.21, "learning_rate": 0.0018432030304317522, "loss": 2.3147, "step": 7638 }, { "epoch": 0.21, "learning_rate": 0.001843156235381065, "loss": 2.6714, "step": 7639 }, { "epoch": 0.21, "learning_rate": 0.0018431094339427766, "loss": 2.9133, "step": 7640 }, { "epoch": 0.21, "learning_rate": 0.001843062626117242, "loss": 2.5522, "step": 7641 }, { "epoch": 0.21, "learning_rate": 0.0018430158119048157, "loss": 2.761, "step": 7642 }, { "epoch": 0.21, "learning_rate": 0.0018429689913058522, "loss": 3.0605, "step": 7643 }, { "epoch": 0.21, "learning_rate": 0.0018429221643207067, "loss": 2.7963, "step": 7644 }, { "epoch": 0.21, "learning_rate": 0.001842875330949733, "loss": 2.6431, "step": 7645 }, { "epoch": 0.21, "learning_rate": 0.001842828491193287, "loss": 3.1516, "step": 7646 }, { "epoch": 0.21, "learning_rate": 0.0018427816450517227, "loss": 2.4581, "step": 7647 }, { "epoch": 0.21, "learning_rate": 0.0018427347925253955, "loss": 2.9999, "step": 7648 }, { "epoch": 0.21, "learning_rate": 0.00184268793361466, "loss": 2.6752, "step": 7649 }, { "epoch": 0.21, "learning_rate": 0.0018426410683198716, "loss": 2.6902, "step": 7650 }, { "epoch": 0.21, "learning_rate": 0.001842594196641385, "loss": 2.5692, "step": 7651 }, { "epoch": 0.21, "learning_rate": 0.0018425473185795555, "loss": 2.4211, "step": 7652 }, { "epoch": 0.21, "learning_rate": 0.0018425004341347383, "loss": 2.7623, "step": 7653 }, { "epoch": 0.21, "learning_rate": 0.001842453543307288, "loss": 2.9524, "step": 7654 }, { "epoch": 0.21, "learning_rate": 0.0018424066460975604, "loss": 3.0967, "step": 7655 }, { "epoch": 0.21, "learning_rate": 0.001842359742505911, "loss": 2.1935, "step": 7656 }, { "epoch": 0.21, "learning_rate": 0.0018423128325326945, "loss": 2.8976, "step": 7657 }, { "epoch": 0.21, "learning_rate": 0.0018422659161782665, "loss": 2.6777, "step": 7658 }, { "epoch": 0.21, "learning_rate": 0.0018422189934429825, "loss": 2.3717, "step": 7659 }, { "epoch": 0.21, "learning_rate": 0.0018421720643271985, "loss": 2.4302, "step": 7660 }, { "epoch": 0.21, "learning_rate": 0.0018421251288312688, "loss": 2.7843, "step": 7661 }, { "epoch": 0.21, "learning_rate": 0.00184207818695555, "loss": 2.7849, "step": 7662 }, { "epoch": 0.21, "learning_rate": 0.0018420312387003972, "loss": 2.5361, "step": 7663 }, { "epoch": 0.21, "learning_rate": 0.0018419842840661667, "loss": 2.5999, "step": 7664 }, { "epoch": 0.21, "learning_rate": 0.0018419373230532134, "loss": 2.6869, "step": 7665 }, { "epoch": 0.21, "learning_rate": 0.0018418903556618937, "loss": 2.8794, "step": 7666 }, { "epoch": 0.21, "learning_rate": 0.0018418433818925633, "loss": 2.9173, "step": 7667 }, { "epoch": 0.21, "learning_rate": 0.0018417964017455777, "loss": 2.9232, "step": 7668 }, { "epoch": 0.21, "learning_rate": 0.001841749415221293, "loss": 2.8632, "step": 7669 }, { "epoch": 0.21, "learning_rate": 0.0018417024223200654, "loss": 2.6135, "step": 7670 }, { "epoch": 0.21, "learning_rate": 0.0018416554230422507, "loss": 2.3137, "step": 7671 }, { "epoch": 0.21, "learning_rate": 0.0018416084173882047, "loss": 2.6966, "step": 7672 }, { "epoch": 0.21, "learning_rate": 0.0018415614053582843, "loss": 2.5038, "step": 7673 }, { "epoch": 0.21, "learning_rate": 0.001841514386952845, "loss": 2.5511, "step": 7674 }, { "epoch": 0.21, "learning_rate": 0.001841467362172243, "loss": 2.4318, "step": 7675 }, { "epoch": 0.21, "learning_rate": 0.0018414203310168347, "loss": 2.8256, "step": 7676 }, { "epoch": 0.21, "learning_rate": 0.0018413732934869764, "loss": 2.6646, "step": 7677 }, { "epoch": 0.21, "learning_rate": 0.0018413262495830245, "loss": 2.6481, "step": 7678 }, { "epoch": 0.21, "learning_rate": 0.0018412791993053354, "loss": 2.1393, "step": 7679 }, { "epoch": 0.21, "learning_rate": 0.0018412321426542655, "loss": 2.9656, "step": 7680 }, { "epoch": 0.21, "learning_rate": 0.0018411850796301713, "loss": 2.9976, "step": 7681 }, { "epoch": 0.21, "learning_rate": 0.0018411380102334091, "loss": 2.53, "step": 7682 }, { "epoch": 0.21, "learning_rate": 0.001841090934464336, "loss": 2.7296, "step": 7683 }, { "epoch": 0.21, "learning_rate": 0.0018410438523233082, "loss": 2.5656, "step": 7684 }, { "epoch": 0.21, "learning_rate": 0.0018409967638106826, "loss": 2.7356, "step": 7685 }, { "epoch": 0.21, "learning_rate": 0.001840949668926816, "loss": 2.8842, "step": 7686 }, { "epoch": 0.21, "learning_rate": 0.0018409025676720647, "loss": 2.9258, "step": 7687 }, { "epoch": 0.21, "learning_rate": 0.0018408554600467862, "loss": 2.7601, "step": 7688 }, { "epoch": 0.21, "learning_rate": 0.0018408083460513369, "loss": 2.4476, "step": 7689 }, { "epoch": 0.21, "learning_rate": 0.001840761225686074, "loss": 2.3792, "step": 7690 }, { "epoch": 0.21, "learning_rate": 0.0018407140989513543, "loss": 2.5449, "step": 7691 }, { "epoch": 0.21, "learning_rate": 0.0018406669658475351, "loss": 2.5954, "step": 7692 }, { "epoch": 0.21, "learning_rate": 0.0018406198263749727, "loss": 2.1337, "step": 7693 }, { "epoch": 0.21, "learning_rate": 0.0018405726805340256, "loss": 2.3841, "step": 7694 }, { "epoch": 0.21, "learning_rate": 0.0018405255283250495, "loss": 2.6551, "step": 7695 }, { "epoch": 0.21, "learning_rate": 0.0018404783697484025, "loss": 3.0946, "step": 7696 }, { "epoch": 0.21, "learning_rate": 0.0018404312048044416, "loss": 2.9128, "step": 7697 }, { "epoch": 0.21, "learning_rate": 0.0018403840334935242, "loss": 2.5387, "step": 7698 }, { "epoch": 0.21, "learning_rate": 0.0018403368558160074, "loss": 2.2923, "step": 7699 }, { "epoch": 0.21, "learning_rate": 0.001840289671772249, "loss": 3.0344, "step": 7700 }, { "epoch": 0.21, "learning_rate": 0.0018402424813626062, "loss": 2.9255, "step": 7701 }, { "epoch": 0.21, "learning_rate": 0.0018401952845874367, "loss": 3.0425, "step": 7702 }, { "epoch": 0.21, "learning_rate": 0.0018401480814470982, "loss": 2.9324, "step": 7703 }, { "epoch": 0.21, "learning_rate": 0.0018401008719419474, "loss": 2.4034, "step": 7704 }, { "epoch": 0.21, "learning_rate": 0.0018400536560723429, "loss": 2.3852, "step": 7705 }, { "epoch": 0.21, "learning_rate": 0.0018400064338386422, "loss": 2.6071, "step": 7706 }, { "epoch": 0.21, "learning_rate": 0.0018399592052412029, "loss": 2.7241, "step": 7707 }, { "epoch": 0.21, "learning_rate": 0.0018399119702803826, "loss": 2.463, "step": 7708 }, { "epoch": 0.21, "learning_rate": 0.0018398647289565395, "loss": 2.481, "step": 7709 }, { "epoch": 0.21, "learning_rate": 0.0018398174812700315, "loss": 2.8762, "step": 7710 }, { "epoch": 0.21, "learning_rate": 0.0018397702272212161, "loss": 3.0869, "step": 7711 }, { "epoch": 0.21, "learning_rate": 0.0018397229668104522, "loss": 3.4157, "step": 7712 }, { "epoch": 0.21, "learning_rate": 0.0018396757000380965, "loss": 2.78, "step": 7713 }, { "epoch": 0.21, "learning_rate": 0.0018396284269045085, "loss": 2.8871, "step": 7714 }, { "epoch": 0.21, "learning_rate": 0.0018395811474100452, "loss": 2.5515, "step": 7715 }, { "epoch": 0.21, "learning_rate": 0.0018395338615550653, "loss": 2.5565, "step": 7716 }, { "epoch": 0.21, "learning_rate": 0.0018394865693399272, "loss": 2.8307, "step": 7717 }, { "epoch": 0.21, "learning_rate": 0.0018394392707649888, "loss": 2.6758, "step": 7718 }, { "epoch": 0.21, "learning_rate": 0.0018393919658306083, "loss": 2.7234, "step": 7719 }, { "epoch": 0.21, "learning_rate": 0.0018393446545371447, "loss": 2.6941, "step": 7720 }, { "epoch": 0.21, "learning_rate": 0.0018392973368849556, "loss": 2.4944, "step": 7721 }, { "epoch": 0.21, "learning_rate": 0.0018392500128744005, "loss": 2.4371, "step": 7722 }, { "epoch": 0.21, "learning_rate": 0.001839202682505837, "loss": 2.4735, "step": 7723 }, { "epoch": 0.21, "learning_rate": 0.001839155345779624, "loss": 3.0065, "step": 7724 }, { "epoch": 0.21, "learning_rate": 0.0018391080026961201, "loss": 2.6717, "step": 7725 }, { "epoch": 0.21, "learning_rate": 0.0018390606532556841, "loss": 2.5913, "step": 7726 }, { "epoch": 0.21, "learning_rate": 0.001839013297458675, "loss": 2.4371, "step": 7727 }, { "epoch": 0.21, "learning_rate": 0.0018389659353054504, "loss": 2.836, "step": 7728 }, { "epoch": 0.21, "learning_rate": 0.0018389185667963704, "loss": 2.6823, "step": 7729 }, { "epoch": 0.21, "learning_rate": 0.0018388711919317933, "loss": 2.6813, "step": 7730 }, { "epoch": 0.21, "learning_rate": 0.0018388238107120776, "loss": 2.5148, "step": 7731 }, { "epoch": 0.21, "learning_rate": 0.001838776423137583, "loss": 2.6629, "step": 7732 }, { "epoch": 0.21, "learning_rate": 0.0018387290292086684, "loss": 2.5487, "step": 7733 }, { "epoch": 0.21, "learning_rate": 0.0018386816289256923, "loss": 2.7282, "step": 7734 }, { "epoch": 0.21, "learning_rate": 0.001838634222289014, "loss": 2.5352, "step": 7735 }, { "epoch": 0.21, "learning_rate": 0.001838586809298993, "loss": 2.6608, "step": 7736 }, { "epoch": 0.21, "learning_rate": 0.0018385393899559882, "loss": 2.6554, "step": 7737 }, { "epoch": 0.21, "learning_rate": 0.001838491964260359, "loss": 2.6226, "step": 7738 }, { "epoch": 0.21, "learning_rate": 0.0018384445322124643, "loss": 2.6837, "step": 7739 }, { "epoch": 0.21, "learning_rate": 0.0018383970938126639, "loss": 2.6955, "step": 7740 }, { "epoch": 0.21, "learning_rate": 0.0018383496490613173, "loss": 2.4325, "step": 7741 }, { "epoch": 0.21, "learning_rate": 0.0018383021979587833, "loss": 2.6132, "step": 7742 }, { "epoch": 0.21, "learning_rate": 0.0018382547405054218, "loss": 3.1976, "step": 7743 }, { "epoch": 0.21, "learning_rate": 0.001838207276701592, "loss": 2.8716, "step": 7744 }, { "epoch": 0.21, "learning_rate": 0.0018381598065476542, "loss": 3.0345, "step": 7745 }, { "epoch": 0.21, "learning_rate": 0.001838112330043967, "loss": 2.6227, "step": 7746 }, { "epoch": 0.21, "learning_rate": 0.0018380648471908912, "loss": 2.4136, "step": 7747 }, { "epoch": 0.21, "learning_rate": 0.0018380173579887855, "loss": 2.7571, "step": 7748 }, { "epoch": 0.21, "learning_rate": 0.0018379698624380106, "loss": 2.5048, "step": 7749 }, { "epoch": 0.21, "learning_rate": 0.0018379223605389254, "loss": 2.4981, "step": 7750 }, { "epoch": 0.21, "learning_rate": 0.0018378748522918905, "loss": 2.5915, "step": 7751 }, { "epoch": 0.21, "learning_rate": 0.0018378273376972651, "loss": 2.8907, "step": 7752 }, { "epoch": 0.21, "learning_rate": 0.0018377798167554102, "loss": 2.5611, "step": 7753 }, { "epoch": 0.21, "learning_rate": 0.001837732289466685, "loss": 2.6498, "step": 7754 }, { "epoch": 0.21, "learning_rate": 0.0018376847558314493, "loss": 2.6587, "step": 7755 }, { "epoch": 0.21, "learning_rate": 0.001837637215850064, "loss": 2.945, "step": 7756 }, { "epoch": 0.21, "learning_rate": 0.0018375896695228887, "loss": 2.9059, "step": 7757 }, { "epoch": 0.21, "learning_rate": 0.0018375421168502842, "loss": 2.777, "step": 7758 }, { "epoch": 0.21, "learning_rate": 0.0018374945578326098, "loss": 2.6833, "step": 7759 }, { "epoch": 0.21, "learning_rate": 0.0018374469924702268, "loss": 2.5486, "step": 7760 }, { "epoch": 0.21, "learning_rate": 0.0018373994207634952, "loss": 2.3949, "step": 7761 }, { "epoch": 0.21, "learning_rate": 0.0018373518427127749, "loss": 2.668, "step": 7762 }, { "epoch": 0.21, "learning_rate": 0.001837304258318427, "loss": 2.9703, "step": 7763 }, { "epoch": 0.21, "learning_rate": 0.0018372566675808116, "loss": 2.3368, "step": 7764 }, { "epoch": 0.21, "learning_rate": 0.0018372090705002894, "loss": 2.6446, "step": 7765 }, { "epoch": 0.21, "learning_rate": 0.001837161467077221, "loss": 2.518, "step": 7766 }, { "epoch": 0.21, "learning_rate": 0.0018371138573119673, "loss": 3.0851, "step": 7767 }, { "epoch": 0.21, "learning_rate": 0.0018370662412048881, "loss": 2.8808, "step": 7768 }, { "epoch": 0.21, "learning_rate": 0.0018370186187563451, "loss": 2.6097, "step": 7769 }, { "epoch": 0.21, "learning_rate": 0.0018369709899666985, "loss": 2.5463, "step": 7770 }, { "epoch": 0.21, "learning_rate": 0.0018369233548363093, "loss": 3.0887, "step": 7771 }, { "epoch": 0.21, "learning_rate": 0.0018368757133655387, "loss": 2.7143, "step": 7772 }, { "epoch": 0.21, "learning_rate": 0.0018368280655547472, "loss": 2.774, "step": 7773 }, { "epoch": 0.21, "learning_rate": 0.0018367804114042957, "loss": 2.4817, "step": 7774 }, { "epoch": 0.21, "learning_rate": 0.0018367327509145456, "loss": 2.5248, "step": 7775 }, { "epoch": 0.21, "learning_rate": 0.0018366850840858576, "loss": 2.3839, "step": 7776 }, { "epoch": 0.21, "learning_rate": 0.0018366374109185931, "loss": 3.0924, "step": 7777 }, { "epoch": 0.21, "learning_rate": 0.001836589731413113, "loss": 2.4237, "step": 7778 }, { "epoch": 0.21, "learning_rate": 0.0018365420455697787, "loss": 2.4758, "step": 7779 }, { "epoch": 0.21, "learning_rate": 0.0018364943533889515, "loss": 2.9588, "step": 7780 }, { "epoch": 0.21, "learning_rate": 0.0018364466548709925, "loss": 2.6232, "step": 7781 }, { "epoch": 0.21, "learning_rate": 0.0018363989500162635, "loss": 2.487, "step": 7782 }, { "epoch": 0.21, "learning_rate": 0.0018363512388251256, "loss": 2.1425, "step": 7783 }, { "epoch": 0.21, "learning_rate": 0.00183630352129794, "loss": 2.618, "step": 7784 }, { "epoch": 0.21, "learning_rate": 0.0018362557974350682, "loss": 2.7034, "step": 7785 }, { "epoch": 0.21, "learning_rate": 0.0018362080672368723, "loss": 2.3578, "step": 7786 }, { "epoch": 0.21, "learning_rate": 0.0018361603307037136, "loss": 2.7829, "step": 7787 }, { "epoch": 0.21, "learning_rate": 0.0018361125878359537, "loss": 2.5533, "step": 7788 }, { "epoch": 0.21, "learning_rate": 0.0018360648386339543, "loss": 2.727, "step": 7789 }, { "epoch": 0.21, "learning_rate": 0.0018360170830980771, "loss": 2.69, "step": 7790 }, { "epoch": 0.21, "learning_rate": 0.001835969321228684, "loss": 2.4129, "step": 7791 }, { "epoch": 0.21, "learning_rate": 0.001835921553026137, "loss": 2.6886, "step": 7792 }, { "epoch": 0.21, "learning_rate": 0.0018358737784907975, "loss": 2.8382, "step": 7793 }, { "epoch": 0.21, "learning_rate": 0.0018358259976230275, "loss": 2.4465, "step": 7794 }, { "epoch": 0.21, "learning_rate": 0.0018357782104231894, "loss": 2.3615, "step": 7795 }, { "epoch": 0.21, "learning_rate": 0.0018357304168916452, "loss": 2.3353, "step": 7796 }, { "epoch": 0.21, "learning_rate": 0.0018356826170287564, "loss": 2.7698, "step": 7797 }, { "epoch": 0.21, "learning_rate": 0.0018356348108348856, "loss": 2.7756, "step": 7798 }, { "epoch": 0.21, "learning_rate": 0.001835586998310395, "loss": 2.9163, "step": 7799 }, { "epoch": 0.21, "learning_rate": 0.0018355391794556467, "loss": 2.6305, "step": 7800 }, { "epoch": 0.21, "learning_rate": 0.001835491354271003, "loss": 2.7811, "step": 7801 }, { "epoch": 0.21, "learning_rate": 0.001835443522756826, "loss": 2.3451, "step": 7802 }, { "epoch": 0.21, "learning_rate": 0.0018353956849134782, "loss": 2.689, "step": 7803 }, { "epoch": 0.21, "learning_rate": 0.0018353478407413225, "loss": 2.5376, "step": 7804 }, { "epoch": 0.21, "learning_rate": 0.0018352999902407205, "loss": 2.8199, "step": 7805 }, { "epoch": 0.21, "learning_rate": 0.001835252133412035, "loss": 2.8976, "step": 7806 }, { "epoch": 0.21, "learning_rate": 0.0018352042702556289, "loss": 2.6765, "step": 7807 }, { "epoch": 0.21, "learning_rate": 0.0018351564007718644, "loss": 2.7235, "step": 7808 }, { "epoch": 0.21, "learning_rate": 0.0018351085249611043, "loss": 2.3828, "step": 7809 }, { "epoch": 0.21, "learning_rate": 0.0018350606428237115, "loss": 2.5206, "step": 7810 }, { "epoch": 0.21, "learning_rate": 0.0018350127543600486, "loss": 2.5927, "step": 7811 }, { "epoch": 0.21, "learning_rate": 0.0018349648595704783, "loss": 2.6534, "step": 7812 }, { "epoch": 0.21, "learning_rate": 0.0018349169584553633, "loss": 2.723, "step": 7813 }, { "epoch": 0.21, "learning_rate": 0.0018348690510150672, "loss": 2.6328, "step": 7814 }, { "epoch": 0.21, "learning_rate": 0.001834821137249952, "loss": 2.4989, "step": 7815 }, { "epoch": 0.21, "learning_rate": 0.001834773217160381, "loss": 2.2549, "step": 7816 }, { "epoch": 0.21, "learning_rate": 0.0018347252907467177, "loss": 2.3791, "step": 7817 }, { "epoch": 0.21, "learning_rate": 0.0018346773580093245, "loss": 2.6911, "step": 7818 }, { "epoch": 0.21, "learning_rate": 0.0018346294189485652, "loss": 2.1994, "step": 7819 }, { "epoch": 0.21, "learning_rate": 0.0018345814735648024, "loss": 2.6488, "step": 7820 }, { "epoch": 0.21, "learning_rate": 0.0018345335218583995, "loss": 2.449, "step": 7821 }, { "epoch": 0.21, "learning_rate": 0.0018344855638297202, "loss": 2.6554, "step": 7822 }, { "epoch": 0.21, "learning_rate": 0.001834437599479127, "loss": 2.6223, "step": 7823 }, { "epoch": 0.21, "learning_rate": 0.0018343896288069842, "loss": 2.7685, "step": 7824 }, { "epoch": 0.21, "learning_rate": 0.0018343416518136547, "loss": 2.1528, "step": 7825 }, { "epoch": 0.21, "learning_rate": 0.0018342936684995017, "loss": 2.9389, "step": 7826 }, { "epoch": 0.21, "learning_rate": 0.0018342456788648894, "loss": 2.4047, "step": 7827 }, { "epoch": 0.21, "learning_rate": 0.0018341976829101805, "loss": 2.4821, "step": 7828 }, { "epoch": 0.21, "learning_rate": 0.0018341496806357394, "loss": 2.8328, "step": 7829 }, { "epoch": 0.21, "learning_rate": 0.0018341016720419291, "loss": 2.6065, "step": 7830 }, { "epoch": 0.21, "learning_rate": 0.0018340536571291141, "loss": 2.7372, "step": 7831 }, { "epoch": 0.21, "learning_rate": 0.0018340056358976578, "loss": 2.6807, "step": 7832 }, { "epoch": 0.21, "learning_rate": 0.0018339576083479235, "loss": 2.9965, "step": 7833 }, { "epoch": 0.21, "learning_rate": 0.0018339095744802755, "loss": 3.0414, "step": 7834 }, { "epoch": 0.21, "learning_rate": 0.0018338615342950782, "loss": 2.8311, "step": 7835 }, { "epoch": 0.21, "learning_rate": 0.0018338134877926944, "loss": 2.9828, "step": 7836 }, { "epoch": 0.21, "learning_rate": 0.0018337654349734889, "loss": 2.2673, "step": 7837 }, { "epoch": 0.21, "learning_rate": 0.0018337173758378254, "loss": 2.6278, "step": 7838 }, { "epoch": 0.21, "learning_rate": 0.0018336693103860684, "loss": 2.0807, "step": 7839 }, { "epoch": 0.21, "learning_rate": 0.0018336212386185814, "loss": 2.4362, "step": 7840 }, { "epoch": 0.21, "learning_rate": 0.001833573160535729, "loss": 2.6461, "step": 7841 }, { "epoch": 0.21, "learning_rate": 0.0018335250761378754, "loss": 2.383, "step": 7842 }, { "epoch": 0.21, "learning_rate": 0.001833476985425385, "loss": 2.6625, "step": 7843 }, { "epoch": 0.21, "learning_rate": 0.0018334288883986218, "loss": 2.9092, "step": 7844 }, { "epoch": 0.21, "learning_rate": 0.0018333807850579506, "loss": 2.9759, "step": 7845 }, { "epoch": 0.21, "learning_rate": 0.0018333326754037353, "loss": 2.543, "step": 7846 }, { "epoch": 0.21, "learning_rate": 0.0018332845594363407, "loss": 2.5964, "step": 7847 }, { "epoch": 0.21, "learning_rate": 0.0018332364371561314, "loss": 2.5317, "step": 7848 }, { "epoch": 0.21, "learning_rate": 0.0018331883085634718, "loss": 2.8503, "step": 7849 }, { "epoch": 0.21, "learning_rate": 0.0018331401736587263, "loss": 2.8829, "step": 7850 }, { "epoch": 0.21, "learning_rate": 0.00183309203244226, "loss": 2.8702, "step": 7851 }, { "epoch": 0.21, "learning_rate": 0.0018330438849144372, "loss": 2.351, "step": 7852 }, { "epoch": 0.21, "learning_rate": 0.001832995731075623, "loss": 3.0044, "step": 7853 }, { "epoch": 0.21, "learning_rate": 0.0018329475709261823, "loss": 2.6724, "step": 7854 }, { "epoch": 0.21, "learning_rate": 0.0018328994044664792, "loss": 2.3646, "step": 7855 }, { "epoch": 0.21, "learning_rate": 0.0018328512316968795, "loss": 2.4192, "step": 7856 }, { "epoch": 0.21, "learning_rate": 0.0018328030526177477, "loss": 2.4734, "step": 7857 }, { "epoch": 0.21, "learning_rate": 0.0018327548672294487, "loss": 2.2392, "step": 7858 }, { "epoch": 0.21, "learning_rate": 0.001832706675532348, "loss": 2.6233, "step": 7859 }, { "epoch": 0.21, "learning_rate": 0.0018326584775268102, "loss": 2.4047, "step": 7860 }, { "epoch": 0.21, "learning_rate": 0.001832610273213201, "loss": 2.7492, "step": 7861 }, { "epoch": 0.21, "learning_rate": 0.0018325620625918846, "loss": 2.5506, "step": 7862 }, { "epoch": 0.21, "learning_rate": 0.0018325138456632272, "loss": 2.7235, "step": 7863 }, { "epoch": 0.21, "learning_rate": 0.0018324656224275938, "loss": 2.6686, "step": 7864 }, { "epoch": 0.21, "learning_rate": 0.0018324173928853495, "loss": 2.7528, "step": 7865 }, { "epoch": 0.21, "learning_rate": 0.00183236915703686, "loss": 2.7729, "step": 7866 }, { "epoch": 0.21, "learning_rate": 0.0018323209148824904, "loss": 2.9804, "step": 7867 }, { "epoch": 0.21, "learning_rate": 0.0018322726664226066, "loss": 2.8335, "step": 7868 }, { "epoch": 0.21, "learning_rate": 0.0018322244116575738, "loss": 2.6462, "step": 7869 }, { "epoch": 0.21, "learning_rate": 0.0018321761505877574, "loss": 2.6916, "step": 7870 }, { "epoch": 0.21, "learning_rate": 0.0018321278832135236, "loss": 2.3907, "step": 7871 }, { "epoch": 0.21, "learning_rate": 0.0018320796095352377, "loss": 2.7553, "step": 7872 }, { "epoch": 0.21, "learning_rate": 0.0018320313295532653, "loss": 2.0736, "step": 7873 }, { "epoch": 0.21, "learning_rate": 0.0018319830432679722, "loss": 2.5895, "step": 7874 }, { "epoch": 0.21, "learning_rate": 0.0018319347506797247, "loss": 2.567, "step": 7875 }, { "epoch": 0.21, "learning_rate": 0.0018318864517888878, "loss": 2.6825, "step": 7876 }, { "epoch": 0.21, "learning_rate": 0.0018318381465958283, "loss": 2.7745, "step": 7877 }, { "epoch": 0.21, "learning_rate": 0.0018317898351009113, "loss": 2.4191, "step": 7878 }, { "epoch": 0.21, "learning_rate": 0.0018317415173045033, "loss": 2.5717, "step": 7879 }, { "epoch": 0.21, "learning_rate": 0.0018316931932069705, "loss": 2.8532, "step": 7880 }, { "epoch": 0.21, "learning_rate": 0.0018316448628086786, "loss": 2.6371, "step": 7881 }, { "epoch": 0.21, "learning_rate": 0.0018315965261099941, "loss": 2.7261, "step": 7882 }, { "epoch": 0.21, "learning_rate": 0.0018315481831112828, "loss": 2.409, "step": 7883 }, { "epoch": 0.21, "learning_rate": 0.0018314998338129112, "loss": 2.7557, "step": 7884 }, { "epoch": 0.21, "learning_rate": 0.0018314514782152454, "loss": 2.7898, "step": 7885 }, { "epoch": 0.21, "learning_rate": 0.0018314031163186519, "loss": 2.279, "step": 7886 }, { "epoch": 0.21, "learning_rate": 0.001831354748123497, "loss": 2.7269, "step": 7887 }, { "epoch": 0.21, "learning_rate": 0.0018313063736301474, "loss": 2.8425, "step": 7888 }, { "epoch": 0.21, "learning_rate": 0.0018312579928389692, "loss": 3.1371, "step": 7889 }, { "epoch": 0.21, "learning_rate": 0.001831209605750329, "loss": 2.7867, "step": 7890 }, { "epoch": 0.21, "learning_rate": 0.0018311612123645933, "loss": 2.6159, "step": 7891 }, { "epoch": 0.21, "learning_rate": 0.001831112812682129, "loss": 2.627, "step": 7892 }, { "epoch": 0.21, "learning_rate": 0.0018310644067033026, "loss": 2.6938, "step": 7893 }, { "epoch": 0.21, "learning_rate": 0.001831015994428481, "loss": 2.6148, "step": 7894 }, { "epoch": 0.21, "learning_rate": 0.0018309675758580307, "loss": 2.7725, "step": 7895 }, { "epoch": 0.21, "learning_rate": 0.0018309191509923183, "loss": 2.6739, "step": 7896 }, { "epoch": 0.21, "learning_rate": 0.0018308707198317117, "loss": 2.8527, "step": 7897 }, { "epoch": 0.21, "learning_rate": 0.0018308222823765763, "loss": 2.9842, "step": 7898 }, { "epoch": 0.21, "learning_rate": 0.0018307738386272804, "loss": 2.5111, "step": 7899 }, { "epoch": 0.21, "learning_rate": 0.0018307253885841898, "loss": 2.4128, "step": 7900 }, { "epoch": 0.21, "learning_rate": 0.0018306769322476728, "loss": 2.7982, "step": 7901 }, { "epoch": 0.21, "learning_rate": 0.0018306284696180954, "loss": 2.9513, "step": 7902 }, { "epoch": 0.21, "learning_rate": 0.0018305800006958256, "loss": 2.7184, "step": 7903 }, { "epoch": 0.21, "learning_rate": 0.00183053152548123, "loss": 2.6253, "step": 7904 }, { "epoch": 0.21, "learning_rate": 0.001830483043974676, "loss": 2.5862, "step": 7905 }, { "epoch": 0.21, "learning_rate": 0.001830434556176531, "loss": 3.0237, "step": 7906 }, { "epoch": 0.21, "learning_rate": 0.0018303860620871625, "loss": 2.3401, "step": 7907 }, { "epoch": 0.21, "learning_rate": 0.0018303375617069375, "loss": 2.5902, "step": 7908 }, { "epoch": 0.21, "learning_rate": 0.0018302890550362235, "loss": 2.4935, "step": 7909 }, { "epoch": 0.21, "learning_rate": 0.001830240542075388, "loss": 2.5381, "step": 7910 }, { "epoch": 0.21, "learning_rate": 0.0018301920228247987, "loss": 2.8079, "step": 7911 }, { "epoch": 0.21, "learning_rate": 0.001830143497284823, "loss": 2.4915, "step": 7912 }, { "epoch": 0.21, "learning_rate": 0.0018300949654558286, "loss": 2.4991, "step": 7913 }, { "epoch": 0.21, "learning_rate": 0.0018300464273381832, "loss": 2.585, "step": 7914 }, { "epoch": 0.21, "learning_rate": 0.0018299978829322545, "loss": 2.3873, "step": 7915 }, { "epoch": 0.21, "learning_rate": 0.0018299493322384102, "loss": 2.3705, "step": 7916 }, { "epoch": 0.21, "learning_rate": 0.001829900775257018, "loss": 2.3986, "step": 7917 }, { "epoch": 0.21, "learning_rate": 0.0018298522119884462, "loss": 2.7831, "step": 7918 }, { "epoch": 0.21, "learning_rate": 0.001829803642433062, "loss": 2.6999, "step": 7919 }, { "epoch": 0.21, "learning_rate": 0.001829755066591234, "loss": 3.3212, "step": 7920 }, { "epoch": 0.21, "learning_rate": 0.00182970648446333, "loss": 2.7113, "step": 7921 }, { "epoch": 0.21, "learning_rate": 0.0018296578960497179, "loss": 2.9284, "step": 7922 }, { "epoch": 0.21, "learning_rate": 0.001829609301350766, "loss": 2.601, "step": 7923 }, { "epoch": 0.21, "learning_rate": 0.0018295607003668423, "loss": 2.3693, "step": 7924 }, { "epoch": 0.21, "learning_rate": 0.001829512093098315, "loss": 2.2671, "step": 7925 }, { "epoch": 0.21, "learning_rate": 0.0018294634795455523, "loss": 2.6164, "step": 7926 }, { "epoch": 0.21, "learning_rate": 0.0018294148597089227, "loss": 2.6428, "step": 7927 }, { "epoch": 0.21, "learning_rate": 0.0018293662335887944, "loss": 2.5503, "step": 7928 }, { "epoch": 0.21, "learning_rate": 0.0018293176011855358, "loss": 2.4385, "step": 7929 }, { "epoch": 0.21, "learning_rate": 0.0018292689624995156, "loss": 2.6521, "step": 7930 }, { "epoch": 0.21, "learning_rate": 0.0018292203175311016, "loss": 2.6276, "step": 7931 }, { "epoch": 0.21, "learning_rate": 0.0018291716662806627, "loss": 2.7037, "step": 7932 }, { "epoch": 0.21, "learning_rate": 0.0018291230087485678, "loss": 2.1981, "step": 7933 }, { "epoch": 0.21, "learning_rate": 0.001829074344935185, "loss": 2.7319, "step": 7934 }, { "epoch": 0.21, "learning_rate": 0.0018290256748408834, "loss": 2.9676, "step": 7935 }, { "epoch": 0.21, "learning_rate": 0.0018289769984660312, "loss": 2.2052, "step": 7936 }, { "epoch": 0.21, "learning_rate": 0.0018289283158109976, "loss": 2.5456, "step": 7937 }, { "epoch": 0.21, "learning_rate": 0.0018288796268761513, "loss": 2.9968, "step": 7938 }, { "epoch": 0.21, "learning_rate": 0.0018288309316618612, "loss": 2.444, "step": 7939 }, { "epoch": 0.21, "learning_rate": 0.0018287822301684962, "loss": 2.555, "step": 7940 }, { "epoch": 0.21, "learning_rate": 0.001828733522396425, "loss": 2.5452, "step": 7941 }, { "epoch": 0.21, "learning_rate": 0.0018286848083460168, "loss": 2.7404, "step": 7942 }, { "epoch": 0.21, "learning_rate": 0.0018286360880176407, "loss": 2.8414, "step": 7943 }, { "epoch": 0.21, "learning_rate": 0.0018285873614116658, "loss": 2.5015, "step": 7944 }, { "epoch": 0.21, "learning_rate": 0.0018285386285284613, "loss": 2.5811, "step": 7945 }, { "epoch": 0.21, "learning_rate": 0.0018284898893683962, "loss": 2.5709, "step": 7946 }, { "epoch": 0.21, "learning_rate": 0.0018284411439318396, "loss": 2.6407, "step": 7947 }, { "epoch": 0.21, "learning_rate": 0.0018283923922191613, "loss": 2.2945, "step": 7948 }, { "epoch": 0.21, "learning_rate": 0.00182834363423073, "loss": 2.4944, "step": 7949 }, { "epoch": 0.21, "learning_rate": 0.0018282948699669156, "loss": 2.5766, "step": 7950 }, { "epoch": 0.21, "learning_rate": 0.0018282460994280875, "loss": 2.4955, "step": 7951 }, { "epoch": 0.21, "learning_rate": 0.0018281973226146149, "loss": 2.6663, "step": 7952 }, { "epoch": 0.21, "learning_rate": 0.0018281485395268673, "loss": 2.9011, "step": 7953 }, { "epoch": 0.21, "learning_rate": 0.0018280997501652148, "loss": 2.5649, "step": 7954 }, { "epoch": 0.21, "learning_rate": 0.0018280509545300263, "loss": 2.5624, "step": 7955 }, { "epoch": 0.21, "learning_rate": 0.0018280021526216718, "loss": 2.9575, "step": 7956 }, { "epoch": 0.21, "learning_rate": 0.0018279533444405212, "loss": 3.1481, "step": 7957 }, { "epoch": 0.21, "learning_rate": 0.0018279045299869439, "loss": 2.6476, "step": 7958 }, { "epoch": 0.21, "learning_rate": 0.0018278557092613102, "loss": 2.6041, "step": 7959 }, { "epoch": 0.21, "learning_rate": 0.0018278068822639895, "loss": 2.5395, "step": 7960 }, { "epoch": 0.21, "learning_rate": 0.001827758048995352, "loss": 2.8214, "step": 7961 }, { "epoch": 0.21, "learning_rate": 0.0018277092094557672, "loss": 2.2687, "step": 7962 }, { "epoch": 0.21, "learning_rate": 0.0018276603636456054, "loss": 2.6147, "step": 7963 }, { "epoch": 0.21, "learning_rate": 0.001827611511565237, "loss": 2.5637, "step": 7964 }, { "epoch": 0.21, "learning_rate": 0.0018275626532150314, "loss": 2.8209, "step": 7965 }, { "epoch": 0.21, "learning_rate": 0.0018275137885953594, "loss": 2.8879, "step": 7966 }, { "epoch": 0.21, "learning_rate": 0.0018274649177065908, "loss": 2.7363, "step": 7967 }, { "epoch": 0.21, "learning_rate": 0.0018274160405490959, "loss": 2.9936, "step": 7968 }, { "epoch": 0.21, "learning_rate": 0.0018273671571232449, "loss": 2.2988, "step": 7969 }, { "epoch": 0.21, "learning_rate": 0.0018273182674294081, "loss": 2.7217, "step": 7970 }, { "epoch": 0.21, "learning_rate": 0.0018272693714679565, "loss": 2.3989, "step": 7971 }, { "epoch": 0.21, "learning_rate": 0.0018272204692392595, "loss": 2.877, "step": 7972 }, { "epoch": 0.21, "learning_rate": 0.0018271715607436885, "loss": 2.9519, "step": 7973 }, { "epoch": 0.21, "learning_rate": 0.0018271226459816137, "loss": 2.3049, "step": 7974 }, { "epoch": 0.21, "learning_rate": 0.0018270737249534053, "loss": 2.8146, "step": 7975 }, { "epoch": 0.21, "learning_rate": 0.0018270247976594344, "loss": 2.8427, "step": 7976 }, { "epoch": 0.21, "learning_rate": 0.0018269758641000717, "loss": 2.4958, "step": 7977 }, { "epoch": 0.21, "learning_rate": 0.0018269269242756872, "loss": 2.6573, "step": 7978 }, { "epoch": 0.21, "learning_rate": 0.0018268779781866525, "loss": 3.0248, "step": 7979 }, { "epoch": 0.21, "learning_rate": 0.0018268290258333377, "loss": 3.0797, "step": 7980 }, { "epoch": 0.21, "learning_rate": 0.0018267800672161145, "loss": 2.6772, "step": 7981 }, { "epoch": 0.21, "learning_rate": 0.0018267311023353531, "loss": 2.8237, "step": 7982 }, { "epoch": 0.21, "learning_rate": 0.0018266821311914247, "loss": 2.6901, "step": 7983 }, { "epoch": 0.21, "learning_rate": 0.0018266331537847003, "loss": 2.437, "step": 7984 }, { "epoch": 0.21, "learning_rate": 0.001826584170115551, "loss": 2.8829, "step": 7985 }, { "epoch": 0.21, "learning_rate": 0.0018265351801843477, "loss": 2.7486, "step": 7986 }, { "epoch": 0.21, "learning_rate": 0.0018264861839914618, "loss": 2.9616, "step": 7987 }, { "epoch": 0.21, "learning_rate": 0.001826437181537264, "loss": 2.3228, "step": 7988 }, { "epoch": 0.21, "learning_rate": 0.0018263881728221262, "loss": 2.479, "step": 7989 }, { "epoch": 0.21, "learning_rate": 0.001826339157846419, "loss": 2.6813, "step": 7990 }, { "epoch": 0.21, "learning_rate": 0.0018262901366105143, "loss": 2.7446, "step": 7991 }, { "epoch": 0.21, "learning_rate": 0.0018262411091147833, "loss": 2.6164, "step": 7992 }, { "epoch": 0.21, "learning_rate": 0.0018261920753595974, "loss": 2.6055, "step": 7993 }, { "epoch": 0.21, "learning_rate": 0.0018261430353453277, "loss": 2.7458, "step": 7994 }, { "epoch": 0.21, "learning_rate": 0.0018260939890723466, "loss": 2.7823, "step": 7995 }, { "epoch": 0.21, "learning_rate": 0.0018260449365410248, "loss": 2.6341, "step": 7996 }, { "epoch": 0.21, "learning_rate": 0.0018259958777517343, "loss": 2.5808, "step": 7997 }, { "epoch": 0.21, "learning_rate": 0.0018259468127048467, "loss": 2.665, "step": 7998 }, { "epoch": 0.21, "learning_rate": 0.0018258977414007337, "loss": 2.6625, "step": 7999 }, { "epoch": 0.21, "learning_rate": 0.001825848663839767, "loss": 2.8599, "step": 8000 }, { "epoch": 0.22, "learning_rate": 0.0018257995800223183, "loss": 2.7295, "step": 8001 }, { "epoch": 0.22, "learning_rate": 0.00182575048994876, "loss": 2.6641, "step": 8002 }, { "epoch": 0.22, "learning_rate": 0.0018257013936194633, "loss": 2.5831, "step": 8003 }, { "epoch": 0.22, "learning_rate": 0.0018256522910348007, "loss": 2.5865, "step": 8004 }, { "epoch": 0.22, "learning_rate": 0.001825603182195144, "loss": 2.301, "step": 8005 }, { "epoch": 0.22, "learning_rate": 0.0018255540671008653, "loss": 2.3984, "step": 8006 }, { "epoch": 0.22, "learning_rate": 0.001825504945752336, "loss": 2.5499, "step": 8007 }, { "epoch": 0.22, "learning_rate": 0.0018254558181499294, "loss": 2.2845, "step": 8008 }, { "epoch": 0.22, "learning_rate": 0.001825406684294017, "loss": 3.0048, "step": 8009 }, { "epoch": 0.22, "learning_rate": 0.0018253575441849708, "loss": 2.4246, "step": 8010 }, { "epoch": 0.22, "learning_rate": 0.0018253083978231636, "loss": 2.2507, "step": 8011 }, { "epoch": 0.22, "learning_rate": 0.0018252592452089678, "loss": 2.7253, "step": 8012 }, { "epoch": 0.22, "learning_rate": 0.001825210086342755, "loss": 2.543, "step": 8013 }, { "epoch": 0.22, "learning_rate": 0.0018251609212248986, "loss": 2.5903, "step": 8014 }, { "epoch": 0.22, "learning_rate": 0.0018251117498557703, "loss": 2.6692, "step": 8015 }, { "epoch": 0.22, "learning_rate": 0.0018250625722357429, "loss": 2.8323, "step": 8016 }, { "epoch": 0.22, "learning_rate": 0.001825013388365189, "loss": 2.4145, "step": 8017 }, { "epoch": 0.22, "learning_rate": 0.0018249641982444813, "loss": 2.1016, "step": 8018 }, { "epoch": 0.22, "learning_rate": 0.0018249150018739922, "loss": 2.4461, "step": 8019 }, { "epoch": 0.22, "learning_rate": 0.0018248657992540945, "loss": 2.4045, "step": 8020 }, { "epoch": 0.22, "learning_rate": 0.001824816590385161, "loss": 2.962, "step": 8021 }, { "epoch": 0.22, "learning_rate": 0.0018247673752675646, "loss": 2.4637, "step": 8022 }, { "epoch": 0.22, "learning_rate": 0.001824718153901678, "loss": 2.5538, "step": 8023 }, { "epoch": 0.22, "learning_rate": 0.0018246689262878739, "loss": 2.6941, "step": 8024 }, { "epoch": 0.22, "learning_rate": 0.0018246196924265256, "loss": 2.878, "step": 8025 }, { "epoch": 0.22, "learning_rate": 0.0018245704523180057, "loss": 2.6397, "step": 8026 }, { "epoch": 0.22, "learning_rate": 0.0018245212059626878, "loss": 2.3563, "step": 8027 }, { "epoch": 0.22, "learning_rate": 0.0018244719533609447, "loss": 2.3637, "step": 8028 }, { "epoch": 0.22, "learning_rate": 0.0018244226945131493, "loss": 2.3666, "step": 8029 }, { "epoch": 0.22, "learning_rate": 0.001824373429419675, "loss": 2.6184, "step": 8030 }, { "epoch": 0.22, "learning_rate": 0.001824324158080895, "loss": 2.517, "step": 8031 }, { "epoch": 0.22, "learning_rate": 0.0018242748804971824, "loss": 2.406, "step": 8032 }, { "epoch": 0.22, "learning_rate": 0.0018242255966689107, "loss": 2.5327, "step": 8033 }, { "epoch": 0.22, "learning_rate": 0.0018241763065964534, "loss": 2.6518, "step": 8034 }, { "epoch": 0.22, "learning_rate": 0.0018241270102801836, "loss": 2.5509, "step": 8035 }, { "epoch": 0.22, "learning_rate": 0.001824077707720475, "loss": 2.4845, "step": 8036 }, { "epoch": 0.22, "learning_rate": 0.001824028398917701, "loss": 2.7363, "step": 8037 }, { "epoch": 0.22, "learning_rate": 0.0018239790838722354, "loss": 2.9826, "step": 8038 }, { "epoch": 0.22, "learning_rate": 0.0018239297625844513, "loss": 2.2176, "step": 8039 }, { "epoch": 0.22, "learning_rate": 0.0018238804350547224, "loss": 2.7547, "step": 8040 }, { "epoch": 0.22, "learning_rate": 0.0018238311012834232, "loss": 2.4496, "step": 8041 }, { "epoch": 0.22, "learning_rate": 0.0018237817612709265, "loss": 2.1143, "step": 8042 }, { "epoch": 0.22, "learning_rate": 0.0018237324150176067, "loss": 2.6051, "step": 8043 }, { "epoch": 0.22, "learning_rate": 0.001823683062523837, "loss": 2.6632, "step": 8044 }, { "epoch": 0.22, "learning_rate": 0.0018236337037899918, "loss": 2.1463, "step": 8045 }, { "epoch": 0.22, "learning_rate": 0.001823584338816445, "loss": 2.87, "step": 8046 }, { "epoch": 0.22, "learning_rate": 0.0018235349676035705, "loss": 2.5423, "step": 8047 }, { "epoch": 0.22, "learning_rate": 0.0018234855901517425, "loss": 2.4132, "step": 8048 }, { "epoch": 0.22, "learning_rate": 0.0018234362064613345, "loss": 2.2745, "step": 8049 }, { "epoch": 0.22, "learning_rate": 0.0018233868165327212, "loss": 2.6258, "step": 8050 }, { "epoch": 0.22, "learning_rate": 0.001823337420366277, "loss": 2.4169, "step": 8051 }, { "epoch": 0.22, "learning_rate": 0.001823288017962375, "loss": 2.309, "step": 8052 }, { "epoch": 0.22, "learning_rate": 0.0018232386093213907, "loss": 2.9391, "step": 8053 }, { "epoch": 0.22, "learning_rate": 0.0018231891944436973, "loss": 2.0643, "step": 8054 }, { "epoch": 0.22, "learning_rate": 0.0018231397733296704, "loss": 2.7899, "step": 8055 }, { "epoch": 0.22, "learning_rate": 0.0018230903459796834, "loss": 2.9863, "step": 8056 }, { "epoch": 0.22, "learning_rate": 0.0018230409123941112, "loss": 2.8142, "step": 8057 }, { "epoch": 0.22, "learning_rate": 0.001822991472573328, "loss": 2.4173, "step": 8058 }, { "epoch": 0.22, "learning_rate": 0.0018229420265177087, "loss": 2.6677, "step": 8059 }, { "epoch": 0.22, "learning_rate": 0.0018228925742276277, "loss": 2.8589, "step": 8060 }, { "epoch": 0.22, "learning_rate": 0.0018228431157034596, "loss": 2.4321, "step": 8061 }, { "epoch": 0.22, "learning_rate": 0.0018227936509455792, "loss": 2.5845, "step": 8062 }, { "epoch": 0.22, "learning_rate": 0.0018227441799543614, "loss": 2.3533, "step": 8063 }, { "epoch": 0.22, "learning_rate": 0.0018226947027301806, "loss": 2.5208, "step": 8064 }, { "epoch": 0.22, "learning_rate": 0.0018226452192734118, "loss": 2.8114, "step": 8065 }, { "epoch": 0.22, "learning_rate": 0.00182259572958443, "loss": 2.4133, "step": 8066 }, { "epoch": 0.22, "learning_rate": 0.00182254623366361, "loss": 2.2612, "step": 8067 }, { "epoch": 0.22, "learning_rate": 0.0018224967315113266, "loss": 2.4186, "step": 8068 }, { "epoch": 0.22, "learning_rate": 0.0018224472231279552, "loss": 2.9286, "step": 8069 }, { "epoch": 0.22, "learning_rate": 0.0018223977085138705, "loss": 2.6833, "step": 8070 }, { "epoch": 0.22, "learning_rate": 0.0018223481876694478, "loss": 2.6461, "step": 8071 }, { "epoch": 0.22, "learning_rate": 0.0018222986605950626, "loss": 2.7159, "step": 8072 }, { "epoch": 0.22, "learning_rate": 0.0018222491272910895, "loss": 2.7805, "step": 8073 }, { "epoch": 0.22, "learning_rate": 0.001822199587757904, "loss": 2.5785, "step": 8074 }, { "epoch": 0.22, "learning_rate": 0.0018221500419958816, "loss": 2.5957, "step": 8075 }, { "epoch": 0.22, "learning_rate": 0.0018221004900053975, "loss": 2.4289, "step": 8076 }, { "epoch": 0.22, "learning_rate": 0.0018220509317868267, "loss": 2.7399, "step": 8077 }, { "epoch": 0.22, "learning_rate": 0.0018220013673405453, "loss": 2.3985, "step": 8078 }, { "epoch": 0.22, "learning_rate": 0.0018219517966669284, "loss": 2.7649, "step": 8079 }, { "epoch": 0.22, "learning_rate": 0.0018219022197663514, "loss": 2.6499, "step": 8080 }, { "epoch": 0.22, "learning_rate": 0.0018218526366391905, "loss": 2.5341, "step": 8081 }, { "epoch": 0.22, "learning_rate": 0.001821803047285821, "loss": 2.8644, "step": 8082 }, { "epoch": 0.22, "learning_rate": 0.0018217534517066182, "loss": 2.5516, "step": 8083 }, { "epoch": 0.22, "learning_rate": 0.0018217038499019585, "loss": 3.1887, "step": 8084 }, { "epoch": 0.22, "learning_rate": 0.0018216542418722172, "loss": 2.9415, "step": 8085 }, { "epoch": 0.22, "learning_rate": 0.0018216046276177701, "loss": 2.464, "step": 8086 }, { "epoch": 0.22, "learning_rate": 0.0018215550071389935, "loss": 2.531, "step": 8087 }, { "epoch": 0.22, "learning_rate": 0.001821505380436263, "loss": 2.8938, "step": 8088 }, { "epoch": 0.22, "learning_rate": 0.0018214557475099541, "loss": 2.6344, "step": 8089 }, { "epoch": 0.22, "learning_rate": 0.0018214061083604441, "loss": 2.1604, "step": 8090 }, { "epoch": 0.22, "learning_rate": 0.0018213564629881078, "loss": 2.3764, "step": 8091 }, { "epoch": 0.22, "learning_rate": 0.001821306811393322, "loss": 2.658, "step": 8092 }, { "epoch": 0.22, "learning_rate": 0.0018212571535764627, "loss": 2.9927, "step": 8093 }, { "epoch": 0.22, "learning_rate": 0.0018212074895379057, "loss": 2.8639, "step": 8094 }, { "epoch": 0.22, "learning_rate": 0.001821157819278028, "loss": 2.6846, "step": 8095 }, { "epoch": 0.22, "learning_rate": 0.001821108142797205, "loss": 2.6427, "step": 8096 }, { "epoch": 0.22, "learning_rate": 0.0018210584600958138, "loss": 3.1021, "step": 8097 }, { "epoch": 0.22, "learning_rate": 0.0018210087711742302, "loss": 2.6199, "step": 8098 }, { "epoch": 0.22, "learning_rate": 0.0018209590760328313, "loss": 2.7285, "step": 8099 }, { "epoch": 0.22, "learning_rate": 0.0018209093746719932, "loss": 2.5439, "step": 8100 }, { "epoch": 0.22, "learning_rate": 0.0018208596670920923, "loss": 2.323, "step": 8101 }, { "epoch": 0.22, "learning_rate": 0.0018208099532935052, "loss": 2.6242, "step": 8102 }, { "epoch": 0.22, "learning_rate": 0.0018207602332766088, "loss": 2.4311, "step": 8103 }, { "epoch": 0.22, "learning_rate": 0.0018207105070417798, "loss": 2.7562, "step": 8104 }, { "epoch": 0.22, "learning_rate": 0.0018206607745893941, "loss": 2.8446, "step": 8105 }, { "epoch": 0.22, "learning_rate": 0.0018206110359198298, "loss": 2.6003, "step": 8106 }, { "epoch": 0.22, "learning_rate": 0.0018205612910334628, "loss": 2.3268, "step": 8107 }, { "epoch": 0.22, "learning_rate": 0.00182051153993067, "loss": 2.0296, "step": 8108 }, { "epoch": 0.22, "learning_rate": 0.0018204617826118286, "loss": 1.8533, "step": 8109 }, { "epoch": 0.22, "learning_rate": 0.0018204120190773152, "loss": 2.4967, "step": 8110 }, { "epoch": 0.22, "learning_rate": 0.0018203622493275073, "loss": 2.7387, "step": 8111 }, { "epoch": 0.22, "learning_rate": 0.0018203124733627814, "loss": 2.8526, "step": 8112 }, { "epoch": 0.22, "learning_rate": 0.001820262691183515, "loss": 2.4491, "step": 8113 }, { "epoch": 0.22, "learning_rate": 0.0018202129027900852, "loss": 2.498, "step": 8114 }, { "epoch": 0.22, "learning_rate": 0.001820163108182869, "loss": 2.7218, "step": 8115 }, { "epoch": 0.22, "learning_rate": 0.0018201133073622439, "loss": 2.5657, "step": 8116 }, { "epoch": 0.22, "learning_rate": 0.0018200635003285865, "loss": 2.2576, "step": 8117 }, { "epoch": 0.22, "learning_rate": 0.001820013687082275, "loss": 2.9967, "step": 8118 }, { "epoch": 0.22, "learning_rate": 0.0018199638676236864, "loss": 2.6345, "step": 8119 }, { "epoch": 0.22, "learning_rate": 0.001819914041953198, "loss": 2.936, "step": 8120 }, { "epoch": 0.22, "learning_rate": 0.0018198642100711877, "loss": 2.5419, "step": 8121 }, { "epoch": 0.22, "learning_rate": 0.0018198143719780325, "loss": 2.6905, "step": 8122 }, { "epoch": 0.22, "learning_rate": 0.0018197645276741103, "loss": 2.5146, "step": 8123 }, { "epoch": 0.22, "learning_rate": 0.0018197146771597983, "loss": 2.9493, "step": 8124 }, { "epoch": 0.22, "learning_rate": 0.0018196648204354747, "loss": 2.7431, "step": 8125 }, { "epoch": 0.22, "learning_rate": 0.001819614957501517, "loss": 2.5844, "step": 8126 }, { "epoch": 0.22, "learning_rate": 0.0018195650883583029, "loss": 2.807, "step": 8127 }, { "epoch": 0.22, "learning_rate": 0.0018195152130062102, "loss": 2.4108, "step": 8128 }, { "epoch": 0.22, "learning_rate": 0.001819465331445617, "loss": 2.3375, "step": 8129 }, { "epoch": 0.22, "learning_rate": 0.0018194154436769003, "loss": 2.4992, "step": 8130 }, { "epoch": 0.22, "learning_rate": 0.0018193655497004393, "loss": 2.3659, "step": 8131 }, { "epoch": 0.22, "learning_rate": 0.0018193156495166112, "loss": 2.5482, "step": 8132 }, { "epoch": 0.22, "learning_rate": 0.001819265743125794, "loss": 2.7778, "step": 8133 }, { "epoch": 0.22, "learning_rate": 0.0018192158305283665, "loss": 2.4522, "step": 8134 }, { "epoch": 0.22, "learning_rate": 0.001819165911724706, "loss": 2.6621, "step": 8135 }, { "epoch": 0.22, "learning_rate": 0.001819115986715191, "loss": 2.8132, "step": 8136 }, { "epoch": 0.22, "learning_rate": 0.0018190660555001995, "loss": 2.3343, "step": 8137 }, { "epoch": 0.22, "learning_rate": 0.00181901611808011, "loss": 2.664, "step": 8138 }, { "epoch": 0.22, "learning_rate": 0.0018189661744553015, "loss": 2.7804, "step": 8139 }, { "epoch": 0.22, "learning_rate": 0.0018189162246261513, "loss": 2.5435, "step": 8140 }, { "epoch": 0.22, "learning_rate": 0.001818866268593038, "loss": 2.6219, "step": 8141 }, { "epoch": 0.22, "learning_rate": 0.0018188163063563403, "loss": 2.9969, "step": 8142 }, { "epoch": 0.22, "learning_rate": 0.0018187663379164367, "loss": 2.5706, "step": 8143 }, { "epoch": 0.22, "learning_rate": 0.0018187163632737058, "loss": 2.6295, "step": 8144 }, { "epoch": 0.22, "learning_rate": 0.0018186663824285262, "loss": 2.7235, "step": 8145 }, { "epoch": 0.22, "learning_rate": 0.0018186163953812762, "loss": 2.7494, "step": 8146 }, { "epoch": 0.22, "learning_rate": 0.0018185664021323348, "loss": 2.432, "step": 8147 }, { "epoch": 0.22, "learning_rate": 0.0018185164026820809, "loss": 2.3788, "step": 8148 }, { "epoch": 0.22, "learning_rate": 0.0018184663970308929, "loss": 2.4317, "step": 8149 }, { "epoch": 0.22, "learning_rate": 0.0018184163851791496, "loss": 2.4325, "step": 8150 }, { "epoch": 0.22, "learning_rate": 0.0018183663671272304, "loss": 2.5914, "step": 8151 }, { "epoch": 0.22, "learning_rate": 0.0018183163428755135, "loss": 2.3193, "step": 8152 }, { "epoch": 0.22, "learning_rate": 0.0018182663124243787, "loss": 2.8473, "step": 8153 }, { "epoch": 0.22, "learning_rate": 0.0018182162757742046, "loss": 2.7196, "step": 8154 }, { "epoch": 0.22, "learning_rate": 0.0018181662329253704, "loss": 2.7085, "step": 8155 }, { "epoch": 0.22, "learning_rate": 0.0018181161838782547, "loss": 2.5147, "step": 8156 }, { "epoch": 0.22, "learning_rate": 0.0018180661286332372, "loss": 2.7516, "step": 8157 }, { "epoch": 0.22, "learning_rate": 0.0018180160671906972, "loss": 2.3513, "step": 8158 }, { "epoch": 0.22, "learning_rate": 0.001817965999551013, "loss": 2.557, "step": 8159 }, { "epoch": 0.22, "learning_rate": 0.0018179159257145654, "loss": 2.7435, "step": 8160 }, { "epoch": 0.22, "learning_rate": 0.0018178658456817326, "loss": 2.798, "step": 8161 }, { "epoch": 0.22, "learning_rate": 0.0018178157594528949, "loss": 2.7594, "step": 8162 }, { "epoch": 0.22, "learning_rate": 0.0018177656670284304, "loss": 2.3072, "step": 8163 }, { "epoch": 0.22, "learning_rate": 0.00181771556840872, "loss": 2.5947, "step": 8164 }, { "epoch": 0.22, "learning_rate": 0.0018176654635941425, "loss": 2.2695, "step": 8165 }, { "epoch": 0.22, "learning_rate": 0.0018176153525850775, "loss": 2.6808, "step": 8166 }, { "epoch": 0.22, "learning_rate": 0.0018175652353819049, "loss": 2.7891, "step": 8167 }, { "epoch": 0.22, "learning_rate": 0.0018175151119850042, "loss": 2.6159, "step": 8168 }, { "epoch": 0.22, "learning_rate": 0.0018174649823947551, "loss": 2.4615, "step": 8169 }, { "epoch": 0.22, "learning_rate": 0.0018174148466115377, "loss": 2.8677, "step": 8170 }, { "epoch": 0.22, "learning_rate": 0.0018173647046357314, "loss": 2.59, "step": 8171 }, { "epoch": 0.22, "learning_rate": 0.001817314556467716, "loss": 2.537, "step": 8172 }, { "epoch": 0.22, "learning_rate": 0.0018172644021078718, "loss": 2.7356, "step": 8173 }, { "epoch": 0.22, "learning_rate": 0.001817214241556579, "loss": 2.7123, "step": 8174 }, { "epoch": 0.22, "learning_rate": 0.0018171640748142167, "loss": 2.946, "step": 8175 }, { "epoch": 0.22, "learning_rate": 0.0018171139018811659, "loss": 3.0168, "step": 8176 }, { "epoch": 0.22, "learning_rate": 0.0018170637227578057, "loss": 2.6504, "step": 8177 }, { "epoch": 0.22, "learning_rate": 0.0018170135374445172, "loss": 2.5615, "step": 8178 }, { "epoch": 0.22, "learning_rate": 0.00181696334594168, "loss": 2.7743, "step": 8179 }, { "epoch": 0.22, "learning_rate": 0.0018169131482496748, "loss": 2.3287, "step": 8180 }, { "epoch": 0.22, "learning_rate": 0.0018168629443688813, "loss": 2.8224, "step": 8181 }, { "epoch": 0.22, "learning_rate": 0.0018168127342996804, "loss": 2.3289, "step": 8182 }, { "epoch": 0.22, "learning_rate": 0.0018167625180424522, "loss": 2.2604, "step": 8183 }, { "epoch": 0.22, "learning_rate": 0.0018167122955975775, "loss": 2.7677, "step": 8184 }, { "epoch": 0.22, "learning_rate": 0.0018166620669654362, "loss": 2.375, "step": 8185 }, { "epoch": 0.22, "learning_rate": 0.001816611832146409, "loss": 2.9654, "step": 8186 }, { "epoch": 0.22, "learning_rate": 0.0018165615911408767, "loss": 2.3237, "step": 8187 }, { "epoch": 0.22, "learning_rate": 0.0018165113439492196, "loss": 2.6248, "step": 8188 }, { "epoch": 0.22, "learning_rate": 0.0018164610905718186, "loss": 2.5524, "step": 8189 }, { "epoch": 0.22, "learning_rate": 0.0018164108310090544, "loss": 2.8155, "step": 8190 }, { "epoch": 0.22, "learning_rate": 0.0018163605652613075, "loss": 2.5913, "step": 8191 }, { "epoch": 0.22, "learning_rate": 0.0018163102933289594, "loss": 2.647, "step": 8192 }, { "epoch": 0.22, "learning_rate": 0.00181626001521239, "loss": 2.7908, "step": 8193 }, { "epoch": 0.22, "learning_rate": 0.001816209730911981, "loss": 3.0242, "step": 8194 }, { "epoch": 0.22, "learning_rate": 0.0018161594404281127, "loss": 2.4171, "step": 8195 }, { "epoch": 0.22, "learning_rate": 0.0018161091437611666, "loss": 2.623, "step": 8196 }, { "epoch": 0.22, "learning_rate": 0.0018160588409115235, "loss": 2.5637, "step": 8197 }, { "epoch": 0.22, "learning_rate": 0.0018160085318795645, "loss": 2.7325, "step": 8198 }, { "epoch": 0.22, "learning_rate": 0.0018159582166656705, "loss": 2.3648, "step": 8199 }, { "epoch": 0.22, "learning_rate": 0.0018159078952702233, "loss": 2.8729, "step": 8200 }, { "epoch": 0.22, "learning_rate": 0.0018158575676936036, "loss": 2.6114, "step": 8201 }, { "epoch": 0.22, "learning_rate": 0.001815807233936193, "loss": 2.3874, "step": 8202 }, { "epoch": 0.22, "learning_rate": 0.0018157568939983723, "loss": 2.7546, "step": 8203 }, { "epoch": 0.22, "learning_rate": 0.0018157065478805235, "loss": 2.4099, "step": 8204 }, { "epoch": 0.22, "learning_rate": 0.0018156561955830275, "loss": 2.8139, "step": 8205 }, { "epoch": 0.22, "learning_rate": 0.0018156058371062663, "loss": 2.6418, "step": 8206 }, { "epoch": 0.22, "learning_rate": 0.0018155554724506207, "loss": 2.5358, "step": 8207 }, { "epoch": 0.22, "learning_rate": 0.001815505101616473, "loss": 2.5596, "step": 8208 }, { "epoch": 0.22, "learning_rate": 0.001815454724604204, "loss": 2.5806, "step": 8209 }, { "epoch": 0.22, "learning_rate": 0.0018154043414141962, "loss": 3.0629, "step": 8210 }, { "epoch": 0.22, "learning_rate": 0.001815353952046831, "loss": 2.6894, "step": 8211 }, { "epoch": 0.22, "learning_rate": 0.0018153035565024898, "loss": 2.9486, "step": 8212 }, { "epoch": 0.22, "learning_rate": 0.0018152531547815545, "loss": 2.5798, "step": 8213 }, { "epoch": 0.22, "learning_rate": 0.0018152027468844073, "loss": 2.8193, "step": 8214 }, { "epoch": 0.22, "learning_rate": 0.0018151523328114299, "loss": 2.5513, "step": 8215 }, { "epoch": 0.22, "learning_rate": 0.0018151019125630036, "loss": 2.81, "step": 8216 }, { "epoch": 0.22, "learning_rate": 0.0018150514861395117, "loss": 2.5238, "step": 8217 }, { "epoch": 0.22, "learning_rate": 0.001815001053541335, "loss": 2.9318, "step": 8218 }, { "epoch": 0.22, "learning_rate": 0.001814950614768856, "loss": 2.4998, "step": 8219 }, { "epoch": 0.22, "learning_rate": 0.0018149001698224572, "loss": 2.4357, "step": 8220 }, { "epoch": 0.22, "learning_rate": 0.00181484971870252, "loss": 3.0129, "step": 8221 }, { "epoch": 0.22, "learning_rate": 0.0018147992614094273, "loss": 2.5147, "step": 8222 }, { "epoch": 0.22, "learning_rate": 0.0018147487979435608, "loss": 2.5551, "step": 8223 }, { "epoch": 0.22, "learning_rate": 0.0018146983283053033, "loss": 2.8728, "step": 8224 }, { "epoch": 0.22, "learning_rate": 0.0018146478524950368, "loss": 2.7163, "step": 8225 }, { "epoch": 0.22, "learning_rate": 0.0018145973705131439, "loss": 2.9483, "step": 8226 }, { "epoch": 0.22, "learning_rate": 0.0018145468823600069, "loss": 2.3754, "step": 8227 }, { "epoch": 0.22, "learning_rate": 0.0018144963880360084, "loss": 2.7692, "step": 8228 }, { "epoch": 0.22, "learning_rate": 0.0018144458875415305, "loss": 2.6464, "step": 8229 }, { "epoch": 0.22, "learning_rate": 0.0018143953808769568, "loss": 2.911, "step": 8230 }, { "epoch": 0.22, "learning_rate": 0.0018143448680426688, "loss": 2.3353, "step": 8231 }, { "epoch": 0.22, "learning_rate": 0.00181429434903905, "loss": 2.3617, "step": 8232 }, { "epoch": 0.22, "learning_rate": 0.0018142438238664827, "loss": 2.3814, "step": 8233 }, { "epoch": 0.22, "learning_rate": 0.0018141932925253496, "loss": 2.2734, "step": 8234 }, { "epoch": 0.22, "learning_rate": 0.0018141427550160338, "loss": 2.6591, "step": 8235 }, { "epoch": 0.22, "learning_rate": 0.001814092211338918, "loss": 2.6545, "step": 8236 }, { "epoch": 0.22, "learning_rate": 0.0018140416614943853, "loss": 2.4623, "step": 8237 }, { "epoch": 0.22, "learning_rate": 0.0018139911054828185, "loss": 2.5968, "step": 8238 }, { "epoch": 0.22, "learning_rate": 0.0018139405433046005, "loss": 3.0132, "step": 8239 }, { "epoch": 0.22, "learning_rate": 0.0018138899749601145, "loss": 2.9701, "step": 8240 }, { "epoch": 0.22, "learning_rate": 0.0018138394004497433, "loss": 2.5222, "step": 8241 }, { "epoch": 0.22, "learning_rate": 0.0018137888197738707, "loss": 2.196, "step": 8242 }, { "epoch": 0.22, "learning_rate": 0.0018137382329328792, "loss": 2.4855, "step": 8243 }, { "epoch": 0.22, "learning_rate": 0.0018136876399271527, "loss": 2.5506, "step": 8244 }, { "epoch": 0.22, "learning_rate": 0.0018136370407570736, "loss": 2.2723, "step": 8245 }, { "epoch": 0.22, "learning_rate": 0.0018135864354230263, "loss": 2.9939, "step": 8246 }, { "epoch": 0.22, "learning_rate": 0.0018135358239253932, "loss": 2.4982, "step": 8247 }, { "epoch": 0.22, "learning_rate": 0.0018134852062645585, "loss": 2.5602, "step": 8248 }, { "epoch": 0.22, "learning_rate": 0.0018134345824409048, "loss": 2.4262, "step": 8249 }, { "epoch": 0.22, "learning_rate": 0.0018133839524548168, "loss": 2.6023, "step": 8250 }, { "epoch": 0.22, "learning_rate": 0.001813333316306677, "loss": 2.8849, "step": 8251 }, { "epoch": 0.22, "learning_rate": 0.0018132826739968692, "loss": 2.7713, "step": 8252 }, { "epoch": 0.22, "learning_rate": 0.0018132320255257778, "loss": 2.8375, "step": 8253 }, { "epoch": 0.22, "learning_rate": 0.0018131813708937856, "loss": 2.9627, "step": 8254 }, { "epoch": 0.22, "learning_rate": 0.0018131307101012766, "loss": 2.6545, "step": 8255 }, { "epoch": 0.22, "learning_rate": 0.0018130800431486352, "loss": 2.5003, "step": 8256 }, { "epoch": 0.22, "learning_rate": 0.0018130293700362441, "loss": 2.5691, "step": 8257 }, { "epoch": 0.22, "learning_rate": 0.0018129786907644886, "loss": 2.5497, "step": 8258 }, { "epoch": 0.22, "learning_rate": 0.0018129280053337511, "loss": 2.4916, "step": 8259 }, { "epoch": 0.22, "learning_rate": 0.001812877313744417, "loss": 2.3914, "step": 8260 }, { "epoch": 0.22, "learning_rate": 0.0018128266159968694, "loss": 2.7167, "step": 8261 }, { "epoch": 0.22, "learning_rate": 0.0018127759120914928, "loss": 2.6708, "step": 8262 }, { "epoch": 0.22, "learning_rate": 0.001812725202028671, "loss": 2.9666, "step": 8263 }, { "epoch": 0.22, "learning_rate": 0.0018126744858087886, "loss": 2.6846, "step": 8264 }, { "epoch": 0.22, "learning_rate": 0.0018126237634322293, "loss": 2.5302, "step": 8265 }, { "epoch": 0.22, "learning_rate": 0.0018125730348993781, "loss": 2.7432, "step": 8266 }, { "epoch": 0.22, "learning_rate": 0.0018125223002106185, "loss": 2.4997, "step": 8267 }, { "epoch": 0.22, "learning_rate": 0.0018124715593663355, "loss": 2.455, "step": 8268 }, { "epoch": 0.22, "learning_rate": 0.0018124208123669128, "loss": 2.8484, "step": 8269 }, { "epoch": 0.22, "learning_rate": 0.0018123700592127356, "loss": 2.564, "step": 8270 }, { "epoch": 0.22, "learning_rate": 0.0018123192999041882, "loss": 2.6904, "step": 8271 }, { "epoch": 0.22, "learning_rate": 0.0018122685344416545, "loss": 2.552, "step": 8272 }, { "epoch": 0.22, "learning_rate": 0.00181221776282552, "loss": 2.2359, "step": 8273 }, { "epoch": 0.22, "learning_rate": 0.001812166985056169, "loss": 2.4345, "step": 8274 }, { "epoch": 0.22, "learning_rate": 0.001812116201133986, "loss": 2.4634, "step": 8275 }, { "epoch": 0.22, "learning_rate": 0.0018120654110593557, "loss": 2.5999, "step": 8276 }, { "epoch": 0.22, "learning_rate": 0.0018120146148326633, "loss": 2.6839, "step": 8277 }, { "epoch": 0.22, "learning_rate": 0.0018119638124542933, "loss": 2.7238, "step": 8278 }, { "epoch": 0.22, "learning_rate": 0.0018119130039246307, "loss": 2.5981, "step": 8279 }, { "epoch": 0.22, "learning_rate": 0.00181186218924406, "loss": 2.6347, "step": 8280 }, { "epoch": 0.22, "learning_rate": 0.0018118113684129666, "loss": 2.2735, "step": 8281 }, { "epoch": 0.22, "learning_rate": 0.0018117605414317355, "loss": 2.6581, "step": 8282 }, { "epoch": 0.22, "learning_rate": 0.0018117097083007517, "loss": 2.5127, "step": 8283 }, { "epoch": 0.22, "learning_rate": 0.0018116588690204002, "loss": 2.7976, "step": 8284 }, { "epoch": 0.22, "learning_rate": 0.001811608023591066, "loss": 2.887, "step": 8285 }, { "epoch": 0.22, "learning_rate": 0.001811557172013135, "loss": 2.751, "step": 8286 }, { "epoch": 0.22, "learning_rate": 0.0018115063142869917, "loss": 2.7891, "step": 8287 }, { "epoch": 0.22, "learning_rate": 0.0018114554504130216, "loss": 2.7847, "step": 8288 }, { "epoch": 0.22, "learning_rate": 0.0018114045803916102, "loss": 2.49, "step": 8289 }, { "epoch": 0.22, "learning_rate": 0.0018113537042231424, "loss": 3.0052, "step": 8290 }, { "epoch": 0.22, "learning_rate": 0.0018113028219080049, "loss": 3.0614, "step": 8291 }, { "epoch": 0.22, "learning_rate": 0.0018112519334465814, "loss": 2.8402, "step": 8292 }, { "epoch": 0.22, "learning_rate": 0.0018112010388392585, "loss": 2.4787, "step": 8293 }, { "epoch": 0.22, "learning_rate": 0.0018111501380864215, "loss": 2.8008, "step": 8294 }, { "epoch": 0.22, "learning_rate": 0.0018110992311884564, "loss": 2.9485, "step": 8295 }, { "epoch": 0.22, "learning_rate": 0.0018110483181457482, "loss": 2.4442, "step": 8296 }, { "epoch": 0.22, "learning_rate": 0.001810997398958683, "loss": 2.5113, "step": 8297 }, { "epoch": 0.22, "learning_rate": 0.0018109464736276468, "loss": 2.3058, "step": 8298 }, { "epoch": 0.22, "learning_rate": 0.0018108955421530246, "loss": 2.5747, "step": 8299 }, { "epoch": 0.22, "learning_rate": 0.0018108446045352032, "loss": 2.8003, "step": 8300 }, { "epoch": 0.22, "learning_rate": 0.0018107936607745679, "loss": 2.7096, "step": 8301 }, { "epoch": 0.22, "learning_rate": 0.0018107427108715046, "loss": 2.3854, "step": 8302 }, { "epoch": 0.22, "learning_rate": 0.0018106917548263996, "loss": 2.4681, "step": 8303 }, { "epoch": 0.22, "learning_rate": 0.0018106407926396391, "loss": 2.2298, "step": 8304 }, { "epoch": 0.22, "learning_rate": 0.0018105898243116084, "loss": 2.6566, "step": 8305 }, { "epoch": 0.22, "learning_rate": 0.0018105388498426943, "loss": 2.2676, "step": 8306 }, { "epoch": 0.22, "learning_rate": 0.001810487869233283, "loss": 2.232, "step": 8307 }, { "epoch": 0.22, "learning_rate": 0.00181043688248376, "loss": 2.9126, "step": 8308 }, { "epoch": 0.22, "learning_rate": 0.0018103858895945125, "loss": 2.8493, "step": 8309 }, { "epoch": 0.22, "learning_rate": 0.0018103348905659262, "loss": 2.4423, "step": 8310 }, { "epoch": 0.22, "learning_rate": 0.0018102838853983876, "loss": 2.6016, "step": 8311 }, { "epoch": 0.22, "learning_rate": 0.0018102328740922835, "loss": 3.1121, "step": 8312 }, { "epoch": 0.22, "learning_rate": 0.0018101818566479998, "loss": 2.454, "step": 8313 }, { "epoch": 0.22, "learning_rate": 0.001810130833065923, "loss": 2.7301, "step": 8314 }, { "epoch": 0.22, "learning_rate": 0.00181007980334644, "loss": 2.8487, "step": 8315 }, { "epoch": 0.22, "learning_rate": 0.0018100287674899375, "loss": 2.686, "step": 8316 }, { "epoch": 0.22, "learning_rate": 0.0018099777254968012, "loss": 2.7417, "step": 8317 }, { "epoch": 0.22, "learning_rate": 0.001809926677367419, "loss": 2.585, "step": 8318 }, { "epoch": 0.22, "learning_rate": 0.001809875623102177, "loss": 2.5713, "step": 8319 }, { "epoch": 0.22, "learning_rate": 0.0018098245627014623, "loss": 2.9721, "step": 8320 }, { "epoch": 0.22, "learning_rate": 0.0018097734961656608, "loss": 2.9744, "step": 8321 }, { "epoch": 0.22, "learning_rate": 0.0018097224234951605, "loss": 2.5703, "step": 8322 }, { "epoch": 0.22, "learning_rate": 0.0018096713446903482, "loss": 2.6599, "step": 8323 }, { "epoch": 0.22, "learning_rate": 0.0018096202597516103, "loss": 2.5255, "step": 8324 }, { "epoch": 0.22, "learning_rate": 0.0018095691686793338, "loss": 2.4615, "step": 8325 }, { "epoch": 0.22, "learning_rate": 0.0018095180714739062, "loss": 2.7361, "step": 8326 }, { "epoch": 0.22, "learning_rate": 0.0018094669681357144, "loss": 2.2323, "step": 8327 }, { "epoch": 0.22, "learning_rate": 0.0018094158586651457, "loss": 2.3402, "step": 8328 }, { "epoch": 0.22, "learning_rate": 0.001809364743062587, "loss": 3.0805, "step": 8329 }, { "epoch": 0.22, "learning_rate": 0.0018093136213284259, "loss": 3.0212, "step": 8330 }, { "epoch": 0.22, "learning_rate": 0.0018092624934630494, "loss": 2.7602, "step": 8331 }, { "epoch": 0.22, "learning_rate": 0.0018092113594668448, "loss": 2.8152, "step": 8332 }, { "epoch": 0.22, "learning_rate": 0.0018091602193401996, "loss": 2.4591, "step": 8333 }, { "epoch": 0.22, "learning_rate": 0.0018091090730835014, "loss": 2.5596, "step": 8334 }, { "epoch": 0.22, "learning_rate": 0.0018090579206971374, "loss": 2.5786, "step": 8335 }, { "epoch": 0.22, "learning_rate": 0.0018090067621814954, "loss": 2.5196, "step": 8336 }, { "epoch": 0.22, "learning_rate": 0.0018089555975369627, "loss": 2.6789, "step": 8337 }, { "epoch": 0.22, "learning_rate": 0.001808904426763927, "loss": 2.6754, "step": 8338 }, { "epoch": 0.22, "learning_rate": 0.0018088532498627761, "loss": 2.8547, "step": 8339 }, { "epoch": 0.22, "learning_rate": 0.0018088020668338976, "loss": 2.6974, "step": 8340 }, { "epoch": 0.22, "learning_rate": 0.0018087508776776788, "loss": 2.2979, "step": 8341 }, { "epoch": 0.22, "learning_rate": 0.0018086996823945085, "loss": 2.7346, "step": 8342 }, { "epoch": 0.22, "learning_rate": 0.0018086484809847739, "loss": 2.736, "step": 8343 }, { "epoch": 0.22, "learning_rate": 0.0018085972734488628, "loss": 2.7106, "step": 8344 }, { "epoch": 0.22, "learning_rate": 0.0018085460597871636, "loss": 2.325, "step": 8345 }, { "epoch": 0.22, "learning_rate": 0.0018084948400000633, "loss": 2.6187, "step": 8346 }, { "epoch": 0.22, "learning_rate": 0.0018084436140879514, "loss": 2.7287, "step": 8347 }, { "epoch": 0.22, "learning_rate": 0.001808392382051215, "loss": 2.6042, "step": 8348 }, { "epoch": 0.22, "learning_rate": 0.0018083411438902424, "loss": 2.5226, "step": 8349 }, { "epoch": 0.22, "learning_rate": 0.0018082898996054217, "loss": 2.8825, "step": 8350 }, { "epoch": 0.22, "learning_rate": 0.0018082386491971411, "loss": 2.7482, "step": 8351 }, { "epoch": 0.22, "learning_rate": 0.0018081873926657894, "loss": 2.7758, "step": 8352 }, { "epoch": 0.22, "learning_rate": 0.0018081361300117545, "loss": 2.5621, "step": 8353 }, { "epoch": 0.22, "learning_rate": 0.0018080848612354243, "loss": 2.54, "step": 8354 }, { "epoch": 0.22, "learning_rate": 0.0018080335863371881, "loss": 2.7671, "step": 8355 }, { "epoch": 0.22, "learning_rate": 0.0018079823053174335, "loss": 2.8676, "step": 8356 }, { "epoch": 0.22, "learning_rate": 0.0018079310181765501, "loss": 2.6144, "step": 8357 }, { "epoch": 0.22, "learning_rate": 0.001807879724914925, "loss": 3.0084, "step": 8358 }, { "epoch": 0.22, "learning_rate": 0.001807828425532948, "loss": 2.4549, "step": 8359 }, { "epoch": 0.22, "learning_rate": 0.001807777120031007, "loss": 2.9797, "step": 8360 }, { "epoch": 0.22, "learning_rate": 0.001807725808409491, "loss": 2.4982, "step": 8361 }, { "epoch": 0.22, "learning_rate": 0.001807674490668789, "loss": 2.7392, "step": 8362 }, { "epoch": 0.22, "learning_rate": 0.001807623166809289, "loss": 2.7712, "step": 8363 }, { "epoch": 0.22, "learning_rate": 0.0018075718368313807, "loss": 2.5485, "step": 8364 }, { "epoch": 0.22, "learning_rate": 0.0018075205007354524, "loss": 2.6181, "step": 8365 }, { "epoch": 0.22, "learning_rate": 0.001807469158521893, "loss": 2.5925, "step": 8366 }, { "epoch": 0.22, "learning_rate": 0.0018074178101910917, "loss": 2.8735, "step": 8367 }, { "epoch": 0.22, "learning_rate": 0.0018073664557434375, "loss": 2.5635, "step": 8368 }, { "epoch": 0.22, "learning_rate": 0.0018073150951793192, "loss": 2.2742, "step": 8369 }, { "epoch": 0.22, "learning_rate": 0.0018072637284991262, "loss": 2.8804, "step": 8370 }, { "epoch": 0.22, "learning_rate": 0.0018072123557032476, "loss": 2.8016, "step": 8371 }, { "epoch": 0.22, "learning_rate": 0.0018071609767920725, "loss": 2.509, "step": 8372 }, { "epoch": 0.23, "learning_rate": 0.00180710959176599, "loss": 2.6786, "step": 8373 }, { "epoch": 0.23, "learning_rate": 0.0018070582006253894, "loss": 2.3921, "step": 8374 }, { "epoch": 0.23, "learning_rate": 0.0018070068033706607, "loss": 2.7494, "step": 8375 }, { "epoch": 0.23, "learning_rate": 0.0018069554000021922, "loss": 2.3891, "step": 8376 }, { "epoch": 0.23, "learning_rate": 0.0018069039905203742, "loss": 2.7247, "step": 8377 }, { "epoch": 0.23, "learning_rate": 0.0018068525749255957, "loss": 2.3938, "step": 8378 }, { "epoch": 0.23, "learning_rate": 0.0018068011532182463, "loss": 2.4881, "step": 8379 }, { "epoch": 0.23, "learning_rate": 0.0018067497253987156, "loss": 2.8376, "step": 8380 }, { "epoch": 0.23, "learning_rate": 0.0018066982914673932, "loss": 2.7955, "step": 8381 }, { "epoch": 0.23, "learning_rate": 0.0018066468514246687, "loss": 2.6924, "step": 8382 }, { "epoch": 0.23, "learning_rate": 0.001806595405270932, "loss": 2.6594, "step": 8383 }, { "epoch": 0.23, "learning_rate": 0.0018065439530065728, "loss": 2.6657, "step": 8384 }, { "epoch": 0.23, "learning_rate": 0.0018064924946319808, "loss": 2.6516, "step": 8385 }, { "epoch": 0.23, "learning_rate": 0.0018064410301475457, "loss": 2.3842, "step": 8386 }, { "epoch": 0.23, "learning_rate": 0.0018063895595536576, "loss": 2.4422, "step": 8387 }, { "epoch": 0.23, "learning_rate": 0.0018063380828507063, "loss": 2.7058, "step": 8388 }, { "epoch": 0.23, "learning_rate": 0.0018062866000390818, "loss": 2.8269, "step": 8389 }, { "epoch": 0.23, "learning_rate": 0.0018062351111191744, "loss": 2.222, "step": 8390 }, { "epoch": 0.23, "learning_rate": 0.001806183616091374, "loss": 2.9128, "step": 8391 }, { "epoch": 0.23, "learning_rate": 0.0018061321149560703, "loss": 2.712, "step": 8392 }, { "epoch": 0.23, "learning_rate": 0.0018060806077136538, "loss": 3.0877, "step": 8393 }, { "epoch": 0.23, "learning_rate": 0.001806029094364515, "loss": 2.9353, "step": 8394 }, { "epoch": 0.23, "learning_rate": 0.0018059775749090438, "loss": 2.7876, "step": 8395 }, { "epoch": 0.23, "learning_rate": 0.0018059260493476306, "loss": 2.5928, "step": 8396 }, { "epoch": 0.23, "learning_rate": 0.0018058745176806658, "loss": 2.8008, "step": 8397 }, { "epoch": 0.23, "learning_rate": 0.0018058229799085396, "loss": 2.8264, "step": 8398 }, { "epoch": 0.23, "learning_rate": 0.0018057714360316427, "loss": 2.4076, "step": 8399 }, { "epoch": 0.23, "learning_rate": 0.0018057198860503654, "loss": 2.4392, "step": 8400 }, { "epoch": 0.23, "learning_rate": 0.0018056683299650983, "loss": 2.4324, "step": 8401 }, { "epoch": 0.23, "learning_rate": 0.0018056167677762318, "loss": 2.6999, "step": 8402 }, { "epoch": 0.23, "learning_rate": 0.001805565199484157, "loss": 2.8258, "step": 8403 }, { "epoch": 0.23, "learning_rate": 0.001805513625089264, "loss": 2.7143, "step": 8404 }, { "epoch": 0.23, "learning_rate": 0.001805462044591944, "loss": 2.3643, "step": 8405 }, { "epoch": 0.23, "learning_rate": 0.0018054104579925873, "loss": 2.5598, "step": 8406 }, { "epoch": 0.23, "learning_rate": 0.001805358865291585, "loss": 2.6175, "step": 8407 }, { "epoch": 0.23, "learning_rate": 0.0018053072664893284, "loss": 2.5942, "step": 8408 }, { "epoch": 0.23, "learning_rate": 0.0018052556615862074, "loss": 3.0265, "step": 8409 }, { "epoch": 0.23, "learning_rate": 0.0018052040505826138, "loss": 2.7121, "step": 8410 }, { "epoch": 0.23, "learning_rate": 0.001805152433478938, "loss": 2.5832, "step": 8411 }, { "epoch": 0.23, "learning_rate": 0.0018051008102755715, "loss": 2.3863, "step": 8412 }, { "epoch": 0.23, "learning_rate": 0.001805049180972905, "loss": 2.2081, "step": 8413 }, { "epoch": 0.23, "learning_rate": 0.0018049975455713299, "loss": 2.5172, "step": 8414 }, { "epoch": 0.23, "learning_rate": 0.0018049459040712374, "loss": 2.4335, "step": 8415 }, { "epoch": 0.23, "learning_rate": 0.0018048942564730186, "loss": 2.4619, "step": 8416 }, { "epoch": 0.23, "learning_rate": 0.0018048426027770649, "loss": 3.0212, "step": 8417 }, { "epoch": 0.23, "learning_rate": 0.0018047909429837674, "loss": 2.7623, "step": 8418 }, { "epoch": 0.23, "learning_rate": 0.0018047392770935177, "loss": 2.9041, "step": 8419 }, { "epoch": 0.23, "learning_rate": 0.0018046876051067068, "loss": 2.4782, "step": 8420 }, { "epoch": 0.23, "learning_rate": 0.0018046359270237268, "loss": 2.9793, "step": 8421 }, { "epoch": 0.23, "learning_rate": 0.001804584242844969, "loss": 3.0317, "step": 8422 }, { "epoch": 0.23, "learning_rate": 0.0018045325525708248, "loss": 2.5735, "step": 8423 }, { "epoch": 0.23, "learning_rate": 0.0018044808562016855, "loss": 2.7512, "step": 8424 }, { "epoch": 0.23, "learning_rate": 0.0018044291537379431, "loss": 2.4743, "step": 8425 }, { "epoch": 0.23, "learning_rate": 0.0018043774451799895, "loss": 2.9882, "step": 8426 }, { "epoch": 0.23, "learning_rate": 0.0018043257305282161, "loss": 2.652, "step": 8427 }, { "epoch": 0.23, "learning_rate": 0.001804274009783015, "loss": 2.5902, "step": 8428 }, { "epoch": 0.23, "learning_rate": 0.0018042222829447773, "loss": 2.5354, "step": 8429 }, { "epoch": 0.23, "learning_rate": 0.0018041705500138954, "loss": 2.2514, "step": 8430 }, { "epoch": 0.23, "learning_rate": 0.0018041188109907615, "loss": 2.6663, "step": 8431 }, { "epoch": 0.23, "learning_rate": 0.001804067065875767, "loss": 2.6798, "step": 8432 }, { "epoch": 0.23, "learning_rate": 0.0018040153146693045, "loss": 2.9719, "step": 8433 }, { "epoch": 0.23, "learning_rate": 0.0018039635573717653, "loss": 2.4536, "step": 8434 }, { "epoch": 0.23, "learning_rate": 0.0018039117939835422, "loss": 3.0197, "step": 8435 }, { "epoch": 0.23, "learning_rate": 0.001803860024505027, "loss": 2.3321, "step": 8436 }, { "epoch": 0.23, "learning_rate": 0.0018038082489366118, "loss": 2.7832, "step": 8437 }, { "epoch": 0.23, "learning_rate": 0.0018037564672786892, "loss": 2.4959, "step": 8438 }, { "epoch": 0.23, "learning_rate": 0.0018037046795316514, "loss": 2.6352, "step": 8439 }, { "epoch": 0.23, "learning_rate": 0.0018036528856958905, "loss": 2.5622, "step": 8440 }, { "epoch": 0.23, "learning_rate": 0.0018036010857717991, "loss": 2.7678, "step": 8441 }, { "epoch": 0.23, "learning_rate": 0.0018035492797597694, "loss": 2.2201, "step": 8442 }, { "epoch": 0.23, "learning_rate": 0.001803497467660194, "loss": 2.7144, "step": 8443 }, { "epoch": 0.23, "learning_rate": 0.0018034456494734658, "loss": 2.6023, "step": 8444 }, { "epoch": 0.23, "learning_rate": 0.0018033938251999766, "loss": 2.9896, "step": 8445 }, { "epoch": 0.23, "learning_rate": 0.0018033419948401195, "loss": 2.6707, "step": 8446 }, { "epoch": 0.23, "learning_rate": 0.0018032901583942872, "loss": 3.0056, "step": 8447 }, { "epoch": 0.23, "learning_rate": 0.0018032383158628723, "loss": 2.3859, "step": 8448 }, { "epoch": 0.23, "learning_rate": 0.0018031864672462673, "loss": 2.3771, "step": 8449 }, { "epoch": 0.23, "learning_rate": 0.0018031346125448652, "loss": 2.8216, "step": 8450 }, { "epoch": 0.23, "learning_rate": 0.001803082751759059, "loss": 2.6986, "step": 8451 }, { "epoch": 0.23, "learning_rate": 0.0018030308848892417, "loss": 2.6064, "step": 8452 }, { "epoch": 0.23, "learning_rate": 0.0018029790119358056, "loss": 2.8321, "step": 8453 }, { "epoch": 0.23, "learning_rate": 0.0018029271328991441, "loss": 2.599, "step": 8454 }, { "epoch": 0.23, "learning_rate": 0.0018028752477796503, "loss": 2.3007, "step": 8455 }, { "epoch": 0.23, "learning_rate": 0.0018028233565777173, "loss": 2.87, "step": 8456 }, { "epoch": 0.23, "learning_rate": 0.0018027714592937377, "loss": 2.9453, "step": 8457 }, { "epoch": 0.23, "learning_rate": 0.0018027195559281056, "loss": 2.7173, "step": 8458 }, { "epoch": 0.23, "learning_rate": 0.0018026676464812132, "loss": 2.839, "step": 8459 }, { "epoch": 0.23, "learning_rate": 0.0018026157309534543, "loss": 2.6523, "step": 8460 }, { "epoch": 0.23, "learning_rate": 0.0018025638093452222, "loss": 2.5745, "step": 8461 }, { "epoch": 0.23, "learning_rate": 0.0018025118816569102, "loss": 2.2632, "step": 8462 }, { "epoch": 0.23, "learning_rate": 0.0018024599478889116, "loss": 2.5871, "step": 8463 }, { "epoch": 0.23, "learning_rate": 0.0018024080080416198, "loss": 2.7182, "step": 8464 }, { "epoch": 0.23, "learning_rate": 0.0018023560621154284, "loss": 3.2708, "step": 8465 }, { "epoch": 0.23, "learning_rate": 0.001802304110110731, "loss": 2.4304, "step": 8466 }, { "epoch": 0.23, "learning_rate": 0.0018022521520279211, "loss": 2.9333, "step": 8467 }, { "epoch": 0.23, "learning_rate": 0.0018022001878673923, "loss": 2.8479, "step": 8468 }, { "epoch": 0.23, "learning_rate": 0.0018021482176295385, "loss": 2.8153, "step": 8469 }, { "epoch": 0.23, "learning_rate": 0.0018020962413147531, "loss": 2.6121, "step": 8470 }, { "epoch": 0.23, "learning_rate": 0.0018020442589234298, "loss": 2.4911, "step": 8471 }, { "epoch": 0.23, "learning_rate": 0.0018019922704559628, "loss": 2.4833, "step": 8472 }, { "epoch": 0.23, "learning_rate": 0.0018019402759127457, "loss": 2.413, "step": 8473 }, { "epoch": 0.23, "learning_rate": 0.0018018882752941724, "loss": 2.6537, "step": 8474 }, { "epoch": 0.23, "learning_rate": 0.0018018362686006368, "loss": 2.7149, "step": 8475 }, { "epoch": 0.23, "learning_rate": 0.001801784255832533, "loss": 2.3094, "step": 8476 }, { "epoch": 0.23, "learning_rate": 0.0018017322369902554, "loss": 2.6008, "step": 8477 }, { "epoch": 0.23, "learning_rate": 0.0018016802120741971, "loss": 2.6615, "step": 8478 }, { "epoch": 0.23, "learning_rate": 0.0018016281810847533, "loss": 2.5761, "step": 8479 }, { "epoch": 0.23, "learning_rate": 0.0018015761440223176, "loss": 2.1627, "step": 8480 }, { "epoch": 0.23, "learning_rate": 0.0018015241008872843, "loss": 2.6584, "step": 8481 }, { "epoch": 0.23, "learning_rate": 0.0018014720516800478, "loss": 2.5288, "step": 8482 }, { "epoch": 0.23, "learning_rate": 0.0018014199964010021, "loss": 2.831, "step": 8483 }, { "epoch": 0.23, "learning_rate": 0.0018013679350505419, "loss": 2.9355, "step": 8484 }, { "epoch": 0.23, "learning_rate": 0.0018013158676290614, "loss": 2.5339, "step": 8485 }, { "epoch": 0.23, "learning_rate": 0.0018012637941369554, "loss": 2.4006, "step": 8486 }, { "epoch": 0.23, "learning_rate": 0.001801211714574618, "loss": 2.6367, "step": 8487 }, { "epoch": 0.23, "learning_rate": 0.0018011596289424436, "loss": 2.5933, "step": 8488 }, { "epoch": 0.23, "learning_rate": 0.0018011075372408277, "loss": 2.6133, "step": 8489 }, { "epoch": 0.23, "learning_rate": 0.001801055439470164, "loss": 2.4007, "step": 8490 }, { "epoch": 0.23, "learning_rate": 0.0018010033356308478, "loss": 2.6542, "step": 8491 }, { "epoch": 0.23, "learning_rate": 0.001800951225723273, "loss": 2.847, "step": 8492 }, { "epoch": 0.23, "learning_rate": 0.001800899109747835, "loss": 2.5601, "step": 8493 }, { "epoch": 0.23, "learning_rate": 0.001800846987704929, "loss": 2.3378, "step": 8494 }, { "epoch": 0.23, "learning_rate": 0.001800794859594949, "loss": 2.5034, "step": 8495 }, { "epoch": 0.23, "learning_rate": 0.0018007427254182905, "loss": 2.6587, "step": 8496 }, { "epoch": 0.23, "learning_rate": 0.001800690585175348, "loss": 2.3687, "step": 8497 }, { "epoch": 0.23, "learning_rate": 0.0018006384388665172, "loss": 2.6849, "step": 8498 }, { "epoch": 0.23, "learning_rate": 0.0018005862864921922, "loss": 2.901, "step": 8499 }, { "epoch": 0.23, "learning_rate": 0.001800534128052769, "loss": 2.6663, "step": 8500 }, { "epoch": 0.23, "learning_rate": 0.0018004819635486422, "loss": 2.3785, "step": 8501 }, { "epoch": 0.23, "learning_rate": 0.0018004297929802074, "loss": 2.8828, "step": 8502 }, { "epoch": 0.23, "learning_rate": 0.0018003776163478594, "loss": 2.5984, "step": 8503 }, { "epoch": 0.23, "learning_rate": 0.0018003254336519938, "loss": 2.8719, "step": 8504 }, { "epoch": 0.23, "learning_rate": 0.0018002732448930056, "loss": 2.3202, "step": 8505 }, { "epoch": 0.23, "learning_rate": 0.0018002210500712903, "loss": 2.4708, "step": 8506 }, { "epoch": 0.23, "learning_rate": 0.001800168849187244, "loss": 2.8155, "step": 8507 }, { "epoch": 0.23, "learning_rate": 0.0018001166422412606, "loss": 2.4286, "step": 8508 }, { "epoch": 0.23, "learning_rate": 0.0018000644292337374, "loss": 2.4725, "step": 8509 }, { "epoch": 0.23, "learning_rate": 0.0018000122101650686, "loss": 2.5342, "step": 8510 }, { "epoch": 0.23, "learning_rate": 0.0017999599850356508, "loss": 2.5825, "step": 8511 }, { "epoch": 0.23, "learning_rate": 0.0017999077538458788, "loss": 2.2522, "step": 8512 }, { "epoch": 0.23, "learning_rate": 0.0017998555165961488, "loss": 2.5101, "step": 8513 }, { "epoch": 0.23, "learning_rate": 0.0017998032732868562, "loss": 2.7385, "step": 8514 }, { "epoch": 0.23, "learning_rate": 0.0017997510239183975, "loss": 2.7359, "step": 8515 }, { "epoch": 0.23, "learning_rate": 0.0017996987684911674, "loss": 2.7925, "step": 8516 }, { "epoch": 0.23, "learning_rate": 0.001799646507005563, "loss": 2.7546, "step": 8517 }, { "epoch": 0.23, "learning_rate": 0.0017995942394619792, "loss": 2.7425, "step": 8518 }, { "epoch": 0.23, "learning_rate": 0.0017995419658608123, "loss": 2.8584, "step": 8519 }, { "epoch": 0.23, "learning_rate": 0.0017994896862024588, "loss": 2.9252, "step": 8520 }, { "epoch": 0.23, "learning_rate": 0.0017994374004873142, "loss": 2.8955, "step": 8521 }, { "epoch": 0.23, "learning_rate": 0.0017993851087157748, "loss": 2.7214, "step": 8522 }, { "epoch": 0.23, "learning_rate": 0.0017993328108882368, "loss": 2.841, "step": 8523 }, { "epoch": 0.23, "learning_rate": 0.0017992805070050962, "loss": 2.278, "step": 8524 }, { "epoch": 0.23, "learning_rate": 0.0017992281970667494, "loss": 2.1993, "step": 8525 }, { "epoch": 0.23, "learning_rate": 0.0017991758810735929, "loss": 3.1317, "step": 8526 }, { "epoch": 0.23, "learning_rate": 0.0017991235590260224, "loss": 2.5822, "step": 8527 }, { "epoch": 0.23, "learning_rate": 0.001799071230924435, "loss": 2.8685, "step": 8528 }, { "epoch": 0.23, "learning_rate": 0.0017990188967692267, "loss": 2.4295, "step": 8529 }, { "epoch": 0.23, "learning_rate": 0.001798966556560794, "loss": 2.3627, "step": 8530 }, { "epoch": 0.23, "learning_rate": 0.0017989142102995336, "loss": 2.9795, "step": 8531 }, { "epoch": 0.23, "learning_rate": 0.001798861857985842, "loss": 2.5415, "step": 8532 }, { "epoch": 0.23, "learning_rate": 0.0017988094996201159, "loss": 3.201, "step": 8533 }, { "epoch": 0.23, "learning_rate": 0.0017987571352027513, "loss": 2.7256, "step": 8534 }, { "epoch": 0.23, "learning_rate": 0.0017987047647341462, "loss": 2.3862, "step": 8535 }, { "epoch": 0.23, "learning_rate": 0.001798652388214696, "loss": 2.4786, "step": 8536 }, { "epoch": 0.23, "learning_rate": 0.0017986000056447985, "loss": 2.5986, "step": 8537 }, { "epoch": 0.23, "learning_rate": 0.00179854761702485, "loss": 2.3983, "step": 8538 }, { "epoch": 0.23, "learning_rate": 0.0017984952223552475, "loss": 2.5374, "step": 8539 }, { "epoch": 0.23, "learning_rate": 0.001798442821636388, "loss": 2.5163, "step": 8540 }, { "epoch": 0.23, "learning_rate": 0.0017983904148686683, "loss": 2.4509, "step": 8541 }, { "epoch": 0.23, "learning_rate": 0.0017983380020524858, "loss": 2.4541, "step": 8542 }, { "epoch": 0.23, "learning_rate": 0.0017982855831882372, "loss": 2.9873, "step": 8543 }, { "epoch": 0.23, "learning_rate": 0.0017982331582763196, "loss": 2.4113, "step": 8544 }, { "epoch": 0.23, "learning_rate": 0.0017981807273171305, "loss": 2.0886, "step": 8545 }, { "epoch": 0.23, "learning_rate": 0.0017981282903110668, "loss": 2.9658, "step": 8546 }, { "epoch": 0.23, "learning_rate": 0.0017980758472585258, "loss": 2.4666, "step": 8547 }, { "epoch": 0.23, "learning_rate": 0.001798023398159905, "loss": 2.9461, "step": 8548 }, { "epoch": 0.23, "learning_rate": 0.0017979709430156015, "loss": 2.4794, "step": 8549 }, { "epoch": 0.23, "learning_rate": 0.001797918481826013, "loss": 2.6661, "step": 8550 }, { "epoch": 0.23, "learning_rate": 0.0017978660145915365, "loss": 2.3764, "step": 8551 }, { "epoch": 0.23, "learning_rate": 0.0017978135413125697, "loss": 2.6796, "step": 8552 }, { "epoch": 0.23, "learning_rate": 0.0017977610619895105, "loss": 2.3756, "step": 8553 }, { "epoch": 0.23, "learning_rate": 0.001797708576622756, "loss": 2.3416, "step": 8554 }, { "epoch": 0.23, "learning_rate": 0.0017976560852127036, "loss": 2.2238, "step": 8555 }, { "epoch": 0.23, "learning_rate": 0.0017976035877597517, "loss": 2.8869, "step": 8556 }, { "epoch": 0.23, "learning_rate": 0.0017975510842642972, "loss": 2.5941, "step": 8557 }, { "epoch": 0.23, "learning_rate": 0.0017974985747267387, "loss": 2.8891, "step": 8558 }, { "epoch": 0.23, "learning_rate": 0.0017974460591474732, "loss": 2.7721, "step": 8559 }, { "epoch": 0.23, "learning_rate": 0.001797393537526899, "loss": 2.2644, "step": 8560 }, { "epoch": 0.23, "learning_rate": 0.001797341009865414, "loss": 2.7151, "step": 8561 }, { "epoch": 0.23, "learning_rate": 0.0017972884761634164, "loss": 2.5978, "step": 8562 }, { "epoch": 0.23, "learning_rate": 0.0017972359364213032, "loss": 2.056, "step": 8563 }, { "epoch": 0.23, "learning_rate": 0.0017971833906394736, "loss": 3.0566, "step": 8564 }, { "epoch": 0.23, "learning_rate": 0.0017971308388183252, "loss": 2.8385, "step": 8565 }, { "epoch": 0.23, "learning_rate": 0.0017970782809582557, "loss": 2.4335, "step": 8566 }, { "epoch": 0.23, "learning_rate": 0.0017970257170596639, "loss": 2.6823, "step": 8567 }, { "epoch": 0.23, "learning_rate": 0.0017969731471229476, "loss": 3.1024, "step": 8568 }, { "epoch": 0.23, "learning_rate": 0.0017969205711485055, "loss": 2.7219, "step": 8569 }, { "epoch": 0.23, "learning_rate": 0.0017968679891367351, "loss": 2.2482, "step": 8570 }, { "epoch": 0.23, "learning_rate": 0.0017968154010880358, "loss": 2.752, "step": 8571 }, { "epoch": 0.23, "learning_rate": 0.0017967628070028052, "loss": 2.5149, "step": 8572 }, { "epoch": 0.23, "learning_rate": 0.0017967102068814423, "loss": 2.857, "step": 8573 }, { "epoch": 0.23, "learning_rate": 0.001796657600724345, "loss": 2.6808, "step": 8574 }, { "epoch": 0.23, "learning_rate": 0.0017966049885319122, "loss": 2.6919, "step": 8575 }, { "epoch": 0.23, "learning_rate": 0.0017965523703045425, "loss": 2.785, "step": 8576 }, { "epoch": 0.23, "learning_rate": 0.0017964997460426344, "loss": 2.5352, "step": 8577 }, { "epoch": 0.23, "learning_rate": 0.0017964471157465866, "loss": 2.4014, "step": 8578 }, { "epoch": 0.23, "learning_rate": 0.0017963944794167981, "loss": 2.6244, "step": 8579 }, { "epoch": 0.23, "learning_rate": 0.0017963418370536672, "loss": 2.6491, "step": 8580 }, { "epoch": 0.23, "learning_rate": 0.001796289188657593, "loss": 2.7233, "step": 8581 }, { "epoch": 0.23, "learning_rate": 0.0017962365342289739, "loss": 2.505, "step": 8582 }, { "epoch": 0.23, "learning_rate": 0.0017961838737682097, "loss": 2.747, "step": 8583 }, { "epoch": 0.23, "learning_rate": 0.0017961312072756986, "loss": 2.258, "step": 8584 }, { "epoch": 0.23, "learning_rate": 0.0017960785347518398, "loss": 2.5408, "step": 8585 }, { "epoch": 0.23, "learning_rate": 0.0017960258561970322, "loss": 2.3795, "step": 8586 }, { "epoch": 0.23, "learning_rate": 0.0017959731716116751, "loss": 2.4746, "step": 8587 }, { "epoch": 0.23, "learning_rate": 0.0017959204809961677, "loss": 3.0, "step": 8588 }, { "epoch": 0.23, "learning_rate": 0.0017958677843509091, "loss": 2.8389, "step": 8589 }, { "epoch": 0.23, "learning_rate": 0.0017958150816762984, "loss": 2.443, "step": 8590 }, { "epoch": 0.23, "learning_rate": 0.0017957623729727347, "loss": 2.516, "step": 8591 }, { "epoch": 0.23, "learning_rate": 0.0017957096582406175, "loss": 2.8368, "step": 8592 }, { "epoch": 0.23, "learning_rate": 0.0017956569374803467, "loss": 2.3853, "step": 8593 }, { "epoch": 0.23, "learning_rate": 0.0017956042106923207, "loss": 2.8531, "step": 8594 }, { "epoch": 0.23, "learning_rate": 0.0017955514778769395, "loss": 2.6624, "step": 8595 }, { "epoch": 0.23, "learning_rate": 0.0017954987390346028, "loss": 2.3113, "step": 8596 }, { "epoch": 0.23, "learning_rate": 0.0017954459941657097, "loss": 2.8337, "step": 8597 }, { "epoch": 0.23, "learning_rate": 0.0017953932432706599, "loss": 2.9885, "step": 8598 }, { "epoch": 0.23, "learning_rate": 0.0017953404863498533, "loss": 2.4423, "step": 8599 }, { "epoch": 0.23, "learning_rate": 0.001795287723403689, "loss": 2.2843, "step": 8600 }, { "epoch": 0.23, "learning_rate": 0.0017952349544325674, "loss": 2.592, "step": 8601 }, { "epoch": 0.23, "learning_rate": 0.0017951821794368879, "loss": 2.4627, "step": 8602 }, { "epoch": 0.23, "learning_rate": 0.0017951293984170503, "loss": 2.7802, "step": 8603 }, { "epoch": 0.23, "learning_rate": 0.0017950766113734545, "loss": 2.3236, "step": 8604 }, { "epoch": 0.23, "learning_rate": 0.0017950238183065007, "loss": 2.291, "step": 8605 }, { "epoch": 0.23, "learning_rate": 0.0017949710192165882, "loss": 2.7309, "step": 8606 }, { "epoch": 0.23, "learning_rate": 0.0017949182141041176, "loss": 2.968, "step": 8607 }, { "epoch": 0.23, "learning_rate": 0.0017948654029694888, "loss": 2.594, "step": 8608 }, { "epoch": 0.23, "learning_rate": 0.0017948125858131018, "loss": 2.3832, "step": 8609 }, { "epoch": 0.23, "learning_rate": 0.0017947597626353567, "loss": 2.2784, "step": 8610 }, { "epoch": 0.23, "learning_rate": 0.0017947069334366538, "loss": 2.6966, "step": 8611 }, { "epoch": 0.23, "learning_rate": 0.001794654098217393, "loss": 2.6568, "step": 8612 }, { "epoch": 0.23, "learning_rate": 0.001794601256977975, "loss": 2.9467, "step": 8613 }, { "epoch": 0.23, "learning_rate": 0.0017945484097188, "loss": 2.9304, "step": 8614 }, { "epoch": 0.23, "learning_rate": 0.0017944955564402681, "loss": 2.9595, "step": 8615 }, { "epoch": 0.23, "learning_rate": 0.0017944426971427802, "loss": 2.2559, "step": 8616 }, { "epoch": 0.23, "learning_rate": 0.0017943898318267361, "loss": 2.1964, "step": 8617 }, { "epoch": 0.23, "learning_rate": 0.001794336960492537, "loss": 2.7295, "step": 8618 }, { "epoch": 0.23, "learning_rate": 0.001794284083140583, "loss": 2.396, "step": 8619 }, { "epoch": 0.23, "learning_rate": 0.0017942311997712745, "loss": 2.4022, "step": 8620 }, { "epoch": 0.23, "learning_rate": 0.0017941783103850128, "loss": 2.787, "step": 8621 }, { "epoch": 0.23, "learning_rate": 0.0017941254149821983, "loss": 2.5754, "step": 8622 }, { "epoch": 0.23, "learning_rate": 0.0017940725135632315, "loss": 2.2469, "step": 8623 }, { "epoch": 0.23, "learning_rate": 0.001794019606128513, "loss": 2.6245, "step": 8624 }, { "epoch": 0.23, "learning_rate": 0.0017939666926784443, "loss": 2.7875, "step": 8625 }, { "epoch": 0.23, "learning_rate": 0.0017939137732134256, "loss": 2.7304, "step": 8626 }, { "epoch": 0.23, "learning_rate": 0.0017938608477338584, "loss": 2.7254, "step": 8627 }, { "epoch": 0.23, "learning_rate": 0.001793807916240143, "loss": 2.8157, "step": 8628 }, { "epoch": 0.23, "learning_rate": 0.0017937549787326809, "loss": 2.2492, "step": 8629 }, { "epoch": 0.23, "learning_rate": 0.001793702035211873, "loss": 2.9578, "step": 8630 }, { "epoch": 0.23, "learning_rate": 0.0017936490856781202, "loss": 2.1704, "step": 8631 }, { "epoch": 0.23, "learning_rate": 0.0017935961301318239, "loss": 2.6169, "step": 8632 }, { "epoch": 0.23, "learning_rate": 0.0017935431685733856, "loss": 2.6857, "step": 8633 }, { "epoch": 0.23, "learning_rate": 0.0017934902010032056, "loss": 2.6862, "step": 8634 }, { "epoch": 0.23, "learning_rate": 0.0017934372274216858, "loss": 2.6345, "step": 8635 }, { "epoch": 0.23, "learning_rate": 0.0017933842478292277, "loss": 2.5363, "step": 8636 }, { "epoch": 0.23, "learning_rate": 0.0017933312622262323, "loss": 2.6769, "step": 8637 }, { "epoch": 0.23, "learning_rate": 0.001793278270613101, "loss": 2.6506, "step": 8638 }, { "epoch": 0.23, "learning_rate": 0.0017932252729902353, "loss": 2.4765, "step": 8639 }, { "epoch": 0.23, "learning_rate": 0.0017931722693580367, "loss": 2.755, "step": 8640 }, { "epoch": 0.23, "learning_rate": 0.001793119259716907, "loss": 3.1587, "step": 8641 }, { "epoch": 0.23, "learning_rate": 0.0017930662440672474, "loss": 2.5459, "step": 8642 }, { "epoch": 0.23, "learning_rate": 0.00179301322240946, "loss": 2.736, "step": 8643 }, { "epoch": 0.23, "learning_rate": 0.001792960194743946, "loss": 2.5643, "step": 8644 }, { "epoch": 0.23, "learning_rate": 0.0017929071610711072, "loss": 2.7153, "step": 8645 }, { "epoch": 0.23, "learning_rate": 0.0017928541213913457, "loss": 2.4151, "step": 8646 }, { "epoch": 0.23, "learning_rate": 0.001792801075705063, "loss": 2.7201, "step": 8647 }, { "epoch": 0.23, "learning_rate": 0.0017927480240126613, "loss": 2.7191, "step": 8648 }, { "epoch": 0.23, "learning_rate": 0.0017926949663145421, "loss": 2.4906, "step": 8649 }, { "epoch": 0.23, "learning_rate": 0.0017926419026111078, "loss": 2.2511, "step": 8650 }, { "epoch": 0.23, "learning_rate": 0.00179258883290276, "loss": 2.9707, "step": 8651 }, { "epoch": 0.23, "learning_rate": 0.0017925357571899009, "loss": 2.5867, "step": 8652 }, { "epoch": 0.23, "learning_rate": 0.0017924826754729323, "loss": 2.8573, "step": 8653 }, { "epoch": 0.23, "learning_rate": 0.001792429587752257, "loss": 2.149, "step": 8654 }, { "epoch": 0.23, "learning_rate": 0.0017923764940282769, "loss": 2.6422, "step": 8655 }, { "epoch": 0.23, "learning_rate": 0.0017923233943013938, "loss": 2.3314, "step": 8656 }, { "epoch": 0.23, "learning_rate": 0.0017922702885720106, "loss": 3.2633, "step": 8657 }, { "epoch": 0.23, "learning_rate": 0.0017922171768405292, "loss": 2.6239, "step": 8658 }, { "epoch": 0.23, "learning_rate": 0.001792164059107352, "loss": 2.3359, "step": 8659 }, { "epoch": 0.23, "learning_rate": 0.001792110935372882, "loss": 2.1057, "step": 8660 }, { "epoch": 0.23, "learning_rate": 0.0017920578056375206, "loss": 2.7452, "step": 8661 }, { "epoch": 0.23, "learning_rate": 0.001792004669901671, "loss": 2.4594, "step": 8662 }, { "epoch": 0.23, "learning_rate": 0.0017919515281657357, "loss": 2.6983, "step": 8663 }, { "epoch": 0.23, "learning_rate": 0.0017918983804301174, "loss": 2.9776, "step": 8664 }, { "epoch": 0.23, "learning_rate": 0.0017918452266952184, "loss": 2.6745, "step": 8665 }, { "epoch": 0.23, "learning_rate": 0.0017917920669614413, "loss": 2.6516, "step": 8666 }, { "epoch": 0.23, "learning_rate": 0.0017917389012291893, "loss": 2.3932, "step": 8667 }, { "epoch": 0.23, "learning_rate": 0.0017916857294988649, "loss": 2.4205, "step": 8668 }, { "epoch": 0.23, "learning_rate": 0.0017916325517708712, "loss": 2.2011, "step": 8669 }, { "epoch": 0.23, "learning_rate": 0.0017915793680456104, "loss": 2.8437, "step": 8670 }, { "epoch": 0.23, "learning_rate": 0.001791526178323486, "loss": 2.5125, "step": 8671 }, { "epoch": 0.23, "learning_rate": 0.0017914729826049008, "loss": 3.0344, "step": 8672 }, { "epoch": 0.23, "learning_rate": 0.0017914197808902577, "loss": 3.0646, "step": 8673 }, { "epoch": 0.23, "learning_rate": 0.00179136657317996, "loss": 2.5992, "step": 8674 }, { "epoch": 0.23, "learning_rate": 0.0017913133594744104, "loss": 2.5858, "step": 8675 }, { "epoch": 0.23, "learning_rate": 0.0017912601397740123, "loss": 3.4618, "step": 8676 }, { "epoch": 0.23, "learning_rate": 0.0017912069140791692, "loss": 2.5814, "step": 8677 }, { "epoch": 0.23, "learning_rate": 0.0017911536823902834, "loss": 2.3328, "step": 8678 }, { "epoch": 0.23, "learning_rate": 0.0017911004447077592, "loss": 2.877, "step": 8679 }, { "epoch": 0.23, "learning_rate": 0.0017910472010319995, "loss": 2.9133, "step": 8680 }, { "epoch": 0.23, "learning_rate": 0.001790993951363407, "loss": 2.3044, "step": 8681 }, { "epoch": 0.23, "learning_rate": 0.0017909406957023863, "loss": 2.6174, "step": 8682 }, { "epoch": 0.23, "learning_rate": 0.0017908874340493402, "loss": 2.5493, "step": 8683 }, { "epoch": 0.23, "learning_rate": 0.0017908341664046726, "loss": 3.2412, "step": 8684 }, { "epoch": 0.23, "learning_rate": 0.0017907808927687863, "loss": 2.4868, "step": 8685 }, { "epoch": 0.23, "learning_rate": 0.0017907276131420853, "loss": 2.7383, "step": 8686 }, { "epoch": 0.23, "learning_rate": 0.0017906743275249734, "loss": 2.2406, "step": 8687 }, { "epoch": 0.23, "learning_rate": 0.0017906210359178542, "loss": 2.3233, "step": 8688 }, { "epoch": 0.23, "learning_rate": 0.0017905677383211315, "loss": 2.8808, "step": 8689 }, { "epoch": 0.23, "learning_rate": 0.0017905144347352088, "loss": 2.544, "step": 8690 }, { "epoch": 0.23, "learning_rate": 0.0017904611251604902, "loss": 2.5363, "step": 8691 }, { "epoch": 0.23, "learning_rate": 0.0017904078095973793, "loss": 2.8194, "step": 8692 }, { "epoch": 0.23, "learning_rate": 0.0017903544880462801, "loss": 3.0965, "step": 8693 }, { "epoch": 0.23, "learning_rate": 0.0017903011605075966, "loss": 2.4039, "step": 8694 }, { "epoch": 0.23, "learning_rate": 0.001790247826981733, "loss": 3.1223, "step": 8695 }, { "epoch": 0.23, "learning_rate": 0.001790194487469093, "loss": 2.1674, "step": 8696 }, { "epoch": 0.23, "learning_rate": 0.0017901411419700807, "loss": 2.6276, "step": 8697 }, { "epoch": 0.23, "learning_rate": 0.0017900877904851007, "loss": 2.9189, "step": 8698 }, { "epoch": 0.23, "learning_rate": 0.0017900344330145565, "loss": 2.8211, "step": 8699 }, { "epoch": 0.23, "learning_rate": 0.001789981069558853, "loss": 2.6429, "step": 8700 }, { "epoch": 0.23, "learning_rate": 0.001789927700118394, "loss": 2.7845, "step": 8701 }, { "epoch": 0.23, "learning_rate": 0.001789874324693584, "loss": 2.839, "step": 8702 }, { "epoch": 0.23, "learning_rate": 0.0017898209432848273, "loss": 2.2731, "step": 8703 }, { "epoch": 0.23, "learning_rate": 0.0017897675558925285, "loss": 2.5913, "step": 8704 }, { "epoch": 0.23, "learning_rate": 0.0017897141625170916, "loss": 2.7238, "step": 8705 }, { "epoch": 0.23, "learning_rate": 0.0017896607631589215, "loss": 2.4941, "step": 8706 }, { "epoch": 0.23, "learning_rate": 0.0017896073578184226, "loss": 2.2593, "step": 8707 }, { "epoch": 0.23, "learning_rate": 0.0017895539464959998, "loss": 2.8099, "step": 8708 }, { "epoch": 0.23, "learning_rate": 0.0017895005291920572, "loss": 2.7762, "step": 8709 }, { "epoch": 0.23, "learning_rate": 0.001789447105907, "loss": 2.7344, "step": 8710 }, { "epoch": 0.23, "learning_rate": 0.0017893936766412324, "loss": 2.8357, "step": 8711 }, { "epoch": 0.23, "learning_rate": 0.0017893402413951597, "loss": 2.4176, "step": 8712 }, { "epoch": 0.23, "learning_rate": 0.001789286800169186, "loss": 3.0692, "step": 8713 }, { "epoch": 0.23, "learning_rate": 0.0017892333529637167, "loss": 2.4583, "step": 8714 }, { "epoch": 0.23, "learning_rate": 0.001789179899779157, "loss": 2.5747, "step": 8715 }, { "epoch": 0.23, "learning_rate": 0.0017891264406159114, "loss": 2.711, "step": 8716 }, { "epoch": 0.23, "learning_rate": 0.001789072975474385, "loss": 2.6973, "step": 8717 }, { "epoch": 0.23, "learning_rate": 0.0017890195043549825, "loss": 3.0093, "step": 8718 }, { "epoch": 0.23, "learning_rate": 0.0017889660272581095, "loss": 2.5844, "step": 8719 }, { "epoch": 0.23, "learning_rate": 0.0017889125441841707, "loss": 2.8254, "step": 8720 }, { "epoch": 0.23, "learning_rate": 0.0017888590551335716, "loss": 2.9042, "step": 8721 }, { "epoch": 0.23, "learning_rate": 0.0017888055601067174, "loss": 2.6544, "step": 8722 }, { "epoch": 0.23, "learning_rate": 0.0017887520591040134, "loss": 2.5877, "step": 8723 }, { "epoch": 0.23, "learning_rate": 0.0017886985521258648, "loss": 2.4781, "step": 8724 }, { "epoch": 0.23, "learning_rate": 0.001788645039172677, "loss": 2.9044, "step": 8725 }, { "epoch": 0.23, "learning_rate": 0.001788591520244855, "loss": 2.7382, "step": 8726 }, { "epoch": 0.23, "learning_rate": 0.001788537995342805, "loss": 2.4172, "step": 8727 }, { "epoch": 0.23, "learning_rate": 0.001788484464466932, "loss": 2.4832, "step": 8728 }, { "epoch": 0.23, "learning_rate": 0.001788430927617642, "loss": 2.6243, "step": 8729 }, { "epoch": 0.23, "learning_rate": 0.0017883773847953398, "loss": 2.4001, "step": 8730 }, { "epoch": 0.23, "learning_rate": 0.0017883238360004317, "loss": 2.5851, "step": 8731 }, { "epoch": 0.23, "learning_rate": 0.001788270281233323, "loss": 2.6687, "step": 8732 }, { "epoch": 0.23, "learning_rate": 0.0017882167204944198, "loss": 2.4444, "step": 8733 }, { "epoch": 0.23, "learning_rate": 0.0017881631537841273, "loss": 2.3545, "step": 8734 }, { "epoch": 0.23, "learning_rate": 0.001788109581102852, "loss": 2.3677, "step": 8735 }, { "epoch": 0.23, "learning_rate": 0.0017880560024509994, "loss": 2.4681, "step": 8736 }, { "epoch": 0.23, "learning_rate": 0.001788002417828975, "loss": 2.5459, "step": 8737 }, { "epoch": 0.23, "learning_rate": 0.0017879488272371858, "loss": 2.7436, "step": 8738 }, { "epoch": 0.23, "learning_rate": 0.0017878952306760367, "loss": 2.739, "step": 8739 }, { "epoch": 0.23, "learning_rate": 0.0017878416281459344, "loss": 2.5175, "step": 8740 }, { "epoch": 0.23, "learning_rate": 0.0017877880196472847, "loss": 2.307, "step": 8741 }, { "epoch": 0.23, "learning_rate": 0.0017877344051804938, "loss": 3.0318, "step": 8742 }, { "epoch": 0.23, "learning_rate": 0.001787680784745968, "loss": 2.3227, "step": 8743 }, { "epoch": 0.23, "learning_rate": 0.001787627158344113, "loss": 2.3424, "step": 8744 }, { "epoch": 0.24, "learning_rate": 0.001787573525975336, "loss": 2.7405, "step": 8745 }, { "epoch": 0.24, "learning_rate": 0.0017875198876400424, "loss": 2.309, "step": 8746 }, { "epoch": 0.24, "learning_rate": 0.0017874662433386393, "loss": 2.8836, "step": 8747 }, { "epoch": 0.24, "learning_rate": 0.0017874125930715324, "loss": 2.4527, "step": 8748 }, { "epoch": 0.24, "learning_rate": 0.0017873589368391284, "loss": 2.5947, "step": 8749 }, { "epoch": 0.24, "learning_rate": 0.0017873052746418341, "loss": 2.4391, "step": 8750 }, { "epoch": 0.24, "learning_rate": 0.0017872516064800557, "loss": 2.5424, "step": 8751 }, { "epoch": 0.24, "learning_rate": 0.0017871979323542, "loss": 2.7141, "step": 8752 }, { "epoch": 0.24, "learning_rate": 0.0017871442522646732, "loss": 2.2641, "step": 8753 }, { "epoch": 0.24, "learning_rate": 0.0017870905662118826, "loss": 2.6268, "step": 8754 }, { "epoch": 0.24, "learning_rate": 0.0017870368741962344, "loss": 2.6796, "step": 8755 }, { "epoch": 0.24, "learning_rate": 0.0017869831762181356, "loss": 2.62, "step": 8756 }, { "epoch": 0.24, "learning_rate": 0.001786929472277993, "loss": 2.8836, "step": 8757 }, { "epoch": 0.24, "learning_rate": 0.0017868757623762134, "loss": 2.568, "step": 8758 }, { "epoch": 0.24, "learning_rate": 0.0017868220465132034, "loss": 2.329, "step": 8759 }, { "epoch": 0.24, "learning_rate": 0.0017867683246893709, "loss": 2.5785, "step": 8760 }, { "epoch": 0.24, "learning_rate": 0.0017867145969051217, "loss": 2.3491, "step": 8761 }, { "epoch": 0.24, "learning_rate": 0.0017866608631608636, "loss": 2.6549, "step": 8762 }, { "epoch": 0.24, "learning_rate": 0.0017866071234570035, "loss": 2.5494, "step": 8763 }, { "epoch": 0.24, "learning_rate": 0.0017865533777939482, "loss": 2.7732, "step": 8764 }, { "epoch": 0.24, "learning_rate": 0.0017864996261721053, "loss": 2.2589, "step": 8765 }, { "epoch": 0.24, "learning_rate": 0.0017864458685918816, "loss": 2.6496, "step": 8766 }, { "epoch": 0.24, "learning_rate": 0.0017863921050536846, "loss": 2.7109, "step": 8767 }, { "epoch": 0.24, "learning_rate": 0.001786338335557922, "loss": 2.5428, "step": 8768 }, { "epoch": 0.24, "learning_rate": 0.0017862845601050005, "loss": 2.5068, "step": 8769 }, { "epoch": 0.24, "learning_rate": 0.001786230778695328, "loss": 2.2223, "step": 8770 }, { "epoch": 0.24, "learning_rate": 0.0017861769913293114, "loss": 2.87, "step": 8771 }, { "epoch": 0.24, "learning_rate": 0.0017861231980073585, "loss": 2.8233, "step": 8772 }, { "epoch": 0.24, "learning_rate": 0.001786069398729877, "loss": 2.2568, "step": 8773 }, { "epoch": 0.24, "learning_rate": 0.0017860155934972739, "loss": 2.7728, "step": 8774 }, { "epoch": 0.24, "learning_rate": 0.0017859617823099577, "loss": 2.3967, "step": 8775 }, { "epoch": 0.24, "learning_rate": 0.0017859079651683352, "loss": 2.9072, "step": 8776 }, { "epoch": 0.24, "learning_rate": 0.0017858541420728146, "loss": 2.5038, "step": 8777 }, { "epoch": 0.24, "learning_rate": 0.0017858003130238034, "loss": 3.0993, "step": 8778 }, { "epoch": 0.24, "learning_rate": 0.0017857464780217094, "loss": 2.8134, "step": 8779 }, { "epoch": 0.24, "learning_rate": 0.0017856926370669408, "loss": 2.4223, "step": 8780 }, { "epoch": 0.24, "learning_rate": 0.0017856387901599052, "loss": 2.893, "step": 8781 }, { "epoch": 0.24, "learning_rate": 0.0017855849373010107, "loss": 2.8071, "step": 8782 }, { "epoch": 0.24, "learning_rate": 0.0017855310784906648, "loss": 2.6657, "step": 8783 }, { "epoch": 0.24, "learning_rate": 0.0017854772137292762, "loss": 2.5424, "step": 8784 }, { "epoch": 0.24, "learning_rate": 0.0017854233430172526, "loss": 2.7294, "step": 8785 }, { "epoch": 0.24, "learning_rate": 0.0017853694663550021, "loss": 2.6193, "step": 8786 }, { "epoch": 0.24, "learning_rate": 0.001785315583742933, "loss": 2.731, "step": 8787 }, { "epoch": 0.24, "learning_rate": 0.0017852616951814536, "loss": 2.3502, "step": 8788 }, { "epoch": 0.24, "learning_rate": 0.0017852078006709718, "loss": 2.7279, "step": 8789 }, { "epoch": 0.24, "learning_rate": 0.001785153900211896, "loss": 2.7473, "step": 8790 }, { "epoch": 0.24, "learning_rate": 0.0017850999938046348, "loss": 2.6921, "step": 8791 }, { "epoch": 0.24, "learning_rate": 0.0017850460814495964, "loss": 2.7415, "step": 8792 }, { "epoch": 0.24, "learning_rate": 0.0017849921631471891, "loss": 2.5078, "step": 8793 }, { "epoch": 0.24, "learning_rate": 0.0017849382388978215, "loss": 2.4951, "step": 8794 }, { "epoch": 0.24, "learning_rate": 0.0017848843087019022, "loss": 2.4584, "step": 8795 }, { "epoch": 0.24, "learning_rate": 0.0017848303725598398, "loss": 2.8238, "step": 8796 }, { "epoch": 0.24, "learning_rate": 0.0017847764304720428, "loss": 2.2734, "step": 8797 }, { "epoch": 0.24, "learning_rate": 0.0017847224824389198, "loss": 2.2863, "step": 8798 }, { "epoch": 0.24, "learning_rate": 0.0017846685284608795, "loss": 2.1914, "step": 8799 }, { "epoch": 0.24, "learning_rate": 0.001784614568538331, "loss": 2.6807, "step": 8800 }, { "epoch": 0.24, "learning_rate": 0.0017845606026716824, "loss": 2.7236, "step": 8801 }, { "epoch": 0.24, "learning_rate": 0.0017845066308613431, "loss": 2.5188, "step": 8802 }, { "epoch": 0.24, "learning_rate": 0.0017844526531077222, "loss": 2.2147, "step": 8803 }, { "epoch": 0.24, "learning_rate": 0.0017843986694112278, "loss": 2.9773, "step": 8804 }, { "epoch": 0.24, "learning_rate": 0.0017843446797722693, "loss": 2.5818, "step": 8805 }, { "epoch": 0.24, "learning_rate": 0.0017842906841912557, "loss": 2.8087, "step": 8806 }, { "epoch": 0.24, "learning_rate": 0.0017842366826685964, "loss": 2.2983, "step": 8807 }, { "epoch": 0.24, "learning_rate": 0.0017841826752047001, "loss": 2.984, "step": 8808 }, { "epoch": 0.24, "learning_rate": 0.0017841286617999762, "loss": 2.4522, "step": 8809 }, { "epoch": 0.24, "learning_rate": 0.0017840746424548333, "loss": 2.5108, "step": 8810 }, { "epoch": 0.24, "learning_rate": 0.0017840206171696813, "loss": 2.6092, "step": 8811 }, { "epoch": 0.24, "learning_rate": 0.0017839665859449294, "loss": 2.6233, "step": 8812 }, { "epoch": 0.24, "learning_rate": 0.0017839125487809867, "loss": 2.5256, "step": 8813 }, { "epoch": 0.24, "learning_rate": 0.0017838585056782629, "loss": 2.5925, "step": 8814 }, { "epoch": 0.24, "learning_rate": 0.0017838044566371668, "loss": 2.7025, "step": 8815 }, { "epoch": 0.24, "learning_rate": 0.0017837504016581084, "loss": 3.0804, "step": 8816 }, { "epoch": 0.24, "learning_rate": 0.0017836963407414973, "loss": 2.6813, "step": 8817 }, { "epoch": 0.24, "learning_rate": 0.0017836422738877426, "loss": 2.7328, "step": 8818 }, { "epoch": 0.24, "learning_rate": 0.001783588201097254, "loss": 2.5473, "step": 8819 }, { "epoch": 0.24, "learning_rate": 0.0017835341223704417, "loss": 2.5132, "step": 8820 }, { "epoch": 0.24, "learning_rate": 0.0017834800377077148, "loss": 2.544, "step": 8821 }, { "epoch": 0.24, "learning_rate": 0.0017834259471094832, "loss": 2.9459, "step": 8822 }, { "epoch": 0.24, "learning_rate": 0.0017833718505761566, "loss": 2.4844, "step": 8823 }, { "epoch": 0.24, "learning_rate": 0.001783317748108145, "loss": 2.4377, "step": 8824 }, { "epoch": 0.24, "learning_rate": 0.001783263639705858, "loss": 2.7161, "step": 8825 }, { "epoch": 0.24, "learning_rate": 0.001783209525369706, "loss": 2.6831, "step": 8826 }, { "epoch": 0.24, "learning_rate": 0.0017831554051000985, "loss": 2.4497, "step": 8827 }, { "epoch": 0.24, "learning_rate": 0.0017831012788974458, "loss": 2.6616, "step": 8828 }, { "epoch": 0.24, "learning_rate": 0.0017830471467621576, "loss": 2.637, "step": 8829 }, { "epoch": 0.24, "learning_rate": 0.0017829930086946445, "loss": 2.6829, "step": 8830 }, { "epoch": 0.24, "learning_rate": 0.001782938864695316, "loss": 2.5029, "step": 8831 }, { "epoch": 0.24, "learning_rate": 0.0017828847147645828, "loss": 3.1228, "step": 8832 }, { "epoch": 0.24, "learning_rate": 0.0017828305589028548, "loss": 2.8104, "step": 8833 }, { "epoch": 0.24, "learning_rate": 0.0017827763971105428, "loss": 2.5209, "step": 8834 }, { "epoch": 0.24, "learning_rate": 0.0017827222293880565, "loss": 2.8157, "step": 8835 }, { "epoch": 0.24, "learning_rate": 0.0017826680557358067, "loss": 2.4968, "step": 8836 }, { "epoch": 0.24, "learning_rate": 0.0017826138761542034, "loss": 2.6362, "step": 8837 }, { "epoch": 0.24, "learning_rate": 0.0017825596906436575, "loss": 2.7825, "step": 8838 }, { "epoch": 0.24, "learning_rate": 0.0017825054992045794, "loss": 2.499, "step": 8839 }, { "epoch": 0.24, "learning_rate": 0.001782451301837379, "loss": 2.7251, "step": 8840 }, { "epoch": 0.24, "learning_rate": 0.001782397098542468, "loss": 2.3428, "step": 8841 }, { "epoch": 0.24, "learning_rate": 0.0017823428893202565, "loss": 2.4406, "step": 8842 }, { "epoch": 0.24, "learning_rate": 0.0017822886741711546, "loss": 2.3753, "step": 8843 }, { "epoch": 0.24, "learning_rate": 0.0017822344530955738, "loss": 2.6013, "step": 8844 }, { "epoch": 0.24, "learning_rate": 0.0017821802260939248, "loss": 2.8464, "step": 8845 }, { "epoch": 0.24, "learning_rate": 0.001782125993166618, "loss": 2.6834, "step": 8846 }, { "epoch": 0.24, "learning_rate": 0.0017820717543140649, "loss": 2.8551, "step": 8847 }, { "epoch": 0.24, "learning_rate": 0.0017820175095366758, "loss": 2.4498, "step": 8848 }, { "epoch": 0.24, "learning_rate": 0.0017819632588348619, "loss": 2.5915, "step": 8849 }, { "epoch": 0.24, "learning_rate": 0.0017819090022090339, "loss": 2.8762, "step": 8850 }, { "epoch": 0.24, "learning_rate": 0.0017818547396596031, "loss": 2.3436, "step": 8851 }, { "epoch": 0.24, "learning_rate": 0.0017818004711869808, "loss": 2.9729, "step": 8852 }, { "epoch": 0.24, "learning_rate": 0.001781746196791578, "loss": 2.3254, "step": 8853 }, { "epoch": 0.24, "learning_rate": 0.0017816919164738054, "loss": 2.656, "step": 8854 }, { "epoch": 0.24, "learning_rate": 0.001781637630234075, "loss": 2.6179, "step": 8855 }, { "epoch": 0.24, "learning_rate": 0.0017815833380727972, "loss": 2.6541, "step": 8856 }, { "epoch": 0.24, "learning_rate": 0.0017815290399903843, "loss": 2.7116, "step": 8857 }, { "epoch": 0.24, "learning_rate": 0.0017814747359872467, "loss": 2.8205, "step": 8858 }, { "epoch": 0.24, "learning_rate": 0.0017814204260637966, "loss": 2.5486, "step": 8859 }, { "epoch": 0.24, "learning_rate": 0.0017813661102204447, "loss": 2.4503, "step": 8860 }, { "epoch": 0.24, "learning_rate": 0.0017813117884576029, "loss": 2.4979, "step": 8861 }, { "epoch": 0.24, "learning_rate": 0.0017812574607756826, "loss": 2.5271, "step": 8862 }, { "epoch": 0.24, "learning_rate": 0.0017812031271750956, "loss": 2.8302, "step": 8863 }, { "epoch": 0.24, "learning_rate": 0.0017811487876562536, "loss": 2.7588, "step": 8864 }, { "epoch": 0.24, "learning_rate": 0.0017810944422195676, "loss": 2.2515, "step": 8865 }, { "epoch": 0.24, "learning_rate": 0.00178104009086545, "loss": 2.5536, "step": 8866 }, { "epoch": 0.24, "learning_rate": 0.0017809857335943124, "loss": 2.9141, "step": 8867 }, { "epoch": 0.24, "learning_rate": 0.0017809313704065662, "loss": 2.7314, "step": 8868 }, { "epoch": 0.24, "learning_rate": 0.001780877001302624, "loss": 2.7544, "step": 8869 }, { "epoch": 0.24, "learning_rate": 0.001780822626282897, "loss": 2.4149, "step": 8870 }, { "epoch": 0.24, "learning_rate": 0.0017807682453477973, "loss": 2.899, "step": 8871 }, { "epoch": 0.24, "learning_rate": 0.0017807138584977368, "loss": 2.9474, "step": 8872 }, { "epoch": 0.24, "learning_rate": 0.001780659465733128, "loss": 2.4308, "step": 8873 }, { "epoch": 0.24, "learning_rate": 0.0017806050670543824, "loss": 2.7338, "step": 8874 }, { "epoch": 0.24, "learning_rate": 0.0017805506624619127, "loss": 2.7422, "step": 8875 }, { "epoch": 0.24, "learning_rate": 0.0017804962519561306, "loss": 2.5637, "step": 8876 }, { "epoch": 0.24, "learning_rate": 0.0017804418355374483, "loss": 2.6631, "step": 8877 }, { "epoch": 0.24, "learning_rate": 0.0017803874132062782, "loss": 2.7238, "step": 8878 }, { "epoch": 0.24, "learning_rate": 0.001780332984963033, "loss": 2.3591, "step": 8879 }, { "epoch": 0.24, "learning_rate": 0.001780278550808124, "loss": 2.2202, "step": 8880 }, { "epoch": 0.24, "learning_rate": 0.0017802241107419646, "loss": 2.6239, "step": 8881 }, { "epoch": 0.24, "learning_rate": 0.0017801696647649669, "loss": 2.1171, "step": 8882 }, { "epoch": 0.24, "learning_rate": 0.0017801152128775431, "loss": 2.9234, "step": 8883 }, { "epoch": 0.24, "learning_rate": 0.0017800607550801058, "loss": 2.3336, "step": 8884 }, { "epoch": 0.24, "learning_rate": 0.0017800062913730676, "loss": 2.6654, "step": 8885 }, { "epoch": 0.24, "learning_rate": 0.0017799518217568415, "loss": 2.1652, "step": 8886 }, { "epoch": 0.24, "learning_rate": 0.0017798973462318398, "loss": 2.3762, "step": 8887 }, { "epoch": 0.24, "learning_rate": 0.0017798428647984752, "loss": 2.8295, "step": 8888 }, { "epoch": 0.24, "learning_rate": 0.0017797883774571606, "loss": 2.6231, "step": 8889 }, { "epoch": 0.24, "learning_rate": 0.0017797338842083085, "loss": 2.9002, "step": 8890 }, { "epoch": 0.24, "learning_rate": 0.0017796793850523318, "loss": 2.8391, "step": 8891 }, { "epoch": 0.24, "learning_rate": 0.0017796248799896435, "loss": 2.5958, "step": 8892 }, { "epoch": 0.24, "learning_rate": 0.0017795703690206568, "loss": 2.7508, "step": 8893 }, { "epoch": 0.24, "learning_rate": 0.0017795158521457842, "loss": 2.5751, "step": 8894 }, { "epoch": 0.24, "learning_rate": 0.0017794613293654385, "loss": 3.0695, "step": 8895 }, { "epoch": 0.24, "learning_rate": 0.0017794068006800336, "loss": 2.4266, "step": 8896 }, { "epoch": 0.24, "learning_rate": 0.001779352266089982, "loss": 2.6793, "step": 8897 }, { "epoch": 0.24, "learning_rate": 0.001779297725595697, "loss": 2.919, "step": 8898 }, { "epoch": 0.24, "learning_rate": 0.0017792431791975917, "loss": 2.8047, "step": 8899 }, { "epoch": 0.24, "learning_rate": 0.001779188626896079, "loss": 2.5559, "step": 8900 }, { "epoch": 0.24, "learning_rate": 0.0017791340686915732, "loss": 2.3447, "step": 8901 }, { "epoch": 0.24, "learning_rate": 0.0017790795045844864, "loss": 2.6066, "step": 8902 }, { "epoch": 0.24, "learning_rate": 0.001779024934575233, "loss": 2.8778, "step": 8903 }, { "epoch": 0.24, "learning_rate": 0.001778970358664226, "loss": 2.7455, "step": 8904 }, { "epoch": 0.24, "learning_rate": 0.0017789157768518787, "loss": 2.6213, "step": 8905 }, { "epoch": 0.24, "learning_rate": 0.0017788611891386048, "loss": 2.3398, "step": 8906 }, { "epoch": 0.24, "learning_rate": 0.0017788065955248176, "loss": 2.8894, "step": 8907 }, { "epoch": 0.24, "learning_rate": 0.0017787519960109311, "loss": 2.9662, "step": 8908 }, { "epoch": 0.24, "learning_rate": 0.0017786973905973584, "loss": 2.0918, "step": 8909 }, { "epoch": 0.24, "learning_rate": 0.0017786427792845139, "loss": 2.4761, "step": 8910 }, { "epoch": 0.24, "learning_rate": 0.0017785881620728105, "loss": 3.135, "step": 8911 }, { "epoch": 0.24, "learning_rate": 0.0017785335389626624, "loss": 2.6436, "step": 8912 }, { "epoch": 0.24, "learning_rate": 0.0017784789099544837, "loss": 2.9292, "step": 8913 }, { "epoch": 0.24, "learning_rate": 0.0017784242750486878, "loss": 2.5224, "step": 8914 }, { "epoch": 0.24, "learning_rate": 0.001778369634245689, "loss": 2.6404, "step": 8915 }, { "epoch": 0.24, "learning_rate": 0.0017783149875459005, "loss": 3.008, "step": 8916 }, { "epoch": 0.24, "learning_rate": 0.0017782603349497373, "loss": 2.8078, "step": 8917 }, { "epoch": 0.24, "learning_rate": 0.0017782056764576127, "loss": 2.2895, "step": 8918 }, { "epoch": 0.24, "learning_rate": 0.001778151012069941, "loss": 2.8905, "step": 8919 }, { "epoch": 0.24, "learning_rate": 0.0017780963417871366, "loss": 2.5617, "step": 8920 }, { "epoch": 0.24, "learning_rate": 0.0017780416656096132, "loss": 2.33, "step": 8921 }, { "epoch": 0.24, "learning_rate": 0.0017779869835377851, "loss": 2.8301, "step": 8922 }, { "epoch": 0.24, "learning_rate": 0.001777932295572067, "loss": 2.203, "step": 8923 }, { "epoch": 0.24, "learning_rate": 0.0017778776017128726, "loss": 2.4652, "step": 8924 }, { "epoch": 0.24, "learning_rate": 0.001777822901960617, "loss": 2.6137, "step": 8925 }, { "epoch": 0.24, "learning_rate": 0.001777768196315714, "loss": 2.4338, "step": 8926 }, { "epoch": 0.24, "learning_rate": 0.001777713484778578, "loss": 2.703, "step": 8927 }, { "epoch": 0.24, "learning_rate": 0.0017776587673496236, "loss": 2.5415, "step": 8928 }, { "epoch": 0.24, "learning_rate": 0.0017776040440292658, "loss": 2.8012, "step": 8929 }, { "epoch": 0.24, "learning_rate": 0.0017775493148179185, "loss": 2.6248, "step": 8930 }, { "epoch": 0.24, "learning_rate": 0.0017774945797159967, "loss": 2.9488, "step": 8931 }, { "epoch": 0.24, "learning_rate": 0.001777439838723915, "loss": 2.5555, "step": 8932 }, { "epoch": 0.24, "learning_rate": 0.001777385091842088, "loss": 2.8775, "step": 8933 }, { "epoch": 0.24, "learning_rate": 0.0017773303390709305, "loss": 2.5234, "step": 8934 }, { "epoch": 0.24, "learning_rate": 0.0017772755804108574, "loss": 2.8039, "step": 8935 }, { "epoch": 0.24, "learning_rate": 0.0017772208158622833, "loss": 2.8129, "step": 8936 }, { "epoch": 0.24, "learning_rate": 0.0017771660454256235, "loss": 2.7996, "step": 8937 }, { "epoch": 0.24, "learning_rate": 0.0017771112691012925, "loss": 2.0805, "step": 8938 }, { "epoch": 0.24, "learning_rate": 0.0017770564868897056, "loss": 2.677, "step": 8939 }, { "epoch": 0.24, "learning_rate": 0.0017770016987912775, "loss": 2.5751, "step": 8940 }, { "epoch": 0.24, "learning_rate": 0.0017769469048064237, "loss": 2.7115, "step": 8941 }, { "epoch": 0.24, "learning_rate": 0.0017768921049355591, "loss": 2.294, "step": 8942 }, { "epoch": 0.24, "learning_rate": 0.0017768372991790985, "loss": 2.5976, "step": 8943 }, { "epoch": 0.24, "learning_rate": 0.0017767824875374574, "loss": 2.504, "step": 8944 }, { "epoch": 0.24, "learning_rate": 0.0017767276700110513, "loss": 2.8702, "step": 8945 }, { "epoch": 0.24, "learning_rate": 0.0017766728466002953, "loss": 2.4546, "step": 8946 }, { "epoch": 0.24, "learning_rate": 0.0017766180173056044, "loss": 2.5496, "step": 8947 }, { "epoch": 0.24, "learning_rate": 0.0017765631821273944, "loss": 2.6092, "step": 8948 }, { "epoch": 0.24, "learning_rate": 0.0017765083410660805, "loss": 2.9087, "step": 8949 }, { "epoch": 0.24, "learning_rate": 0.001776453494122078, "loss": 2.5416, "step": 8950 }, { "epoch": 0.24, "learning_rate": 0.0017763986412958031, "loss": 2.523, "step": 8951 }, { "epoch": 0.24, "learning_rate": 0.0017763437825876706, "loss": 2.7465, "step": 8952 }, { "epoch": 0.24, "learning_rate": 0.0017762889179980968, "loss": 2.5582, "step": 8953 }, { "epoch": 0.24, "learning_rate": 0.0017762340475274963, "loss": 2.4543, "step": 8954 }, { "epoch": 0.24, "learning_rate": 0.001776179171176286, "loss": 2.3969, "step": 8955 }, { "epoch": 0.24, "learning_rate": 0.0017761242889448808, "loss": 2.3972, "step": 8956 }, { "epoch": 0.24, "learning_rate": 0.0017760694008336967, "loss": 2.8599, "step": 8957 }, { "epoch": 0.24, "learning_rate": 0.0017760145068431497, "loss": 2.7477, "step": 8958 }, { "epoch": 0.24, "learning_rate": 0.0017759596069736555, "loss": 3.0317, "step": 8959 }, { "epoch": 0.24, "learning_rate": 0.0017759047012256299, "loss": 3.0265, "step": 8960 }, { "epoch": 0.24, "learning_rate": 0.0017758497895994894, "loss": 2.4305, "step": 8961 }, { "epoch": 0.24, "learning_rate": 0.0017757948720956492, "loss": 2.6274, "step": 8962 }, { "epoch": 0.24, "learning_rate": 0.001775739948714526, "loss": 2.514, "step": 8963 }, { "epoch": 0.24, "learning_rate": 0.0017756850194565353, "loss": 2.5246, "step": 8964 }, { "epoch": 0.24, "learning_rate": 0.0017756300843220938, "loss": 2.5142, "step": 8965 }, { "epoch": 0.24, "learning_rate": 0.0017755751433116177, "loss": 2.3685, "step": 8966 }, { "epoch": 0.24, "learning_rate": 0.0017755201964255226, "loss": 2.3663, "step": 8967 }, { "epoch": 0.24, "learning_rate": 0.0017754652436642252, "loss": 2.2557, "step": 8968 }, { "epoch": 0.24, "learning_rate": 0.001775410285028142, "loss": 2.4905, "step": 8969 }, { "epoch": 0.24, "learning_rate": 0.0017753553205176887, "loss": 2.4516, "step": 8970 }, { "epoch": 0.24, "learning_rate": 0.0017753003501332824, "loss": 2.6069, "step": 8971 }, { "epoch": 0.24, "learning_rate": 0.001775245373875339, "loss": 2.2684, "step": 8972 }, { "epoch": 0.24, "learning_rate": 0.0017751903917442755, "loss": 2.7589, "step": 8973 }, { "epoch": 0.24, "learning_rate": 0.0017751354037405082, "loss": 2.545, "step": 8974 }, { "epoch": 0.24, "learning_rate": 0.0017750804098644534, "loss": 2.4799, "step": 8975 }, { "epoch": 0.24, "learning_rate": 0.0017750254101165286, "loss": 2.7411, "step": 8976 }, { "epoch": 0.24, "learning_rate": 0.0017749704044971494, "loss": 2.7005, "step": 8977 }, { "epoch": 0.24, "learning_rate": 0.001774915393006733, "loss": 2.5583, "step": 8978 }, { "epoch": 0.24, "learning_rate": 0.001774860375645696, "loss": 2.5221, "step": 8979 }, { "epoch": 0.24, "learning_rate": 0.0017748053524144556, "loss": 2.6332, "step": 8980 }, { "epoch": 0.24, "learning_rate": 0.0017747503233134282, "loss": 2.6141, "step": 8981 }, { "epoch": 0.24, "learning_rate": 0.0017746952883430308, "loss": 2.4096, "step": 8982 }, { "epoch": 0.24, "learning_rate": 0.0017746402475036804, "loss": 2.7279, "step": 8983 }, { "epoch": 0.24, "learning_rate": 0.001774585200795794, "loss": 2.7025, "step": 8984 }, { "epoch": 0.24, "learning_rate": 0.001774530148219789, "loss": 2.3835, "step": 8985 }, { "epoch": 0.24, "learning_rate": 0.0017744750897760815, "loss": 2.8252, "step": 8986 }, { "epoch": 0.24, "learning_rate": 0.0017744200254650893, "loss": 2.607, "step": 8987 }, { "epoch": 0.24, "learning_rate": 0.0017743649552872296, "loss": 2.4967, "step": 8988 }, { "epoch": 0.24, "learning_rate": 0.0017743098792429195, "loss": 2.5705, "step": 8989 }, { "epoch": 0.24, "learning_rate": 0.001774254797332576, "loss": 2.3775, "step": 8990 }, { "epoch": 0.24, "learning_rate": 0.001774199709556617, "loss": 2.5045, "step": 8991 }, { "epoch": 0.24, "learning_rate": 0.001774144615915459, "loss": 2.8853, "step": 8992 }, { "epoch": 0.24, "learning_rate": 0.0017740895164095197, "loss": 2.6147, "step": 8993 }, { "epoch": 0.24, "learning_rate": 0.0017740344110392168, "loss": 2.5931, "step": 8994 }, { "epoch": 0.24, "learning_rate": 0.0017739792998049677, "loss": 2.6904, "step": 8995 }, { "epoch": 0.24, "learning_rate": 0.0017739241827071895, "loss": 2.2826, "step": 8996 }, { "epoch": 0.24, "learning_rate": 0.0017738690597463003, "loss": 2.56, "step": 8997 }, { "epoch": 0.24, "learning_rate": 0.0017738139309227176, "loss": 2.4224, "step": 8998 }, { "epoch": 0.24, "learning_rate": 0.0017737587962368586, "loss": 2.4726, "step": 8999 }, { "epoch": 0.24, "learning_rate": 0.0017737036556891414, "loss": 2.65, "step": 9000 }, { "epoch": 0.24, "learning_rate": 0.0017736485092799837, "loss": 2.8224, "step": 9001 }, { "epoch": 0.24, "learning_rate": 0.001773593357009803, "loss": 2.9424, "step": 9002 }, { "epoch": 0.24, "learning_rate": 0.0017735381988790175, "loss": 2.6697, "step": 9003 }, { "epoch": 0.24, "learning_rate": 0.0017734830348880449, "loss": 2.5216, "step": 9004 }, { "epoch": 0.24, "learning_rate": 0.001773427865037303, "loss": 2.6766, "step": 9005 }, { "epoch": 0.24, "learning_rate": 0.00177337268932721, "loss": 2.3293, "step": 9006 }, { "epoch": 0.24, "learning_rate": 0.0017733175077581835, "loss": 2.5145, "step": 9007 }, { "epoch": 0.24, "learning_rate": 0.001773262320330642, "loss": 2.5172, "step": 9008 }, { "epoch": 0.24, "learning_rate": 0.0017732071270450036, "loss": 2.6696, "step": 9009 }, { "epoch": 0.24, "learning_rate": 0.0017731519279016862, "loss": 2.7575, "step": 9010 }, { "epoch": 0.24, "learning_rate": 0.0017730967229011077, "loss": 2.3687, "step": 9011 }, { "epoch": 0.24, "learning_rate": 0.0017730415120436871, "loss": 2.4221, "step": 9012 }, { "epoch": 0.24, "learning_rate": 0.0017729862953298418, "loss": 2.5726, "step": 9013 }, { "epoch": 0.24, "learning_rate": 0.0017729310727599907, "loss": 2.7419, "step": 9014 }, { "epoch": 0.24, "learning_rate": 0.001772875844334552, "loss": 2.9297, "step": 9015 }, { "epoch": 0.24, "learning_rate": 0.001772820610053944, "loss": 2.354, "step": 9016 }, { "epoch": 0.24, "learning_rate": 0.0017727653699185853, "loss": 2.2766, "step": 9017 }, { "epoch": 0.24, "learning_rate": 0.0017727101239288943, "loss": 2.9069, "step": 9018 }, { "epoch": 0.24, "learning_rate": 0.0017726548720852894, "loss": 2.625, "step": 9019 }, { "epoch": 0.24, "learning_rate": 0.0017725996143881898, "loss": 2.8408, "step": 9020 }, { "epoch": 0.24, "learning_rate": 0.0017725443508380132, "loss": 2.871, "step": 9021 }, { "epoch": 0.24, "learning_rate": 0.0017724890814351788, "loss": 2.4562, "step": 9022 }, { "epoch": 0.24, "learning_rate": 0.0017724338061801052, "loss": 2.589, "step": 9023 }, { "epoch": 0.24, "learning_rate": 0.0017723785250732115, "loss": 2.8522, "step": 9024 }, { "epoch": 0.24, "learning_rate": 0.0017723232381149157, "loss": 2.8008, "step": 9025 }, { "epoch": 0.24, "learning_rate": 0.0017722679453056373, "loss": 2.5055, "step": 9026 }, { "epoch": 0.24, "learning_rate": 0.0017722126466457953, "loss": 2.64, "step": 9027 }, { "epoch": 0.24, "learning_rate": 0.0017721573421358079, "loss": 2.7856, "step": 9028 }, { "epoch": 0.24, "learning_rate": 0.0017721020317760948, "loss": 2.8347, "step": 9029 }, { "epoch": 0.24, "learning_rate": 0.0017720467155670746, "loss": 2.3642, "step": 9030 }, { "epoch": 0.24, "learning_rate": 0.0017719913935091668, "loss": 2.6633, "step": 9031 }, { "epoch": 0.24, "learning_rate": 0.00177193606560279, "loss": 2.4677, "step": 9032 }, { "epoch": 0.24, "learning_rate": 0.0017718807318483636, "loss": 2.2229, "step": 9033 }, { "epoch": 0.24, "learning_rate": 0.0017718253922463067, "loss": 2.4265, "step": 9034 }, { "epoch": 0.24, "learning_rate": 0.0017717700467970389, "loss": 2.5758, "step": 9035 }, { "epoch": 0.24, "learning_rate": 0.0017717146955009788, "loss": 2.7402, "step": 9036 }, { "epoch": 0.24, "learning_rate": 0.0017716593383585461, "loss": 2.4128, "step": 9037 }, { "epoch": 0.24, "learning_rate": 0.0017716039753701606, "loss": 2.6563, "step": 9038 }, { "epoch": 0.24, "learning_rate": 0.0017715486065362411, "loss": 2.6923, "step": 9039 }, { "epoch": 0.24, "learning_rate": 0.0017714932318572075, "loss": 2.5629, "step": 9040 }, { "epoch": 0.24, "learning_rate": 0.001771437851333479, "loss": 2.8309, "step": 9041 }, { "epoch": 0.24, "learning_rate": 0.0017713824649654751, "loss": 2.724, "step": 9042 }, { "epoch": 0.24, "learning_rate": 0.0017713270727536157, "loss": 2.3738, "step": 9043 }, { "epoch": 0.24, "learning_rate": 0.0017712716746983205, "loss": 2.6316, "step": 9044 }, { "epoch": 0.24, "learning_rate": 0.0017712162708000087, "loss": 2.8642, "step": 9045 }, { "epoch": 0.24, "learning_rate": 0.0017711608610591, "loss": 2.9174, "step": 9046 }, { "epoch": 0.24, "learning_rate": 0.001771105445476015, "loss": 2.4966, "step": 9047 }, { "epoch": 0.24, "learning_rate": 0.0017710500240511729, "loss": 2.6174, "step": 9048 }, { "epoch": 0.24, "learning_rate": 0.001770994596784994, "loss": 2.4624, "step": 9049 }, { "epoch": 0.24, "learning_rate": 0.0017709391636778972, "loss": 2.5289, "step": 9050 }, { "epoch": 0.24, "learning_rate": 0.0017708837247303033, "loss": 2.5161, "step": 9051 }, { "epoch": 0.24, "learning_rate": 0.0017708282799426326, "loss": 2.6044, "step": 9052 }, { "epoch": 0.24, "learning_rate": 0.0017707728293153042, "loss": 2.486, "step": 9053 }, { "epoch": 0.24, "learning_rate": 0.0017707173728487389, "loss": 2.7662, "step": 9054 }, { "epoch": 0.24, "learning_rate": 0.0017706619105433564, "loss": 2.6543, "step": 9055 }, { "epoch": 0.24, "learning_rate": 0.001770606442399577, "loss": 2.7826, "step": 9056 }, { "epoch": 0.24, "learning_rate": 0.001770550968417821, "loss": 2.8612, "step": 9057 }, { "epoch": 0.24, "learning_rate": 0.0017704954885985086, "loss": 2.8316, "step": 9058 }, { "epoch": 0.24, "learning_rate": 0.0017704400029420605, "loss": 2.7523, "step": 9059 }, { "epoch": 0.24, "learning_rate": 0.0017703845114488963, "loss": 2.518, "step": 9060 }, { "epoch": 0.24, "learning_rate": 0.0017703290141194371, "loss": 2.7511, "step": 9061 }, { "epoch": 0.24, "learning_rate": 0.0017702735109541025, "loss": 2.4955, "step": 9062 }, { "epoch": 0.24, "learning_rate": 0.0017702180019533139, "loss": 2.7293, "step": 9063 }, { "epoch": 0.24, "learning_rate": 0.0017701624871174913, "loss": 2.5582, "step": 9064 }, { "epoch": 0.24, "learning_rate": 0.0017701069664470554, "loss": 2.8322, "step": 9065 }, { "epoch": 0.24, "learning_rate": 0.0017700514399424268, "loss": 2.3134, "step": 9066 }, { "epoch": 0.24, "learning_rate": 0.001769995907604026, "loss": 2.6728, "step": 9067 }, { "epoch": 0.24, "learning_rate": 0.0017699403694322743, "loss": 2.7376, "step": 9068 }, { "epoch": 0.24, "learning_rate": 0.0017698848254275915, "loss": 2.0804, "step": 9069 }, { "epoch": 0.24, "learning_rate": 0.0017698292755903991, "loss": 2.3181, "step": 9070 }, { "epoch": 0.24, "learning_rate": 0.0017697737199211176, "loss": 2.8564, "step": 9071 }, { "epoch": 0.24, "learning_rate": 0.0017697181584201685, "loss": 2.739, "step": 9072 }, { "epoch": 0.24, "learning_rate": 0.0017696625910879717, "loss": 2.2855, "step": 9073 }, { "epoch": 0.24, "learning_rate": 0.0017696070179249494, "loss": 2.8826, "step": 9074 }, { "epoch": 0.24, "learning_rate": 0.0017695514389315212, "loss": 2.1574, "step": 9075 }, { "epoch": 0.24, "learning_rate": 0.0017694958541081092, "loss": 2.4695, "step": 9076 }, { "epoch": 0.24, "learning_rate": 0.0017694402634551342, "loss": 3.0615, "step": 9077 }, { "epoch": 0.24, "learning_rate": 0.0017693846669730173, "loss": 2.7039, "step": 9078 }, { "epoch": 0.24, "learning_rate": 0.0017693290646621795, "loss": 2.7964, "step": 9079 }, { "epoch": 0.24, "learning_rate": 0.0017692734565230427, "loss": 2.7259, "step": 9080 }, { "epoch": 0.24, "learning_rate": 0.0017692178425560273, "loss": 2.8372, "step": 9081 }, { "epoch": 0.24, "learning_rate": 0.0017691622227615552, "loss": 2.8867, "step": 9082 }, { "epoch": 0.24, "learning_rate": 0.0017691065971400476, "loss": 2.8941, "step": 9083 }, { "epoch": 0.24, "learning_rate": 0.001769050965691926, "loss": 2.4436, "step": 9084 }, { "epoch": 0.24, "learning_rate": 0.0017689953284176117, "loss": 2.7307, "step": 9085 }, { "epoch": 0.24, "learning_rate": 0.0017689396853175264, "loss": 2.6929, "step": 9086 }, { "epoch": 0.24, "learning_rate": 0.0017688840363920912, "loss": 2.5767, "step": 9087 }, { "epoch": 0.24, "learning_rate": 0.0017688283816417283, "loss": 2.6695, "step": 9088 }, { "epoch": 0.24, "learning_rate": 0.0017687727210668588, "loss": 2.6113, "step": 9089 }, { "epoch": 0.24, "learning_rate": 0.001768717054667905, "loss": 2.5827, "step": 9090 }, { "epoch": 0.24, "learning_rate": 0.001768661382445288, "loss": 2.4899, "step": 9091 }, { "epoch": 0.24, "learning_rate": 0.0017686057043994298, "loss": 2.7729, "step": 9092 }, { "epoch": 0.24, "learning_rate": 0.001768550020530752, "loss": 2.6704, "step": 9093 }, { "epoch": 0.24, "learning_rate": 0.001768494330839677, "loss": 2.815, "step": 9094 }, { "epoch": 0.24, "learning_rate": 0.0017684386353266262, "loss": 3.2117, "step": 9095 }, { "epoch": 0.24, "learning_rate": 0.0017683829339920215, "loss": 2.6485, "step": 9096 }, { "epoch": 0.24, "learning_rate": 0.0017683272268362853, "loss": 2.6995, "step": 9097 }, { "epoch": 0.24, "learning_rate": 0.0017682715138598393, "loss": 2.9551, "step": 9098 }, { "epoch": 0.24, "learning_rate": 0.0017682157950631057, "loss": 2.5092, "step": 9099 }, { "epoch": 0.24, "learning_rate": 0.0017681600704465067, "loss": 2.878, "step": 9100 }, { "epoch": 0.24, "learning_rate": 0.001768104340010464, "loss": 2.6013, "step": 9101 }, { "epoch": 0.24, "learning_rate": 0.0017680486037554004, "loss": 2.5199, "step": 9102 }, { "epoch": 0.24, "learning_rate": 0.001767992861681738, "loss": 2.5122, "step": 9103 }, { "epoch": 0.24, "learning_rate": 0.0017679371137898988, "loss": 2.5409, "step": 9104 }, { "epoch": 0.24, "learning_rate": 0.0017678813600803052, "loss": 2.4116, "step": 9105 }, { "epoch": 0.24, "learning_rate": 0.0017678256005533798, "loss": 2.8366, "step": 9106 }, { "epoch": 0.24, "learning_rate": 0.001767769835209545, "loss": 2.5088, "step": 9107 }, { "epoch": 0.24, "learning_rate": 0.001767714064049223, "loss": 2.4126, "step": 9108 }, { "epoch": 0.24, "learning_rate": 0.0017676582870728371, "loss": 2.6385, "step": 9109 }, { "epoch": 0.24, "learning_rate": 0.0017676025042808086, "loss": 2.3622, "step": 9110 }, { "epoch": 0.24, "learning_rate": 0.0017675467156735613, "loss": 2.6881, "step": 9111 }, { "epoch": 0.24, "learning_rate": 0.0017674909212515167, "loss": 2.3286, "step": 9112 }, { "epoch": 0.24, "learning_rate": 0.0017674351210150983, "loss": 2.5598, "step": 9113 }, { "epoch": 0.24, "learning_rate": 0.001767379314964729, "loss": 3.1799, "step": 9114 }, { "epoch": 0.24, "learning_rate": 0.0017673235031008306, "loss": 2.1589, "step": 9115 }, { "epoch": 0.24, "learning_rate": 0.001767267685423827, "loss": 2.7171, "step": 9116 }, { "epoch": 0.25, "learning_rate": 0.0017672118619341405, "loss": 2.4095, "step": 9117 }, { "epoch": 0.25, "learning_rate": 0.0017671560326321938, "loss": 2.8341, "step": 9118 }, { "epoch": 0.25, "learning_rate": 0.0017671001975184104, "loss": 2.7494, "step": 9119 }, { "epoch": 0.25, "learning_rate": 0.001767044356593213, "loss": 2.7186, "step": 9120 }, { "epoch": 0.25, "learning_rate": 0.0017669885098570248, "loss": 2.6973, "step": 9121 }, { "epoch": 0.25, "learning_rate": 0.0017669326573102686, "loss": 2.7705, "step": 9122 }, { "epoch": 0.25, "learning_rate": 0.0017668767989533678, "loss": 2.2492, "step": 9123 }, { "epoch": 0.25, "learning_rate": 0.0017668209347867457, "loss": 2.5457, "step": 9124 }, { "epoch": 0.25, "learning_rate": 0.0017667650648108251, "loss": 2.5801, "step": 9125 }, { "epoch": 0.25, "learning_rate": 0.0017667091890260294, "loss": 2.8255, "step": 9126 }, { "epoch": 0.25, "learning_rate": 0.0017666533074327817, "loss": 2.5248, "step": 9127 }, { "epoch": 0.25, "learning_rate": 0.001766597420031506, "loss": 2.788, "step": 9128 }, { "epoch": 0.25, "learning_rate": 0.0017665415268226252, "loss": 2.5532, "step": 9129 }, { "epoch": 0.25, "learning_rate": 0.0017664856278065632, "loss": 2.5188, "step": 9130 }, { "epoch": 0.25, "learning_rate": 0.0017664297229837425, "loss": 2.6697, "step": 9131 }, { "epoch": 0.25, "learning_rate": 0.0017663738123545874, "loss": 2.5973, "step": 9132 }, { "epoch": 0.25, "learning_rate": 0.0017663178959195216, "loss": 2.6464, "step": 9133 }, { "epoch": 0.25, "learning_rate": 0.0017662619736789683, "loss": 2.5104, "step": 9134 }, { "epoch": 0.25, "learning_rate": 0.0017662060456333508, "loss": 2.4638, "step": 9135 }, { "epoch": 0.25, "learning_rate": 0.001766150111783094, "loss": 2.6481, "step": 9136 }, { "epoch": 0.25, "learning_rate": 0.0017660941721286206, "loss": 2.3585, "step": 9137 }, { "epoch": 0.25, "learning_rate": 0.0017660382266703545, "loss": 2.6508, "step": 9138 }, { "epoch": 0.25, "learning_rate": 0.00176598227540872, "loss": 2.5811, "step": 9139 }, { "epoch": 0.25, "learning_rate": 0.0017659263183441407, "loss": 2.5466, "step": 9140 }, { "epoch": 0.25, "learning_rate": 0.0017658703554770407, "loss": 2.3738, "step": 9141 }, { "epoch": 0.25, "learning_rate": 0.0017658143868078439, "loss": 2.8417, "step": 9142 }, { "epoch": 0.25, "learning_rate": 0.001765758412336974, "loss": 2.3879, "step": 9143 }, { "epoch": 0.25, "learning_rate": 0.001765702432064855, "loss": 2.5666, "step": 9144 }, { "epoch": 0.25, "learning_rate": 0.0017656464459919116, "loss": 2.7718, "step": 9145 }, { "epoch": 0.25, "learning_rate": 0.0017655904541185677, "loss": 2.7931, "step": 9146 }, { "epoch": 0.25, "learning_rate": 0.001765534456445247, "loss": 2.4306, "step": 9147 }, { "epoch": 0.25, "learning_rate": 0.0017654784529723747, "loss": 2.6011, "step": 9148 }, { "epoch": 0.25, "learning_rate": 0.001765422443700374, "loss": 2.6802, "step": 9149 }, { "epoch": 0.25, "learning_rate": 0.0017653664286296697, "loss": 2.8488, "step": 9150 }, { "epoch": 0.25, "learning_rate": 0.0017653104077606865, "loss": 2.906, "step": 9151 }, { "epoch": 0.25, "learning_rate": 0.0017652543810938483, "loss": 2.5154, "step": 9152 }, { "epoch": 0.25, "learning_rate": 0.0017651983486295798, "loss": 2.0549, "step": 9153 }, { "epoch": 0.25, "learning_rate": 0.0017651423103683052, "loss": 2.8849, "step": 9154 }, { "epoch": 0.25, "learning_rate": 0.0017650862663104495, "loss": 2.6365, "step": 9155 }, { "epoch": 0.25, "learning_rate": 0.0017650302164564369, "loss": 2.5929, "step": 9156 }, { "epoch": 0.25, "learning_rate": 0.001764974160806692, "loss": 2.2841, "step": 9157 }, { "epoch": 0.25, "learning_rate": 0.00176491809936164, "loss": 3.1027, "step": 9158 }, { "epoch": 0.25, "learning_rate": 0.001764862032121705, "loss": 2.8239, "step": 9159 }, { "epoch": 0.25, "learning_rate": 0.001764805959087312, "loss": 3.0059, "step": 9160 }, { "epoch": 0.25, "learning_rate": 0.0017647498802588859, "loss": 2.5081, "step": 9161 }, { "epoch": 0.25, "learning_rate": 0.0017646937956368514, "loss": 2.6949, "step": 9162 }, { "epoch": 0.25, "learning_rate": 0.0017646377052216334, "loss": 2.6518, "step": 9163 }, { "epoch": 0.25, "learning_rate": 0.0017645816090136567, "loss": 2.5884, "step": 9164 }, { "epoch": 0.25, "learning_rate": 0.0017645255070133467, "loss": 2.8814, "step": 9165 }, { "epoch": 0.25, "learning_rate": 0.0017644693992211278, "loss": 2.701, "step": 9166 }, { "epoch": 0.25, "learning_rate": 0.0017644132856374257, "loss": 2.404, "step": 9167 }, { "epoch": 0.25, "learning_rate": 0.001764357166262665, "loss": 2.6653, "step": 9168 }, { "epoch": 0.25, "learning_rate": 0.0017643010410972712, "loss": 2.4369, "step": 9169 }, { "epoch": 0.25, "learning_rate": 0.0017642449101416694, "loss": 2.5772, "step": 9170 }, { "epoch": 0.25, "learning_rate": 0.0017641887733962846, "loss": 2.0077, "step": 9171 }, { "epoch": 0.25, "learning_rate": 0.0017641326308615425, "loss": 2.5694, "step": 9172 }, { "epoch": 0.25, "learning_rate": 0.0017640764825378682, "loss": 2.7444, "step": 9173 }, { "epoch": 0.25, "learning_rate": 0.001764020328425687, "loss": 2.5573, "step": 9174 }, { "epoch": 0.25, "learning_rate": 0.0017639641685254243, "loss": 2.9307, "step": 9175 }, { "epoch": 0.25, "learning_rate": 0.0017639080028375056, "loss": 2.8585, "step": 9176 }, { "epoch": 0.25, "learning_rate": 0.0017638518313623567, "loss": 2.4839, "step": 9177 }, { "epoch": 0.25, "learning_rate": 0.0017637956541004028, "loss": 2.1754, "step": 9178 }, { "epoch": 0.25, "learning_rate": 0.0017637394710520696, "loss": 2.6855, "step": 9179 }, { "epoch": 0.25, "learning_rate": 0.0017636832822177824, "loss": 2.6241, "step": 9180 }, { "epoch": 0.25, "learning_rate": 0.0017636270875979675, "loss": 2.433, "step": 9181 }, { "epoch": 0.25, "learning_rate": 0.0017635708871930503, "loss": 2.3781, "step": 9182 }, { "epoch": 0.25, "learning_rate": 0.0017635146810034566, "loss": 2.8171, "step": 9183 }, { "epoch": 0.25, "learning_rate": 0.001763458469029612, "loss": 1.8467, "step": 9184 }, { "epoch": 0.25, "learning_rate": 0.0017634022512719426, "loss": 2.3973, "step": 9185 }, { "epoch": 0.25, "learning_rate": 0.001763346027730874, "loss": 2.8451, "step": 9186 }, { "epoch": 0.25, "learning_rate": 0.0017632897984068328, "loss": 2.7043, "step": 9187 }, { "epoch": 0.25, "learning_rate": 0.0017632335633002442, "loss": 2.5674, "step": 9188 }, { "epoch": 0.25, "learning_rate": 0.0017631773224115349, "loss": 2.5751, "step": 9189 }, { "epoch": 0.25, "learning_rate": 0.0017631210757411305, "loss": 2.5102, "step": 9190 }, { "epoch": 0.25, "learning_rate": 0.001763064823289457, "loss": 2.3253, "step": 9191 }, { "epoch": 0.25, "learning_rate": 0.0017630085650569415, "loss": 2.5482, "step": 9192 }, { "epoch": 0.25, "learning_rate": 0.0017629523010440087, "loss": 2.4937, "step": 9193 }, { "epoch": 0.25, "learning_rate": 0.0017628960312510863, "loss": 2.774, "step": 9194 }, { "epoch": 0.25, "learning_rate": 0.0017628397556785995, "loss": 2.5705, "step": 9195 }, { "epoch": 0.25, "learning_rate": 0.0017627834743269752, "loss": 2.9381, "step": 9196 }, { "epoch": 0.25, "learning_rate": 0.0017627271871966399, "loss": 2.5968, "step": 9197 }, { "epoch": 0.25, "learning_rate": 0.0017626708942880198, "loss": 2.6562, "step": 9198 }, { "epoch": 0.25, "learning_rate": 0.0017626145956015412, "loss": 2.9143, "step": 9199 }, { "epoch": 0.25, "learning_rate": 0.0017625582911376307, "loss": 2.7493, "step": 9200 }, { "epoch": 0.25, "learning_rate": 0.001762501980896715, "loss": 2.7455, "step": 9201 }, { "epoch": 0.25, "learning_rate": 0.0017624456648792208, "loss": 2.3504, "step": 9202 }, { "epoch": 0.25, "learning_rate": 0.0017623893430855743, "loss": 2.1476, "step": 9203 }, { "epoch": 0.25, "learning_rate": 0.0017623330155162025, "loss": 3.0279, "step": 9204 }, { "epoch": 0.25, "learning_rate": 0.001762276682171532, "loss": 2.7783, "step": 9205 }, { "epoch": 0.25, "learning_rate": 0.0017622203430519901, "loss": 2.5444, "step": 9206 }, { "epoch": 0.25, "learning_rate": 0.0017621639981580026, "loss": 2.4406, "step": 9207 }, { "epoch": 0.25, "learning_rate": 0.0017621076474899971, "loss": 2.4721, "step": 9208 }, { "epoch": 0.25, "learning_rate": 0.0017620512910484006, "loss": 2.6044, "step": 9209 }, { "epoch": 0.25, "learning_rate": 0.0017619949288336394, "loss": 2.7925, "step": 9210 }, { "epoch": 0.25, "learning_rate": 0.0017619385608461408, "loss": 2.7063, "step": 9211 }, { "epoch": 0.25, "learning_rate": 0.001761882187086332, "loss": 2.1307, "step": 9212 }, { "epoch": 0.25, "learning_rate": 0.00176182580755464, "loss": 2.8136, "step": 9213 }, { "epoch": 0.25, "learning_rate": 0.0017617694222514919, "loss": 2.214, "step": 9214 }, { "epoch": 0.25, "learning_rate": 0.0017617130311773149, "loss": 2.9817, "step": 9215 }, { "epoch": 0.25, "learning_rate": 0.001761656634332536, "loss": 2.7674, "step": 9216 }, { "epoch": 0.25, "learning_rate": 0.0017616002317175825, "loss": 2.5687, "step": 9217 }, { "epoch": 0.25, "learning_rate": 0.0017615438233328823, "loss": 2.4731, "step": 9218 }, { "epoch": 0.25, "learning_rate": 0.0017614874091788617, "loss": 2.4283, "step": 9219 }, { "epoch": 0.25, "learning_rate": 0.001761430989255949, "loss": 2.4078, "step": 9220 }, { "epoch": 0.25, "learning_rate": 0.001761374563564571, "loss": 2.4393, "step": 9221 }, { "epoch": 0.25, "learning_rate": 0.0017613181321051554, "loss": 2.576, "step": 9222 }, { "epoch": 0.25, "learning_rate": 0.00176126169487813, "loss": 2.4747, "step": 9223 }, { "epoch": 0.25, "learning_rate": 0.0017612052518839222, "loss": 2.8705, "step": 9224 }, { "epoch": 0.25, "learning_rate": 0.0017611488031229591, "loss": 2.9597, "step": 9225 }, { "epoch": 0.25, "learning_rate": 0.001761092348595669, "loss": 2.8232, "step": 9226 }, { "epoch": 0.25, "learning_rate": 0.0017610358883024793, "loss": 2.7092, "step": 9227 }, { "epoch": 0.25, "learning_rate": 0.0017609794222438178, "loss": 2.9312, "step": 9228 }, { "epoch": 0.25, "learning_rate": 0.001760922950420112, "loss": 2.6862, "step": 9229 }, { "epoch": 0.25, "learning_rate": 0.0017608664728317903, "loss": 2.7463, "step": 9230 }, { "epoch": 0.25, "learning_rate": 0.0017608099894792799, "loss": 2.9132, "step": 9231 }, { "epoch": 0.25, "learning_rate": 0.0017607535003630096, "loss": 2.9393, "step": 9232 }, { "epoch": 0.25, "learning_rate": 0.0017606970054834061, "loss": 2.2897, "step": 9233 }, { "epoch": 0.25, "learning_rate": 0.0017606405048408984, "loss": 2.5514, "step": 9234 }, { "epoch": 0.25, "learning_rate": 0.0017605839984359145, "loss": 2.5139, "step": 9235 }, { "epoch": 0.25, "learning_rate": 0.0017605274862688817, "loss": 2.4962, "step": 9236 }, { "epoch": 0.25, "learning_rate": 0.001760470968340229, "loss": 2.7336, "step": 9237 }, { "epoch": 0.25, "learning_rate": 0.001760414444650384, "loss": 2.5033, "step": 9238 }, { "epoch": 0.25, "learning_rate": 0.0017603579151997753, "loss": 2.3545, "step": 9239 }, { "epoch": 0.25, "learning_rate": 0.0017603013799888307, "loss": 2.6034, "step": 9240 }, { "epoch": 0.25, "learning_rate": 0.001760244839017979, "loss": 2.4649, "step": 9241 }, { "epoch": 0.25, "learning_rate": 0.0017601882922876483, "loss": 2.1575, "step": 9242 }, { "epoch": 0.25, "learning_rate": 0.001760131739798267, "loss": 2.505, "step": 9243 }, { "epoch": 0.25, "learning_rate": 0.0017600751815502634, "loss": 2.8009, "step": 9244 }, { "epoch": 0.25, "learning_rate": 0.0017600186175440664, "loss": 2.5221, "step": 9245 }, { "epoch": 0.25, "learning_rate": 0.001759962047780104, "loss": 2.5983, "step": 9246 }, { "epoch": 0.25, "learning_rate": 0.001759905472258805, "loss": 2.6397, "step": 9247 }, { "epoch": 0.25, "learning_rate": 0.0017598488909805982, "loss": 2.4217, "step": 9248 }, { "epoch": 0.25, "learning_rate": 0.0017597923039459119, "loss": 2.2678, "step": 9249 }, { "epoch": 0.25, "learning_rate": 0.0017597357111551748, "loss": 2.2945, "step": 9250 }, { "epoch": 0.25, "learning_rate": 0.0017596791126088158, "loss": 2.1467, "step": 9251 }, { "epoch": 0.25, "learning_rate": 0.0017596225083072639, "loss": 2.7076, "step": 9252 }, { "epoch": 0.25, "learning_rate": 0.0017595658982509476, "loss": 2.7997, "step": 9253 }, { "epoch": 0.25, "learning_rate": 0.0017595092824402958, "loss": 2.644, "step": 9254 }, { "epoch": 0.25, "learning_rate": 0.0017594526608757377, "loss": 2.1581, "step": 9255 }, { "epoch": 0.25, "learning_rate": 0.0017593960335577016, "loss": 2.7991, "step": 9256 }, { "epoch": 0.25, "learning_rate": 0.001759339400486617, "loss": 2.8512, "step": 9257 }, { "epoch": 0.25, "learning_rate": 0.0017592827616629131, "loss": 2.6309, "step": 9258 }, { "epoch": 0.25, "learning_rate": 0.0017592261170870187, "loss": 2.7851, "step": 9259 }, { "epoch": 0.25, "learning_rate": 0.0017591694667593628, "loss": 2.8698, "step": 9260 }, { "epoch": 0.25, "learning_rate": 0.0017591128106803748, "loss": 2.4821, "step": 9261 }, { "epoch": 0.25, "learning_rate": 0.001759056148850484, "loss": 2.0285, "step": 9262 }, { "epoch": 0.25, "learning_rate": 0.0017589994812701195, "loss": 2.5633, "step": 9263 }, { "epoch": 0.25, "learning_rate": 0.0017589428079397105, "loss": 2.8594, "step": 9264 }, { "epoch": 0.25, "learning_rate": 0.0017588861288596865, "loss": 2.4569, "step": 9265 }, { "epoch": 0.25, "learning_rate": 0.0017588294440304768, "loss": 2.9056, "step": 9266 }, { "epoch": 0.25, "learning_rate": 0.0017587727534525111, "loss": 2.7137, "step": 9267 }, { "epoch": 0.25, "learning_rate": 0.0017587160571262187, "loss": 2.4823, "step": 9268 }, { "epoch": 0.25, "learning_rate": 0.0017586593550520289, "loss": 2.4502, "step": 9269 }, { "epoch": 0.25, "learning_rate": 0.0017586026472303712, "loss": 2.5363, "step": 9270 }, { "epoch": 0.25, "learning_rate": 0.001758545933661676, "loss": 2.4106, "step": 9271 }, { "epoch": 0.25, "learning_rate": 0.0017584892143463723, "loss": 2.494, "step": 9272 }, { "epoch": 0.25, "learning_rate": 0.0017584324892848898, "loss": 2.6422, "step": 9273 }, { "epoch": 0.25, "learning_rate": 0.0017583757584776585, "loss": 2.4399, "step": 9274 }, { "epoch": 0.25, "learning_rate": 0.0017583190219251077, "loss": 2.4027, "step": 9275 }, { "epoch": 0.25, "learning_rate": 0.001758262279627668, "loss": 2.7997, "step": 9276 }, { "epoch": 0.25, "learning_rate": 0.0017582055315857686, "loss": 2.3147, "step": 9277 }, { "epoch": 0.25, "learning_rate": 0.0017581487777998395, "loss": 2.7145, "step": 9278 }, { "epoch": 0.25, "learning_rate": 0.001758092018270311, "loss": 2.5507, "step": 9279 }, { "epoch": 0.25, "learning_rate": 0.0017580352529976131, "loss": 3.012, "step": 9280 }, { "epoch": 0.25, "learning_rate": 0.0017579784819821754, "loss": 2.3486, "step": 9281 }, { "epoch": 0.25, "learning_rate": 0.0017579217052244283, "loss": 2.5284, "step": 9282 }, { "epoch": 0.25, "learning_rate": 0.0017578649227248016, "loss": 2.7739, "step": 9283 }, { "epoch": 0.25, "learning_rate": 0.0017578081344837263, "loss": 2.3567, "step": 9284 }, { "epoch": 0.25, "learning_rate": 0.0017577513405016313, "loss": 2.5904, "step": 9285 }, { "epoch": 0.25, "learning_rate": 0.0017576945407789483, "loss": 2.6764, "step": 9286 }, { "epoch": 0.25, "learning_rate": 0.0017576377353161067, "loss": 2.6557, "step": 9287 }, { "epoch": 0.25, "learning_rate": 0.001757580924113537, "loss": 2.6272, "step": 9288 }, { "epoch": 0.25, "learning_rate": 0.0017575241071716697, "loss": 2.4796, "step": 9289 }, { "epoch": 0.25, "learning_rate": 0.0017574672844909351, "loss": 2.2291, "step": 9290 }, { "epoch": 0.25, "learning_rate": 0.0017574104560717642, "loss": 2.7611, "step": 9291 }, { "epoch": 0.25, "learning_rate": 0.0017573536219145866, "loss": 2.3363, "step": 9292 }, { "epoch": 0.25, "learning_rate": 0.0017572967820198336, "loss": 2.7996, "step": 9293 }, { "epoch": 0.25, "learning_rate": 0.0017572399363879354, "loss": 2.1404, "step": 9294 }, { "epoch": 0.25, "learning_rate": 0.0017571830850193226, "loss": 2.8247, "step": 9295 }, { "epoch": 0.25, "learning_rate": 0.0017571262279144268, "loss": 2.2081, "step": 9296 }, { "epoch": 0.25, "learning_rate": 0.0017570693650736774, "loss": 2.5496, "step": 9297 }, { "epoch": 0.25, "learning_rate": 0.0017570124964975064, "loss": 2.6896, "step": 9298 }, { "epoch": 0.25, "learning_rate": 0.0017569556221863438, "loss": 2.5663, "step": 9299 }, { "epoch": 0.25, "learning_rate": 0.0017568987421406207, "loss": 2.536, "step": 9300 }, { "epoch": 0.25, "learning_rate": 0.0017568418563607682, "loss": 2.6168, "step": 9301 }, { "epoch": 0.25, "learning_rate": 0.001756784964847217, "loss": 2.2773, "step": 9302 }, { "epoch": 0.25, "learning_rate": 0.001756728067600398, "loss": 2.3608, "step": 9303 }, { "epoch": 0.25, "learning_rate": 0.0017566711646207426, "loss": 2.5803, "step": 9304 }, { "epoch": 0.25, "learning_rate": 0.001756614255908682, "loss": 2.2968, "step": 9305 }, { "epoch": 0.25, "learning_rate": 0.0017565573414646467, "loss": 2.3896, "step": 9306 }, { "epoch": 0.25, "learning_rate": 0.0017565004212890685, "loss": 2.5866, "step": 9307 }, { "epoch": 0.25, "learning_rate": 0.0017564434953823782, "loss": 2.6597, "step": 9308 }, { "epoch": 0.25, "learning_rate": 0.0017563865637450075, "loss": 2.5005, "step": 9309 }, { "epoch": 0.25, "learning_rate": 0.0017563296263773869, "loss": 2.5965, "step": 9310 }, { "epoch": 0.25, "learning_rate": 0.0017562726832799488, "loss": 2.6361, "step": 9311 }, { "epoch": 0.25, "learning_rate": 0.0017562157344531237, "loss": 2.9592, "step": 9312 }, { "epoch": 0.25, "learning_rate": 0.0017561587798973438, "loss": 3.102, "step": 9313 }, { "epoch": 0.25, "learning_rate": 0.00175610181961304, "loss": 2.0588, "step": 9314 }, { "epoch": 0.25, "learning_rate": 0.0017560448536006437, "loss": 2.3691, "step": 9315 }, { "epoch": 0.25, "learning_rate": 0.001755987881860587, "loss": 2.594, "step": 9316 }, { "epoch": 0.25, "learning_rate": 0.001755930904393301, "loss": 2.4749, "step": 9317 }, { "epoch": 0.25, "learning_rate": 0.0017558739211992178, "loss": 2.5332, "step": 9318 }, { "epoch": 0.25, "learning_rate": 0.001755816932278769, "loss": 2.5017, "step": 9319 }, { "epoch": 0.25, "learning_rate": 0.0017557599376323862, "loss": 2.9192, "step": 9320 }, { "epoch": 0.25, "learning_rate": 0.0017557029372605012, "loss": 2.9562, "step": 9321 }, { "epoch": 0.25, "learning_rate": 0.001755645931163546, "loss": 2.5892, "step": 9322 }, { "epoch": 0.25, "learning_rate": 0.0017555889193419524, "loss": 2.3448, "step": 9323 }, { "epoch": 0.25, "learning_rate": 0.001755531901796152, "loss": 2.3121, "step": 9324 }, { "epoch": 0.25, "learning_rate": 0.001755474878526577, "loss": 2.6463, "step": 9325 }, { "epoch": 0.25, "learning_rate": 0.0017554178495336591, "loss": 2.6805, "step": 9326 }, { "epoch": 0.25, "learning_rate": 0.0017553608148178311, "loss": 2.8027, "step": 9327 }, { "epoch": 0.25, "learning_rate": 0.0017553037743795244, "loss": 2.9039, "step": 9328 }, { "epoch": 0.25, "learning_rate": 0.0017552467282191714, "loss": 2.3215, "step": 9329 }, { "epoch": 0.25, "learning_rate": 0.0017551896763372042, "loss": 2.8503, "step": 9330 }, { "epoch": 0.25, "learning_rate": 0.001755132618734055, "loss": 2.8141, "step": 9331 }, { "epoch": 0.25, "learning_rate": 0.0017550755554101563, "loss": 2.4931, "step": 9332 }, { "epoch": 0.25, "learning_rate": 0.0017550184863659398, "loss": 2.3601, "step": 9333 }, { "epoch": 0.25, "learning_rate": 0.0017549614116018387, "loss": 2.7539, "step": 9334 }, { "epoch": 0.25, "learning_rate": 0.0017549043311182845, "loss": 2.7245, "step": 9335 }, { "epoch": 0.25, "learning_rate": 0.0017548472449157102, "loss": 2.4257, "step": 9336 }, { "epoch": 0.25, "learning_rate": 0.001754790152994548, "loss": 2.5711, "step": 9337 }, { "epoch": 0.25, "learning_rate": 0.0017547330553552307, "loss": 2.5284, "step": 9338 }, { "epoch": 0.25, "learning_rate": 0.0017546759519981908, "loss": 2.6146, "step": 9339 }, { "epoch": 0.25, "learning_rate": 0.0017546188429238608, "loss": 2.7379, "step": 9340 }, { "epoch": 0.25, "learning_rate": 0.001754561728132673, "loss": 2.4355, "step": 9341 }, { "epoch": 0.25, "learning_rate": 0.0017545046076250608, "loss": 2.3588, "step": 9342 }, { "epoch": 0.25, "learning_rate": 0.0017544474814014564, "loss": 2.5671, "step": 9343 }, { "epoch": 0.25, "learning_rate": 0.001754390349462293, "loss": 2.8666, "step": 9344 }, { "epoch": 0.25, "learning_rate": 0.001754333211808003, "loss": 2.461, "step": 9345 }, { "epoch": 0.25, "learning_rate": 0.0017542760684390194, "loss": 3.2127, "step": 9346 }, { "epoch": 0.25, "learning_rate": 0.0017542189193557754, "loss": 2.6725, "step": 9347 }, { "epoch": 0.25, "learning_rate": 0.0017541617645587034, "loss": 2.5652, "step": 9348 }, { "epoch": 0.25, "learning_rate": 0.0017541046040482368, "loss": 2.6092, "step": 9349 }, { "epoch": 0.25, "learning_rate": 0.0017540474378248089, "loss": 2.5655, "step": 9350 }, { "epoch": 0.25, "learning_rate": 0.0017539902658888517, "loss": 2.8835, "step": 9351 }, { "epoch": 0.25, "learning_rate": 0.0017539330882407997, "loss": 3.0917, "step": 9352 }, { "epoch": 0.25, "learning_rate": 0.001753875904881085, "loss": 2.7632, "step": 9353 }, { "epoch": 0.25, "learning_rate": 0.0017538187158101417, "loss": 2.4139, "step": 9354 }, { "epoch": 0.25, "learning_rate": 0.0017537615210284022, "loss": 2.4372, "step": 9355 }, { "epoch": 0.25, "learning_rate": 0.0017537043205363002, "loss": 2.4014, "step": 9356 }, { "epoch": 0.25, "learning_rate": 0.0017536471143342692, "loss": 2.6654, "step": 9357 }, { "epoch": 0.25, "learning_rate": 0.0017535899024227423, "loss": 2.4111, "step": 9358 }, { "epoch": 0.25, "learning_rate": 0.001753532684802153, "loss": 2.716, "step": 9359 }, { "epoch": 0.25, "learning_rate": 0.001753475461472935, "loss": 2.8091, "step": 9360 }, { "epoch": 0.25, "learning_rate": 0.001753418232435521, "loss": 3.0232, "step": 9361 }, { "epoch": 0.25, "learning_rate": 0.0017533609976903457, "loss": 2.2489, "step": 9362 }, { "epoch": 0.25, "learning_rate": 0.001753303757237842, "loss": 2.5267, "step": 9363 }, { "epoch": 0.25, "learning_rate": 0.0017532465110784439, "loss": 2.4085, "step": 9364 }, { "epoch": 0.25, "learning_rate": 0.0017531892592125846, "loss": 2.6533, "step": 9365 }, { "epoch": 0.25, "learning_rate": 0.0017531320016406983, "loss": 2.4415, "step": 9366 }, { "epoch": 0.25, "learning_rate": 0.0017530747383632187, "loss": 2.5022, "step": 9367 }, { "epoch": 0.25, "learning_rate": 0.0017530174693805797, "loss": 2.2599, "step": 9368 }, { "epoch": 0.25, "learning_rate": 0.0017529601946932145, "loss": 2.8014, "step": 9369 }, { "epoch": 0.25, "learning_rate": 0.0017529029143015578, "loss": 2.4811, "step": 9370 }, { "epoch": 0.25, "learning_rate": 0.001752845628206043, "loss": 2.7217, "step": 9371 }, { "epoch": 0.25, "learning_rate": 0.0017527883364071043, "loss": 2.7342, "step": 9372 }, { "epoch": 0.25, "learning_rate": 0.001752731038905176, "loss": 2.3807, "step": 9373 }, { "epoch": 0.25, "learning_rate": 0.0017526737357006917, "loss": 2.8511, "step": 9374 }, { "epoch": 0.25, "learning_rate": 0.001752616426794086, "loss": 2.4715, "step": 9375 }, { "epoch": 0.25, "learning_rate": 0.0017525591121857927, "loss": 2.4406, "step": 9376 }, { "epoch": 0.25, "learning_rate": 0.001752501791876246, "loss": 2.5175, "step": 9377 }, { "epoch": 0.25, "learning_rate": 0.0017524444658658803, "loss": 2.7399, "step": 9378 }, { "epoch": 0.25, "learning_rate": 0.00175238713415513, "loss": 2.3879, "step": 9379 }, { "epoch": 0.25, "learning_rate": 0.001752329796744429, "loss": 2.4083, "step": 9380 }, { "epoch": 0.25, "learning_rate": 0.001752272453634212, "loss": 2.6352, "step": 9381 }, { "epoch": 0.25, "learning_rate": 0.0017522151048249138, "loss": 2.6332, "step": 9382 }, { "epoch": 0.25, "learning_rate": 0.0017521577503169681, "loss": 2.7793, "step": 9383 }, { "epoch": 0.25, "learning_rate": 0.00175210039011081, "loss": 2.9961, "step": 9384 }, { "epoch": 0.25, "learning_rate": 0.0017520430242068735, "loss": 2.3996, "step": 9385 }, { "epoch": 0.25, "learning_rate": 0.0017519856526055934, "loss": 2.923, "step": 9386 }, { "epoch": 0.25, "learning_rate": 0.001751928275307405, "loss": 2.5563, "step": 9387 }, { "epoch": 0.25, "learning_rate": 0.0017518708923127417, "loss": 2.7841, "step": 9388 }, { "epoch": 0.25, "learning_rate": 0.0017518135036220395, "loss": 2.3652, "step": 9389 }, { "epoch": 0.25, "learning_rate": 0.0017517561092357324, "loss": 2.7984, "step": 9390 }, { "epoch": 0.25, "learning_rate": 0.0017516987091542556, "loss": 2.7146, "step": 9391 }, { "epoch": 0.25, "learning_rate": 0.0017516413033780434, "loss": 2.8989, "step": 9392 }, { "epoch": 0.25, "learning_rate": 0.0017515838919075315, "loss": 2.9582, "step": 9393 }, { "epoch": 0.25, "learning_rate": 0.0017515264747431539, "loss": 2.76, "step": 9394 }, { "epoch": 0.25, "learning_rate": 0.0017514690518853464, "loss": 2.534, "step": 9395 }, { "epoch": 0.25, "learning_rate": 0.001751411623334544, "loss": 2.4943, "step": 9396 }, { "epoch": 0.25, "learning_rate": 0.001751354189091181, "loss": 2.2644, "step": 9397 }, { "epoch": 0.25, "learning_rate": 0.001751296749155693, "loss": 2.7473, "step": 9398 }, { "epoch": 0.25, "learning_rate": 0.0017512393035285154, "loss": 2.7001, "step": 9399 }, { "epoch": 0.25, "learning_rate": 0.0017511818522100834, "loss": 2.6866, "step": 9400 }, { "epoch": 0.25, "learning_rate": 0.0017511243952008316, "loss": 2.213, "step": 9401 }, { "epoch": 0.25, "learning_rate": 0.0017510669325011957, "loss": 2.8825, "step": 9402 }, { "epoch": 0.25, "learning_rate": 0.0017510094641116107, "loss": 2.7171, "step": 9403 }, { "epoch": 0.25, "learning_rate": 0.0017509519900325125, "loss": 2.6982, "step": 9404 }, { "epoch": 0.25, "learning_rate": 0.0017508945102643369, "loss": 2.647, "step": 9405 }, { "epoch": 0.25, "learning_rate": 0.001750837024807518, "loss": 2.9244, "step": 9406 }, { "epoch": 0.25, "learning_rate": 0.001750779533662492, "loss": 2.5981, "step": 9407 }, { "epoch": 0.25, "learning_rate": 0.001750722036829695, "loss": 2.7573, "step": 9408 }, { "epoch": 0.25, "learning_rate": 0.0017506645343095615, "loss": 2.6351, "step": 9409 }, { "epoch": 0.25, "learning_rate": 0.0017506070261025283, "loss": 2.4786, "step": 9410 }, { "epoch": 0.25, "learning_rate": 0.00175054951220903, "loss": 2.375, "step": 9411 }, { "epoch": 0.25, "learning_rate": 0.001750491992629503, "loss": 2.6063, "step": 9412 }, { "epoch": 0.25, "learning_rate": 0.0017504344673643826, "loss": 2.5833, "step": 9413 }, { "epoch": 0.25, "learning_rate": 0.0017503769364141052, "loss": 2.7503, "step": 9414 }, { "epoch": 0.25, "learning_rate": 0.001750319399779106, "loss": 2.7259, "step": 9415 }, { "epoch": 0.25, "learning_rate": 0.0017502618574598212, "loss": 2.3801, "step": 9416 }, { "epoch": 0.25, "learning_rate": 0.0017502043094566866, "loss": 3.3173, "step": 9417 }, { "epoch": 0.25, "learning_rate": 0.0017501467557701385, "loss": 2.5111, "step": 9418 }, { "epoch": 0.25, "learning_rate": 0.0017500891964006126, "loss": 2.6336, "step": 9419 }, { "epoch": 0.25, "learning_rate": 0.0017500316313485455, "loss": 2.45, "step": 9420 }, { "epoch": 0.25, "learning_rate": 0.001749974060614372, "loss": 2.3561, "step": 9421 }, { "epoch": 0.25, "learning_rate": 0.0017499164841985296, "loss": 2.5715, "step": 9422 }, { "epoch": 0.25, "learning_rate": 0.001749858902101454, "loss": 2.3944, "step": 9423 }, { "epoch": 0.25, "learning_rate": 0.0017498013143235813, "loss": 2.4309, "step": 9424 }, { "epoch": 0.25, "learning_rate": 0.0017497437208653479, "loss": 2.4797, "step": 9425 }, { "epoch": 0.25, "learning_rate": 0.0017496861217271903, "loss": 2.4628, "step": 9426 }, { "epoch": 0.25, "learning_rate": 0.0017496285169095445, "loss": 2.7082, "step": 9427 }, { "epoch": 0.25, "learning_rate": 0.0017495709064128471, "loss": 2.3864, "step": 9428 }, { "epoch": 0.25, "learning_rate": 0.0017495132902375344, "loss": 2.779, "step": 9429 }, { "epoch": 0.25, "learning_rate": 0.0017494556683840432, "loss": 2.8783, "step": 9430 }, { "epoch": 0.25, "learning_rate": 0.00174939804085281, "loss": 3.1358, "step": 9431 }, { "epoch": 0.25, "learning_rate": 0.001749340407644271, "loss": 2.7277, "step": 9432 }, { "epoch": 0.25, "learning_rate": 0.0017492827687588628, "loss": 2.5248, "step": 9433 }, { "epoch": 0.25, "learning_rate": 0.0017492251241970225, "loss": 2.7673, "step": 9434 }, { "epoch": 0.25, "learning_rate": 0.001749167473959187, "loss": 2.797, "step": 9435 }, { "epoch": 0.25, "learning_rate": 0.0017491098180457923, "loss": 2.5633, "step": 9436 }, { "epoch": 0.25, "learning_rate": 0.0017490521564572754, "loss": 2.2179, "step": 9437 }, { "epoch": 0.25, "learning_rate": 0.0017489944891940735, "loss": 2.6483, "step": 9438 }, { "epoch": 0.25, "learning_rate": 0.001748936816256623, "loss": 2.5496, "step": 9439 }, { "epoch": 0.25, "learning_rate": 0.0017488791376453615, "loss": 2.539, "step": 9440 }, { "epoch": 0.25, "learning_rate": 0.0017488214533607253, "loss": 2.5033, "step": 9441 }, { "epoch": 0.25, "learning_rate": 0.0017487637634031516, "loss": 2.8406, "step": 9442 }, { "epoch": 0.25, "learning_rate": 0.0017487060677730776, "loss": 2.5225, "step": 9443 }, { "epoch": 0.25, "learning_rate": 0.00174864836647094, "loss": 2.4157, "step": 9444 }, { "epoch": 0.25, "learning_rate": 0.0017485906594971767, "loss": 2.4004, "step": 9445 }, { "epoch": 0.25, "learning_rate": 0.0017485329468522241, "loss": 2.4074, "step": 9446 }, { "epoch": 0.25, "learning_rate": 0.0017484752285365198, "loss": 2.478, "step": 9447 }, { "epoch": 0.25, "learning_rate": 0.0017484175045505011, "loss": 2.4078, "step": 9448 }, { "epoch": 0.25, "learning_rate": 0.001748359774894605, "loss": 2.723, "step": 9449 }, { "epoch": 0.25, "learning_rate": 0.001748302039569269, "loss": 2.4185, "step": 9450 }, { "epoch": 0.25, "learning_rate": 0.0017482442985749308, "loss": 2.3314, "step": 9451 }, { "epoch": 0.25, "learning_rate": 0.0017481865519120272, "loss": 2.94, "step": 9452 }, { "epoch": 0.25, "learning_rate": 0.0017481287995809965, "loss": 2.7624, "step": 9453 }, { "epoch": 0.25, "learning_rate": 0.0017480710415822753, "loss": 2.547, "step": 9454 }, { "epoch": 0.25, "learning_rate": 0.0017480132779163018, "loss": 2.433, "step": 9455 }, { "epoch": 0.25, "learning_rate": 0.0017479555085835134, "loss": 2.5985, "step": 9456 }, { "epoch": 0.25, "learning_rate": 0.001747897733584348, "loss": 2.1676, "step": 9457 }, { "epoch": 0.25, "learning_rate": 0.001747839952919243, "loss": 2.749, "step": 9458 }, { "epoch": 0.25, "learning_rate": 0.0017477821665886361, "loss": 2.2683, "step": 9459 }, { "epoch": 0.25, "learning_rate": 0.0017477243745929653, "loss": 2.5745, "step": 9460 }, { "epoch": 0.25, "learning_rate": 0.0017476665769326682, "loss": 2.6587, "step": 9461 }, { "epoch": 0.25, "learning_rate": 0.0017476087736081828, "loss": 2.8173, "step": 9462 }, { "epoch": 0.25, "learning_rate": 0.0017475509646199471, "loss": 2.3175, "step": 9463 }, { "epoch": 0.25, "learning_rate": 0.001747493149968399, "loss": 2.6053, "step": 9464 }, { "epoch": 0.25, "learning_rate": 0.0017474353296539765, "loss": 2.7961, "step": 9465 }, { "epoch": 0.25, "learning_rate": 0.0017473775036771172, "loss": 2.8052, "step": 9466 }, { "epoch": 0.25, "learning_rate": 0.00174731967203826, "loss": 2.6393, "step": 9467 }, { "epoch": 0.25, "learning_rate": 0.0017472618347378422, "loss": 2.8221, "step": 9468 }, { "epoch": 0.25, "learning_rate": 0.0017472039917763025, "loss": 2.4696, "step": 9469 }, { "epoch": 0.25, "learning_rate": 0.0017471461431540786, "loss": 2.609, "step": 9470 }, { "epoch": 0.25, "learning_rate": 0.0017470882888716097, "loss": 2.4769, "step": 9471 }, { "epoch": 0.25, "learning_rate": 0.0017470304289293331, "loss": 2.6423, "step": 9472 }, { "epoch": 0.25, "learning_rate": 0.0017469725633276875, "loss": 2.0379, "step": 9473 }, { "epoch": 0.25, "learning_rate": 0.0017469146920671115, "loss": 2.3333, "step": 9474 }, { "epoch": 0.25, "learning_rate": 0.0017468568151480434, "loss": 2.7124, "step": 9475 }, { "epoch": 0.25, "learning_rate": 0.0017467989325709215, "loss": 3.082, "step": 9476 }, { "epoch": 0.25, "learning_rate": 0.0017467410443361845, "loss": 3.0048, "step": 9477 }, { "epoch": 0.25, "learning_rate": 0.0017466831504442705, "loss": 2.0255, "step": 9478 }, { "epoch": 0.25, "learning_rate": 0.0017466252508956189, "loss": 2.6726, "step": 9479 }, { "epoch": 0.25, "learning_rate": 0.0017465673456906674, "loss": 2.5805, "step": 9480 }, { "epoch": 0.25, "learning_rate": 0.0017465094348298555, "loss": 2.4659, "step": 9481 }, { "epoch": 0.25, "learning_rate": 0.0017464515183136214, "loss": 2.221, "step": 9482 }, { "epoch": 0.25, "learning_rate": 0.0017463935961424043, "loss": 2.6854, "step": 9483 }, { "epoch": 0.25, "learning_rate": 0.0017463356683166424, "loss": 2.5674, "step": 9484 }, { "epoch": 0.25, "learning_rate": 0.001746277734836775, "loss": 2.2003, "step": 9485 }, { "epoch": 0.25, "learning_rate": 0.0017462197957032414, "loss": 2.7114, "step": 9486 }, { "epoch": 0.25, "learning_rate": 0.0017461618509164794, "loss": 2.5584, "step": 9487 }, { "epoch": 0.25, "learning_rate": 0.0017461039004769289, "loss": 2.7875, "step": 9488 }, { "epoch": 0.26, "learning_rate": 0.0017460459443850288, "loss": 2.5498, "step": 9489 }, { "epoch": 0.26, "learning_rate": 0.0017459879826412178, "loss": 2.239, "step": 9490 }, { "epoch": 0.26, "learning_rate": 0.0017459300152459353, "loss": 2.3775, "step": 9491 }, { "epoch": 0.26, "learning_rate": 0.0017458720421996202, "loss": 2.9466, "step": 9492 }, { "epoch": 0.26, "learning_rate": 0.0017458140635027118, "loss": 2.2009, "step": 9493 }, { "epoch": 0.26, "learning_rate": 0.0017457560791556497, "loss": 2.3388, "step": 9494 }, { "epoch": 0.26, "learning_rate": 0.0017456980891588727, "loss": 2.4159, "step": 9495 }, { "epoch": 0.26, "learning_rate": 0.0017456400935128202, "loss": 2.3758, "step": 9496 }, { "epoch": 0.26, "learning_rate": 0.0017455820922179317, "loss": 2.5798, "step": 9497 }, { "epoch": 0.26, "learning_rate": 0.0017455240852746468, "loss": 2.3121, "step": 9498 }, { "epoch": 0.26, "learning_rate": 0.0017454660726834046, "loss": 2.5009, "step": 9499 }, { "epoch": 0.26, "learning_rate": 0.0017454080544446447, "loss": 2.8066, "step": 9500 }, { "epoch": 0.26, "learning_rate": 0.0017453500305588065, "loss": 2.6801, "step": 9501 }, { "epoch": 0.26, "learning_rate": 0.0017452920010263297, "loss": 2.513, "step": 9502 }, { "epoch": 0.26, "learning_rate": 0.0017452339658476541, "loss": 2.5331, "step": 9503 }, { "epoch": 0.26, "learning_rate": 0.0017451759250232195, "loss": 2.7345, "step": 9504 }, { "epoch": 0.26, "learning_rate": 0.0017451178785534648, "loss": 2.4279, "step": 9505 }, { "epoch": 0.26, "learning_rate": 0.0017450598264388308, "loss": 2.3668, "step": 9506 }, { "epoch": 0.26, "learning_rate": 0.001745001768679756, "loss": 2.4766, "step": 9507 }, { "epoch": 0.26, "learning_rate": 0.0017449437052766818, "loss": 2.4869, "step": 9508 }, { "epoch": 0.26, "learning_rate": 0.0017448856362300468, "loss": 3.0146, "step": 9509 }, { "epoch": 0.26, "learning_rate": 0.0017448275615402915, "loss": 2.6045, "step": 9510 }, { "epoch": 0.26, "learning_rate": 0.0017447694812078556, "loss": 2.8734, "step": 9511 }, { "epoch": 0.26, "learning_rate": 0.0017447113952331797, "loss": 2.491, "step": 9512 }, { "epoch": 0.26, "learning_rate": 0.0017446533036167028, "loss": 2.5885, "step": 9513 }, { "epoch": 0.26, "learning_rate": 0.0017445952063588662, "loss": 2.5863, "step": 9514 }, { "epoch": 0.26, "learning_rate": 0.001744537103460109, "loss": 2.6133, "step": 9515 }, { "epoch": 0.26, "learning_rate": 0.0017444789949208719, "loss": 2.7906, "step": 9516 }, { "epoch": 0.26, "learning_rate": 0.001744420880741595, "loss": 2.6235, "step": 9517 }, { "epoch": 0.26, "learning_rate": 0.0017443627609227189, "loss": 2.6179, "step": 9518 }, { "epoch": 0.26, "learning_rate": 0.0017443046354646834, "loss": 2.4213, "step": 9519 }, { "epoch": 0.26, "learning_rate": 0.0017442465043679292, "loss": 2.7416, "step": 9520 }, { "epoch": 0.26, "learning_rate": 0.0017441883676328964, "loss": 2.4631, "step": 9521 }, { "epoch": 0.26, "learning_rate": 0.0017441302252600255, "loss": 2.5274, "step": 9522 }, { "epoch": 0.26, "learning_rate": 0.001744072077249757, "loss": 2.5431, "step": 9523 }, { "epoch": 0.26, "learning_rate": 0.0017440139236025317, "loss": 2.6939, "step": 9524 }, { "epoch": 0.26, "learning_rate": 0.0017439557643187898, "loss": 2.5428, "step": 9525 }, { "epoch": 0.26, "learning_rate": 0.0017438975993989724, "loss": 2.9363, "step": 9526 }, { "epoch": 0.26, "learning_rate": 0.0017438394288435194, "loss": 2.3256, "step": 9527 }, { "epoch": 0.26, "learning_rate": 0.0017437812526528717, "loss": 2.2931, "step": 9528 }, { "epoch": 0.26, "learning_rate": 0.0017437230708274708, "loss": 2.9577, "step": 9529 }, { "epoch": 0.26, "learning_rate": 0.0017436648833677561, "loss": 2.4897, "step": 9530 }, { "epoch": 0.26, "learning_rate": 0.0017436066902741696, "loss": 2.4889, "step": 9531 }, { "epoch": 0.26, "learning_rate": 0.001743548491547152, "loss": 2.4853, "step": 9532 }, { "epoch": 0.26, "learning_rate": 0.001743490287187144, "loss": 2.6561, "step": 9533 }, { "epoch": 0.26, "learning_rate": 0.001743432077194586, "loss": 2.881, "step": 9534 }, { "epoch": 0.26, "learning_rate": 0.0017433738615699197, "loss": 2.9627, "step": 9535 }, { "epoch": 0.26, "learning_rate": 0.0017433156403135858, "loss": 2.9778, "step": 9536 }, { "epoch": 0.26, "learning_rate": 0.0017432574134260256, "loss": 2.6239, "step": 9537 }, { "epoch": 0.26, "learning_rate": 0.0017431991809076803, "loss": 2.6022, "step": 9538 }, { "epoch": 0.26, "learning_rate": 0.001743140942758991, "loss": 2.785, "step": 9539 }, { "epoch": 0.26, "learning_rate": 0.0017430826989803983, "loss": 2.669, "step": 9540 }, { "epoch": 0.26, "learning_rate": 0.0017430244495723443, "loss": 2.6005, "step": 9541 }, { "epoch": 0.26, "learning_rate": 0.0017429661945352697, "loss": 2.5103, "step": 9542 }, { "epoch": 0.26, "learning_rate": 0.001742907933869616, "loss": 2.7173, "step": 9543 }, { "epoch": 0.26, "learning_rate": 0.001742849667575825, "loss": 2.3149, "step": 9544 }, { "epoch": 0.26, "learning_rate": 0.0017427913956543372, "loss": 2.4705, "step": 9545 }, { "epoch": 0.26, "learning_rate": 0.001742733118105595, "loss": 2.8459, "step": 9546 }, { "epoch": 0.26, "learning_rate": 0.0017426748349300394, "loss": 2.2151, "step": 9547 }, { "epoch": 0.26, "learning_rate": 0.0017426165461281121, "loss": 3.1416, "step": 9548 }, { "epoch": 0.26, "learning_rate": 0.0017425582517002543, "loss": 2.7692, "step": 9549 }, { "epoch": 0.26, "learning_rate": 0.001742499951646908, "loss": 2.7705, "step": 9550 }, { "epoch": 0.26, "learning_rate": 0.001742441645968515, "loss": 2.6341, "step": 9551 }, { "epoch": 0.26, "learning_rate": 0.001742383334665517, "loss": 2.1909, "step": 9552 }, { "epoch": 0.26, "learning_rate": 0.0017423250177383551, "loss": 2.6326, "step": 9553 }, { "epoch": 0.26, "learning_rate": 0.001742266695187472, "loss": 2.9448, "step": 9554 }, { "epoch": 0.26, "learning_rate": 0.001742208367013309, "loss": 3.1172, "step": 9555 }, { "epoch": 0.26, "learning_rate": 0.0017421500332163078, "loss": 2.2695, "step": 9556 }, { "epoch": 0.26, "learning_rate": 0.0017420916937969108, "loss": 2.4934, "step": 9557 }, { "epoch": 0.26, "learning_rate": 0.0017420333487555603, "loss": 2.5109, "step": 9558 }, { "epoch": 0.26, "learning_rate": 0.0017419749980926971, "loss": 2.6459, "step": 9559 }, { "epoch": 0.26, "learning_rate": 0.0017419166418087642, "loss": 2.72, "step": 9560 }, { "epoch": 0.26, "learning_rate": 0.0017418582799042035, "loss": 2.519, "step": 9561 }, { "epoch": 0.26, "learning_rate": 0.0017417999123794572, "loss": 2.8934, "step": 9562 }, { "epoch": 0.26, "learning_rate": 0.0017417415392349674, "loss": 2.5287, "step": 9563 }, { "epoch": 0.26, "learning_rate": 0.001741683160471176, "loss": 2.5846, "step": 9564 }, { "epoch": 0.26, "learning_rate": 0.001741624776088526, "loss": 2.4697, "step": 9565 }, { "epoch": 0.26, "learning_rate": 0.001741566386087459, "loss": 3.1441, "step": 9566 }, { "epoch": 0.26, "learning_rate": 0.001741507990468418, "loss": 2.7625, "step": 9567 }, { "epoch": 0.26, "learning_rate": 0.0017414495892318445, "loss": 2.5811, "step": 9568 }, { "epoch": 0.26, "learning_rate": 0.0017413911823781817, "loss": 2.9071, "step": 9569 }, { "epoch": 0.26, "learning_rate": 0.001741332769907872, "loss": 2.8584, "step": 9570 }, { "epoch": 0.26, "learning_rate": 0.0017412743518213575, "loss": 2.9086, "step": 9571 }, { "epoch": 0.26, "learning_rate": 0.001741215928119081, "loss": 2.5473, "step": 9572 }, { "epoch": 0.26, "learning_rate": 0.0017411574988014857, "loss": 2.5928, "step": 9573 }, { "epoch": 0.26, "learning_rate": 0.0017410990638690135, "loss": 2.47, "step": 9574 }, { "epoch": 0.26, "learning_rate": 0.0017410406233221067, "loss": 2.3929, "step": 9575 }, { "epoch": 0.26, "learning_rate": 0.0017409821771612092, "loss": 2.7334, "step": 9576 }, { "epoch": 0.26, "learning_rate": 0.0017409237253867631, "loss": 2.6169, "step": 9577 }, { "epoch": 0.26, "learning_rate": 0.0017408652679992112, "loss": 2.3444, "step": 9578 }, { "epoch": 0.26, "learning_rate": 0.0017408068049989964, "loss": 2.6371, "step": 9579 }, { "epoch": 0.26, "learning_rate": 0.0017407483363865621, "loss": 2.8875, "step": 9580 }, { "epoch": 0.26, "learning_rate": 0.0017406898621623505, "loss": 2.4862, "step": 9581 }, { "epoch": 0.26, "learning_rate": 0.001740631382326805, "loss": 2.0965, "step": 9582 }, { "epoch": 0.26, "learning_rate": 0.0017405728968803685, "loss": 2.4829, "step": 9583 }, { "epoch": 0.26, "learning_rate": 0.0017405144058234843, "loss": 2.2725, "step": 9584 }, { "epoch": 0.26, "learning_rate": 0.0017404559091565952, "loss": 2.8604, "step": 9585 }, { "epoch": 0.26, "learning_rate": 0.0017403974068801445, "loss": 2.6078, "step": 9586 }, { "epoch": 0.26, "learning_rate": 0.0017403388989945757, "loss": 2.2034, "step": 9587 }, { "epoch": 0.26, "learning_rate": 0.0017402803855003316, "loss": 2.4076, "step": 9588 }, { "epoch": 0.26, "learning_rate": 0.0017402218663978553, "loss": 2.8097, "step": 9589 }, { "epoch": 0.26, "learning_rate": 0.001740163341687591, "loss": 2.6343, "step": 9590 }, { "epoch": 0.26, "learning_rate": 0.001740104811369981, "loss": 2.607, "step": 9591 }, { "epoch": 0.26, "learning_rate": 0.0017400462754454697, "loss": 2.5459, "step": 9592 }, { "epoch": 0.26, "learning_rate": 0.0017399877339145, "loss": 2.8717, "step": 9593 }, { "epoch": 0.26, "learning_rate": 0.0017399291867775158, "loss": 2.7762, "step": 9594 }, { "epoch": 0.26, "learning_rate": 0.0017398706340349599, "loss": 2.3656, "step": 9595 }, { "epoch": 0.26, "learning_rate": 0.0017398120756872766, "loss": 2.3907, "step": 9596 }, { "epoch": 0.26, "learning_rate": 0.0017397535117349094, "loss": 2.1705, "step": 9597 }, { "epoch": 0.26, "learning_rate": 0.0017396949421783017, "loss": 2.3329, "step": 9598 }, { "epoch": 0.26, "learning_rate": 0.0017396363670178971, "loss": 2.9451, "step": 9599 }, { "epoch": 0.26, "learning_rate": 0.0017395777862541399, "loss": 2.9192, "step": 9600 }, { "epoch": 0.26, "learning_rate": 0.0017395191998874737, "loss": 2.4198, "step": 9601 }, { "epoch": 0.26, "learning_rate": 0.0017394606079183421, "loss": 2.6482, "step": 9602 }, { "epoch": 0.26, "learning_rate": 0.0017394020103471892, "loss": 2.6955, "step": 9603 }, { "epoch": 0.26, "learning_rate": 0.0017393434071744588, "loss": 2.7648, "step": 9604 }, { "epoch": 0.26, "learning_rate": 0.001739284798400595, "loss": 2.4454, "step": 9605 }, { "epoch": 0.26, "learning_rate": 0.0017392261840260418, "loss": 2.8003, "step": 9606 }, { "epoch": 0.26, "learning_rate": 0.001739167564051243, "loss": 2.7655, "step": 9607 }, { "epoch": 0.26, "learning_rate": 0.001739108938476643, "loss": 2.9793, "step": 9608 }, { "epoch": 0.26, "learning_rate": 0.0017390503073026857, "loss": 2.3409, "step": 9609 }, { "epoch": 0.26, "learning_rate": 0.0017389916705298158, "loss": 2.5804, "step": 9610 }, { "epoch": 0.26, "learning_rate": 0.0017389330281584769, "loss": 2.7932, "step": 9611 }, { "epoch": 0.26, "learning_rate": 0.0017388743801891131, "loss": 2.8571, "step": 9612 }, { "epoch": 0.26, "learning_rate": 0.0017388157266221697, "loss": 2.8326, "step": 9613 }, { "epoch": 0.26, "learning_rate": 0.00173875706745809, "loss": 2.7119, "step": 9614 }, { "epoch": 0.26, "learning_rate": 0.001738698402697319, "loss": 2.7576, "step": 9615 }, { "epoch": 0.26, "learning_rate": 0.001738639732340301, "loss": 2.4996, "step": 9616 }, { "epoch": 0.26, "learning_rate": 0.0017385810563874805, "loss": 3.2323, "step": 9617 }, { "epoch": 0.26, "learning_rate": 0.0017385223748393017, "loss": 2.6598, "step": 9618 }, { "epoch": 0.26, "learning_rate": 0.0017384636876962096, "loss": 2.9249, "step": 9619 }, { "epoch": 0.26, "learning_rate": 0.0017384049949586485, "loss": 2.9144, "step": 9620 }, { "epoch": 0.26, "learning_rate": 0.0017383462966270634, "loss": 2.747, "step": 9621 }, { "epoch": 0.26, "learning_rate": 0.0017382875927018987, "loss": 2.8796, "step": 9622 }, { "epoch": 0.26, "learning_rate": 0.001738228883183599, "loss": 2.5989, "step": 9623 }, { "epoch": 0.26, "learning_rate": 0.0017381701680726095, "loss": 2.7939, "step": 9624 }, { "epoch": 0.26, "learning_rate": 0.001738111447369375, "loss": 2.6547, "step": 9625 }, { "epoch": 0.26, "learning_rate": 0.0017380527210743395, "loss": 2.7112, "step": 9626 }, { "epoch": 0.26, "learning_rate": 0.0017379939891879487, "loss": 2.5242, "step": 9627 }, { "epoch": 0.26, "learning_rate": 0.0017379352517106477, "loss": 2.5031, "step": 9628 }, { "epoch": 0.26, "learning_rate": 0.0017378765086428812, "loss": 2.8631, "step": 9629 }, { "epoch": 0.26, "learning_rate": 0.0017378177599850937, "loss": 2.6819, "step": 9630 }, { "epoch": 0.26, "learning_rate": 0.0017377590057377312, "loss": 2.4872, "step": 9631 }, { "epoch": 0.26, "learning_rate": 0.0017377002459012384, "loss": 2.6281, "step": 9632 }, { "epoch": 0.26, "learning_rate": 0.00173764148047606, "loss": 2.5561, "step": 9633 }, { "epoch": 0.26, "learning_rate": 0.001737582709462642, "loss": 2.8972, "step": 9634 }, { "epoch": 0.26, "learning_rate": 0.001737523932861429, "loss": 2.9829, "step": 9635 }, { "epoch": 0.26, "learning_rate": 0.0017374651506728669, "loss": 2.8903, "step": 9636 }, { "epoch": 0.26, "learning_rate": 0.0017374063628974004, "loss": 2.5804, "step": 9637 }, { "epoch": 0.26, "learning_rate": 0.001737347569535475, "loss": 2.6394, "step": 9638 }, { "epoch": 0.26, "learning_rate": 0.0017372887705875365, "loss": 2.6518, "step": 9639 }, { "epoch": 0.26, "learning_rate": 0.0017372299660540298, "loss": 2.6907, "step": 9640 }, { "epoch": 0.26, "learning_rate": 0.0017371711559354011, "loss": 2.288, "step": 9641 }, { "epoch": 0.26, "learning_rate": 0.0017371123402320952, "loss": 2.2202, "step": 9642 }, { "epoch": 0.26, "learning_rate": 0.0017370535189445582, "loss": 2.5058, "step": 9643 }, { "epoch": 0.26, "learning_rate": 0.0017369946920732353, "loss": 2.335, "step": 9644 }, { "epoch": 0.26, "learning_rate": 0.0017369358596185725, "loss": 2.3583, "step": 9645 }, { "epoch": 0.26, "learning_rate": 0.0017368770215810154, "loss": 2.4167, "step": 9646 }, { "epoch": 0.26, "learning_rate": 0.0017368181779610096, "loss": 2.5741, "step": 9647 }, { "epoch": 0.26, "learning_rate": 0.0017367593287590012, "loss": 2.7013, "step": 9648 }, { "epoch": 0.26, "learning_rate": 0.0017367004739754358, "loss": 2.4502, "step": 9649 }, { "epoch": 0.26, "learning_rate": 0.0017366416136107591, "loss": 2.459, "step": 9650 }, { "epoch": 0.26, "learning_rate": 0.0017365827476654174, "loss": 2.8423, "step": 9651 }, { "epoch": 0.26, "learning_rate": 0.0017365238761398566, "loss": 2.467, "step": 9652 }, { "epoch": 0.26, "learning_rate": 0.0017364649990345225, "loss": 2.5046, "step": 9653 }, { "epoch": 0.26, "learning_rate": 0.0017364061163498612, "loss": 2.7537, "step": 9654 }, { "epoch": 0.26, "learning_rate": 0.0017363472280863188, "loss": 2.5082, "step": 9655 }, { "epoch": 0.26, "learning_rate": 0.0017362883342443417, "loss": 3.0448, "step": 9656 }, { "epoch": 0.26, "learning_rate": 0.0017362294348243754, "loss": 2.9042, "step": 9657 }, { "epoch": 0.26, "learning_rate": 0.0017361705298268668, "loss": 2.105, "step": 9658 }, { "epoch": 0.26, "learning_rate": 0.0017361116192522617, "loss": 2.6769, "step": 9659 }, { "epoch": 0.26, "learning_rate": 0.0017360527031010068, "loss": 2.6469, "step": 9660 }, { "epoch": 0.26, "learning_rate": 0.001735993781373548, "loss": 2.5967, "step": 9661 }, { "epoch": 0.26, "learning_rate": 0.0017359348540703322, "loss": 2.6353, "step": 9662 }, { "epoch": 0.26, "learning_rate": 0.0017358759211918051, "loss": 2.495, "step": 9663 }, { "epoch": 0.26, "learning_rate": 0.0017358169827384141, "loss": 2.3092, "step": 9664 }, { "epoch": 0.26, "learning_rate": 0.0017357580387106046, "loss": 2.6769, "step": 9665 }, { "epoch": 0.26, "learning_rate": 0.001735699089108824, "loss": 2.9038, "step": 9666 }, { "epoch": 0.26, "learning_rate": 0.0017356401339335187, "loss": 2.6206, "step": 9667 }, { "epoch": 0.26, "learning_rate": 0.0017355811731851354, "loss": 2.38, "step": 9668 }, { "epoch": 0.26, "learning_rate": 0.0017355222068641204, "loss": 2.6471, "step": 9669 }, { "epoch": 0.26, "learning_rate": 0.0017354632349709208, "loss": 2.4478, "step": 9670 }, { "epoch": 0.26, "learning_rate": 0.0017354042575059832, "loss": 2.7337, "step": 9671 }, { "epoch": 0.26, "learning_rate": 0.0017353452744697541, "loss": 2.9968, "step": 9672 }, { "epoch": 0.26, "learning_rate": 0.001735286285862681, "loss": 2.5563, "step": 9673 }, { "epoch": 0.26, "learning_rate": 0.0017352272916852103, "loss": 2.1596, "step": 9674 }, { "epoch": 0.26, "learning_rate": 0.0017351682919377893, "loss": 2.8439, "step": 9675 }, { "epoch": 0.26, "learning_rate": 0.0017351092866208647, "loss": 2.8852, "step": 9676 }, { "epoch": 0.26, "learning_rate": 0.0017350502757348834, "loss": 2.5349, "step": 9677 }, { "epoch": 0.26, "learning_rate": 0.0017349912592802927, "loss": 2.9065, "step": 9678 }, { "epoch": 0.26, "learning_rate": 0.0017349322372575396, "loss": 2.5802, "step": 9679 }, { "epoch": 0.26, "learning_rate": 0.0017348732096670713, "loss": 2.3355, "step": 9680 }, { "epoch": 0.26, "learning_rate": 0.001734814176509335, "loss": 2.5345, "step": 9681 }, { "epoch": 0.26, "learning_rate": 0.0017347551377847779, "loss": 2.2221, "step": 9682 }, { "epoch": 0.26, "learning_rate": 0.0017346960934938472, "loss": 2.8936, "step": 9683 }, { "epoch": 0.26, "learning_rate": 0.0017346370436369903, "loss": 2.5287, "step": 9684 }, { "epoch": 0.26, "learning_rate": 0.0017345779882146544, "loss": 2.7438, "step": 9685 }, { "epoch": 0.26, "learning_rate": 0.001734518927227287, "loss": 2.5163, "step": 9686 }, { "epoch": 0.26, "learning_rate": 0.0017344598606753355, "loss": 2.7567, "step": 9687 }, { "epoch": 0.26, "learning_rate": 0.0017344007885592473, "loss": 2.3105, "step": 9688 }, { "epoch": 0.26, "learning_rate": 0.0017343417108794704, "loss": 2.5396, "step": 9689 }, { "epoch": 0.26, "learning_rate": 0.0017342826276364517, "loss": 2.7803, "step": 9690 }, { "epoch": 0.26, "learning_rate": 0.0017342235388306392, "loss": 2.145, "step": 9691 }, { "epoch": 0.26, "learning_rate": 0.0017341644444624803, "loss": 2.5986, "step": 9692 }, { "epoch": 0.26, "learning_rate": 0.0017341053445324229, "loss": 2.3002, "step": 9693 }, { "epoch": 0.26, "learning_rate": 0.0017340462390409146, "loss": 2.5612, "step": 9694 }, { "epoch": 0.26, "learning_rate": 0.0017339871279884035, "loss": 2.8549, "step": 9695 }, { "epoch": 0.26, "learning_rate": 0.001733928011375337, "loss": 2.7547, "step": 9696 }, { "epoch": 0.26, "learning_rate": 0.0017338688892021628, "loss": 2.476, "step": 9697 }, { "epoch": 0.26, "learning_rate": 0.0017338097614693294, "loss": 2.4141, "step": 9698 }, { "epoch": 0.26, "learning_rate": 0.0017337506281772841, "loss": 2.9403, "step": 9699 }, { "epoch": 0.26, "learning_rate": 0.0017336914893264757, "loss": 2.3564, "step": 9700 }, { "epoch": 0.26, "learning_rate": 0.0017336323449173518, "loss": 2.451, "step": 9701 }, { "epoch": 0.26, "learning_rate": 0.0017335731949503599, "loss": 2.4676, "step": 9702 }, { "epoch": 0.26, "learning_rate": 0.0017335140394259489, "loss": 2.1424, "step": 9703 }, { "epoch": 0.26, "learning_rate": 0.0017334548783445665, "loss": 3.3388, "step": 9704 }, { "epoch": 0.26, "learning_rate": 0.0017333957117066615, "loss": 2.8682, "step": 9705 }, { "epoch": 0.26, "learning_rate": 0.0017333365395126813, "loss": 2.5249, "step": 9706 }, { "epoch": 0.26, "learning_rate": 0.0017332773617630749, "loss": 2.4197, "step": 9707 }, { "epoch": 0.26, "learning_rate": 0.00173321817845829, "loss": 2.1135, "step": 9708 }, { "epoch": 0.26, "learning_rate": 0.0017331589895987754, "loss": 2.96, "step": 9709 }, { "epoch": 0.26, "learning_rate": 0.0017330997951849794, "loss": 2.8389, "step": 9710 }, { "epoch": 0.26, "learning_rate": 0.0017330405952173502, "loss": 2.4045, "step": 9711 }, { "epoch": 0.26, "learning_rate": 0.0017329813896963366, "loss": 2.4444, "step": 9712 }, { "epoch": 0.26, "learning_rate": 0.0017329221786223873, "loss": 2.481, "step": 9713 }, { "epoch": 0.26, "learning_rate": 0.0017328629619959503, "loss": 2.5199, "step": 9714 }, { "epoch": 0.26, "learning_rate": 0.0017328037398174749, "loss": 2.6715, "step": 9715 }, { "epoch": 0.26, "learning_rate": 0.001732744512087409, "loss": 2.7644, "step": 9716 }, { "epoch": 0.26, "learning_rate": 0.0017326852788062017, "loss": 2.2942, "step": 9717 }, { "epoch": 0.26, "learning_rate": 0.001732626039974302, "loss": 2.4751, "step": 9718 }, { "epoch": 0.26, "learning_rate": 0.0017325667955921582, "loss": 2.216, "step": 9719 }, { "epoch": 0.26, "learning_rate": 0.0017325075456602194, "loss": 2.8063, "step": 9720 }, { "epoch": 0.26, "learning_rate": 0.0017324482901789344, "loss": 2.6146, "step": 9721 }, { "epoch": 0.26, "learning_rate": 0.001732389029148752, "loss": 2.4336, "step": 9722 }, { "epoch": 0.26, "learning_rate": 0.0017323297625701213, "loss": 2.5775, "step": 9723 }, { "epoch": 0.26, "learning_rate": 0.0017322704904434913, "loss": 2.4724, "step": 9724 }, { "epoch": 0.26, "learning_rate": 0.001732211212769311, "loss": 2.6045, "step": 9725 }, { "epoch": 0.26, "learning_rate": 0.0017321519295480292, "loss": 2.5525, "step": 9726 }, { "epoch": 0.26, "learning_rate": 0.0017320926407800956, "loss": 2.5307, "step": 9727 }, { "epoch": 0.26, "learning_rate": 0.001732033346465959, "loss": 2.5472, "step": 9728 }, { "epoch": 0.26, "learning_rate": 0.0017319740466060685, "loss": 2.6522, "step": 9729 }, { "epoch": 0.26, "learning_rate": 0.0017319147412008739, "loss": 2.7401, "step": 9730 }, { "epoch": 0.26, "learning_rate": 0.0017318554302508233, "loss": 2.788, "step": 9731 }, { "epoch": 0.26, "learning_rate": 0.0017317961137563675, "loss": 2.4276, "step": 9732 }, { "epoch": 0.26, "learning_rate": 0.0017317367917179546, "loss": 2.3699, "step": 9733 }, { "epoch": 0.26, "learning_rate": 0.0017316774641360352, "loss": 2.7338, "step": 9734 }, { "epoch": 0.26, "learning_rate": 0.0017316181310110578, "loss": 2.5295, "step": 9735 }, { "epoch": 0.26, "learning_rate": 0.0017315587923434723, "loss": 2.3072, "step": 9736 }, { "epoch": 0.26, "learning_rate": 0.001731499448133728, "loss": 2.7155, "step": 9737 }, { "epoch": 0.26, "learning_rate": 0.0017314400983822749, "loss": 2.3459, "step": 9738 }, { "epoch": 0.26, "learning_rate": 0.0017313807430895624, "loss": 2.8021, "step": 9739 }, { "epoch": 0.26, "learning_rate": 0.00173132138225604, "loss": 2.3075, "step": 9740 }, { "epoch": 0.26, "learning_rate": 0.0017312620158821575, "loss": 2.5525, "step": 9741 }, { "epoch": 0.26, "learning_rate": 0.001731202643968365, "loss": 2.5977, "step": 9742 }, { "epoch": 0.26, "learning_rate": 0.0017311432665151117, "loss": 2.7639, "step": 9743 }, { "epoch": 0.26, "learning_rate": 0.0017310838835228478, "loss": 2.4511, "step": 9744 }, { "epoch": 0.26, "learning_rate": 0.0017310244949920231, "loss": 2.5358, "step": 9745 }, { "epoch": 0.26, "learning_rate": 0.0017309651009230875, "loss": 2.5888, "step": 9746 }, { "epoch": 0.26, "learning_rate": 0.001730905701316491, "loss": 2.4229, "step": 9747 }, { "epoch": 0.26, "learning_rate": 0.001730846296172684, "loss": 2.6732, "step": 9748 }, { "epoch": 0.26, "learning_rate": 0.0017307868854921154, "loss": 2.763, "step": 9749 }, { "epoch": 0.26, "learning_rate": 0.0017307274692752363, "loss": 2.6077, "step": 9750 }, { "epoch": 0.26, "learning_rate": 0.0017306680475224967, "loss": 2.754, "step": 9751 }, { "epoch": 0.26, "learning_rate": 0.0017306086202343468, "loss": 2.6405, "step": 9752 }, { "epoch": 0.26, "learning_rate": 0.0017305491874112363, "loss": 2.6118, "step": 9753 }, { "epoch": 0.26, "learning_rate": 0.0017304897490536156, "loss": 2.1738, "step": 9754 }, { "epoch": 0.26, "learning_rate": 0.0017304303051619355, "loss": 2.5827, "step": 9755 }, { "epoch": 0.26, "learning_rate": 0.0017303708557366458, "loss": 3.1146, "step": 9756 }, { "epoch": 0.26, "learning_rate": 0.0017303114007781969, "loss": 2.8155, "step": 9757 }, { "epoch": 0.26, "learning_rate": 0.0017302519402870398, "loss": 2.6567, "step": 9758 }, { "epoch": 0.26, "learning_rate": 0.0017301924742636242, "loss": 2.7894, "step": 9759 }, { "epoch": 0.26, "learning_rate": 0.001730133002708401, "loss": 2.9177, "step": 9760 }, { "epoch": 0.26, "learning_rate": 0.001730073525621821, "loss": 2.4421, "step": 9761 }, { "epoch": 0.26, "learning_rate": 0.0017300140430043342, "loss": 2.7383, "step": 9762 }, { "epoch": 0.26, "learning_rate": 0.0017299545548563916, "loss": 2.442, "step": 9763 }, { "epoch": 0.26, "learning_rate": 0.001729895061178444, "loss": 2.9957, "step": 9764 }, { "epoch": 0.26, "learning_rate": 0.0017298355619709419, "loss": 2.4371, "step": 9765 }, { "epoch": 0.26, "learning_rate": 0.0017297760572343357, "loss": 2.4277, "step": 9766 }, { "epoch": 0.26, "learning_rate": 0.001729716546969077, "loss": 2.4604, "step": 9767 }, { "epoch": 0.26, "learning_rate": 0.0017296570311756158, "loss": 2.5405, "step": 9768 }, { "epoch": 0.26, "learning_rate": 0.0017295975098544037, "loss": 2.5095, "step": 9769 }, { "epoch": 0.26, "learning_rate": 0.001729537983005891, "loss": 2.9001, "step": 9770 }, { "epoch": 0.26, "learning_rate": 0.0017294784506305292, "loss": 2.4229, "step": 9771 }, { "epoch": 0.26, "learning_rate": 0.001729418912728769, "loss": 2.4595, "step": 9772 }, { "epoch": 0.26, "learning_rate": 0.0017293593693010617, "loss": 2.6852, "step": 9773 }, { "epoch": 0.26, "learning_rate": 0.001729299820347858, "loss": 2.7543, "step": 9774 }, { "epoch": 0.26, "learning_rate": 0.001729240265869609, "loss": 2.6823, "step": 9775 }, { "epoch": 0.26, "learning_rate": 0.0017291807058667668, "loss": 3.0783, "step": 9776 }, { "epoch": 0.26, "learning_rate": 0.0017291211403397814, "loss": 2.7418, "step": 9777 }, { "epoch": 0.26, "learning_rate": 0.0017290615692891048, "loss": 2.644, "step": 9778 }, { "epoch": 0.26, "learning_rate": 0.001729001992715188, "loss": 2.2515, "step": 9779 }, { "epoch": 0.26, "learning_rate": 0.0017289424106184824, "loss": 2.1637, "step": 9780 }, { "epoch": 0.26, "learning_rate": 0.0017288828229994398, "loss": 2.6757, "step": 9781 }, { "epoch": 0.26, "learning_rate": 0.0017288232298585107, "loss": 2.9982, "step": 9782 }, { "epoch": 0.26, "learning_rate": 0.0017287636311961473, "loss": 2.6835, "step": 9783 }, { "epoch": 0.26, "learning_rate": 0.0017287040270128012, "loss": 2.4599, "step": 9784 }, { "epoch": 0.26, "learning_rate": 0.0017286444173089236, "loss": 2.5777, "step": 9785 }, { "epoch": 0.26, "learning_rate": 0.0017285848020849657, "loss": 2.9419, "step": 9786 }, { "epoch": 0.26, "learning_rate": 0.0017285251813413801, "loss": 3.0168, "step": 9787 }, { "epoch": 0.26, "learning_rate": 0.0017284655550786176, "loss": 2.7735, "step": 9788 }, { "epoch": 0.26, "learning_rate": 0.0017284059232971305, "loss": 2.4711, "step": 9789 }, { "epoch": 0.26, "learning_rate": 0.0017283462859973705, "loss": 2.3537, "step": 9790 }, { "epoch": 0.26, "learning_rate": 0.001728286643179789, "loss": 2.1647, "step": 9791 }, { "epoch": 0.26, "learning_rate": 0.0017282269948448383, "loss": 2.6968, "step": 9792 }, { "epoch": 0.26, "learning_rate": 0.0017281673409929698, "loss": 2.394, "step": 9793 }, { "epoch": 0.26, "learning_rate": 0.0017281076816246359, "loss": 2.6135, "step": 9794 }, { "epoch": 0.26, "learning_rate": 0.0017280480167402882, "loss": 2.3149, "step": 9795 }, { "epoch": 0.26, "learning_rate": 0.0017279883463403793, "loss": 2.597, "step": 9796 }, { "epoch": 0.26, "learning_rate": 0.0017279286704253605, "loss": 2.3934, "step": 9797 }, { "epoch": 0.26, "learning_rate": 0.0017278689889956844, "loss": 2.2787, "step": 9798 }, { "epoch": 0.26, "learning_rate": 0.001727809302051803, "loss": 2.664, "step": 9799 }, { "epoch": 0.26, "learning_rate": 0.0017277496095941683, "loss": 2.4998, "step": 9800 }, { "epoch": 0.26, "learning_rate": 0.0017276899116232328, "loss": 2.7942, "step": 9801 }, { "epoch": 0.26, "learning_rate": 0.0017276302081394483, "loss": 2.6915, "step": 9802 }, { "epoch": 0.26, "learning_rate": 0.0017275704991432676, "loss": 2.5298, "step": 9803 }, { "epoch": 0.26, "learning_rate": 0.0017275107846351431, "loss": 2.7278, "step": 9804 }, { "epoch": 0.26, "learning_rate": 0.0017274510646155265, "loss": 2.4269, "step": 9805 }, { "epoch": 0.26, "learning_rate": 0.0017273913390848713, "loss": 3.1393, "step": 9806 }, { "epoch": 0.26, "learning_rate": 0.001727331608043629, "loss": 2.7879, "step": 9807 }, { "epoch": 0.26, "learning_rate": 0.0017272718714922526, "loss": 2.5619, "step": 9808 }, { "epoch": 0.26, "learning_rate": 0.0017272121294311944, "loss": 2.5856, "step": 9809 }, { "epoch": 0.26, "learning_rate": 0.001727152381860907, "loss": 2.741, "step": 9810 }, { "epoch": 0.26, "learning_rate": 0.0017270926287818434, "loss": 2.5221, "step": 9811 }, { "epoch": 0.26, "learning_rate": 0.001727032870194456, "loss": 2.5243, "step": 9812 }, { "epoch": 0.26, "learning_rate": 0.0017269731060991975, "loss": 2.5775, "step": 9813 }, { "epoch": 0.26, "learning_rate": 0.0017269133364965208, "loss": 2.6329, "step": 9814 }, { "epoch": 0.26, "learning_rate": 0.0017268535613868786, "loss": 2.4145, "step": 9815 }, { "epoch": 0.26, "learning_rate": 0.0017267937807707238, "loss": 2.9348, "step": 9816 }, { "epoch": 0.26, "learning_rate": 0.0017267339946485092, "loss": 2.5011, "step": 9817 }, { "epoch": 0.26, "learning_rate": 0.0017266742030206876, "loss": 2.8951, "step": 9818 }, { "epoch": 0.26, "learning_rate": 0.0017266144058877126, "loss": 2.4635, "step": 9819 }, { "epoch": 0.26, "learning_rate": 0.0017265546032500362, "loss": 2.2733, "step": 9820 }, { "epoch": 0.26, "learning_rate": 0.0017264947951081125, "loss": 2.4229, "step": 9821 }, { "epoch": 0.26, "learning_rate": 0.0017264349814623938, "loss": 2.4835, "step": 9822 }, { "epoch": 0.26, "learning_rate": 0.0017263751623133336, "loss": 2.7226, "step": 9823 }, { "epoch": 0.26, "learning_rate": 0.0017263153376613851, "loss": 2.6291, "step": 9824 }, { "epoch": 0.26, "learning_rate": 0.0017262555075070014, "loss": 2.5669, "step": 9825 }, { "epoch": 0.26, "learning_rate": 0.0017261956718506361, "loss": 2.5715, "step": 9826 }, { "epoch": 0.26, "learning_rate": 0.001726135830692742, "loss": 2.7471, "step": 9827 }, { "epoch": 0.26, "learning_rate": 0.0017260759840337725, "loss": 2.781, "step": 9828 }, { "epoch": 0.26, "learning_rate": 0.0017260161318741816, "loss": 2.8984, "step": 9829 }, { "epoch": 0.26, "learning_rate": 0.0017259562742144218, "loss": 2.8772, "step": 9830 }, { "epoch": 0.26, "learning_rate": 0.0017258964110549474, "loss": 2.4506, "step": 9831 }, { "epoch": 0.26, "learning_rate": 0.0017258365423962114, "loss": 2.5436, "step": 9832 }, { "epoch": 0.26, "learning_rate": 0.0017257766682386678, "loss": 3.1297, "step": 9833 }, { "epoch": 0.26, "learning_rate": 0.0017257167885827696, "loss": 2.627, "step": 9834 }, { "epoch": 0.26, "learning_rate": 0.0017256569034289708, "loss": 2.6031, "step": 9835 }, { "epoch": 0.26, "learning_rate": 0.0017255970127777252, "loss": 2.4706, "step": 9836 }, { "epoch": 0.26, "learning_rate": 0.0017255371166294863, "loss": 2.7803, "step": 9837 }, { "epoch": 0.26, "learning_rate": 0.0017254772149847076, "loss": 2.7189, "step": 9838 }, { "epoch": 0.26, "learning_rate": 0.0017254173078438434, "loss": 2.3197, "step": 9839 }, { "epoch": 0.26, "learning_rate": 0.0017253573952073476, "loss": 2.7704, "step": 9840 }, { "epoch": 0.26, "learning_rate": 0.0017252974770756734, "loss": 2.761, "step": 9841 }, { "epoch": 0.26, "learning_rate": 0.0017252375534492757, "loss": 2.4476, "step": 9842 }, { "epoch": 0.26, "learning_rate": 0.001725177624328608, "loss": 3.0603, "step": 9843 }, { "epoch": 0.26, "learning_rate": 0.0017251176897141239, "loss": 2.5379, "step": 9844 }, { "epoch": 0.26, "learning_rate": 0.0017250577496062778, "loss": 2.3812, "step": 9845 }, { "epoch": 0.26, "learning_rate": 0.001724997804005524, "loss": 2.1071, "step": 9846 }, { "epoch": 0.26, "learning_rate": 0.0017249378529123165, "loss": 2.9575, "step": 9847 }, { "epoch": 0.26, "learning_rate": 0.0017248778963271092, "loss": 2.7142, "step": 9848 }, { "epoch": 0.26, "learning_rate": 0.0017248179342503568, "loss": 2.7121, "step": 9849 }, { "epoch": 0.26, "learning_rate": 0.001724757966682513, "loss": 3.1312, "step": 9850 }, { "epoch": 0.26, "learning_rate": 0.0017246979936240327, "loss": 2.6261, "step": 9851 }, { "epoch": 0.26, "learning_rate": 0.00172463801507537, "loss": 2.6968, "step": 9852 }, { "epoch": 0.26, "learning_rate": 0.001724578031036979, "loss": 2.775, "step": 9853 }, { "epoch": 0.26, "learning_rate": 0.0017245180415093144, "loss": 2.438, "step": 9854 }, { "epoch": 0.26, "learning_rate": 0.001724458046492831, "loss": 2.313, "step": 9855 }, { "epoch": 0.26, "learning_rate": 0.0017243980459879828, "loss": 2.5597, "step": 9856 }, { "epoch": 0.26, "learning_rate": 0.0017243380399952245, "loss": 2.4953, "step": 9857 }, { "epoch": 0.26, "learning_rate": 0.0017242780285150103, "loss": 2.5247, "step": 9858 }, { "epoch": 0.26, "learning_rate": 0.0017242180115477957, "loss": 3.2465, "step": 9859 }, { "epoch": 0.26, "learning_rate": 0.0017241579890940348, "loss": 2.7753, "step": 9860 }, { "epoch": 0.27, "learning_rate": 0.0017240979611541825, "loss": 2.9641, "step": 9861 }, { "epoch": 0.27, "learning_rate": 0.0017240379277286934, "loss": 2.6553, "step": 9862 }, { "epoch": 0.27, "learning_rate": 0.0017239778888180225, "loss": 2.3881, "step": 9863 }, { "epoch": 0.27, "learning_rate": 0.0017239178444226244, "loss": 2.5759, "step": 9864 }, { "epoch": 0.27, "learning_rate": 0.0017238577945429543, "loss": 2.4398, "step": 9865 }, { "epoch": 0.27, "learning_rate": 0.001723797739179467, "loss": 2.7516, "step": 9866 }, { "epoch": 0.27, "learning_rate": 0.0017237376783326172, "loss": 2.7678, "step": 9867 }, { "epoch": 0.27, "learning_rate": 0.0017236776120028603, "loss": 2.4925, "step": 9868 }, { "epoch": 0.27, "learning_rate": 0.0017236175401906513, "loss": 2.3227, "step": 9869 }, { "epoch": 0.27, "learning_rate": 0.0017235574628964453, "loss": 2.6742, "step": 9870 }, { "epoch": 0.27, "learning_rate": 0.0017234973801206967, "loss": 2.5978, "step": 9871 }, { "epoch": 0.27, "learning_rate": 0.0017234372918638618, "loss": 2.4651, "step": 9872 }, { "epoch": 0.27, "learning_rate": 0.001723377198126395, "loss": 2.1554, "step": 9873 }, { "epoch": 0.27, "learning_rate": 0.0017233170989087523, "loss": 2.6782, "step": 9874 }, { "epoch": 0.27, "learning_rate": 0.0017232569942113884, "loss": 2.6293, "step": 9875 }, { "epoch": 0.27, "learning_rate": 0.0017231968840347588, "loss": 2.8345, "step": 9876 }, { "epoch": 0.27, "learning_rate": 0.0017231367683793186, "loss": 2.5605, "step": 9877 }, { "epoch": 0.27, "learning_rate": 0.001723076647245524, "loss": 2.3313, "step": 9878 }, { "epoch": 0.27, "learning_rate": 0.0017230165206338298, "loss": 2.2641, "step": 9879 }, { "epoch": 0.27, "learning_rate": 0.0017229563885446917, "loss": 2.6563, "step": 9880 }, { "epoch": 0.27, "learning_rate": 0.001722896250978565, "loss": 2.5046, "step": 9881 }, { "epoch": 0.27, "learning_rate": 0.001722836107935906, "loss": 2.7992, "step": 9882 }, { "epoch": 0.27, "learning_rate": 0.0017227759594171698, "loss": 2.3468, "step": 9883 }, { "epoch": 0.27, "learning_rate": 0.0017227158054228119, "loss": 2.5542, "step": 9884 }, { "epoch": 0.27, "learning_rate": 0.0017226556459532883, "loss": 2.3299, "step": 9885 }, { "epoch": 0.27, "learning_rate": 0.001722595481009055, "loss": 2.7686, "step": 9886 }, { "epoch": 0.27, "learning_rate": 0.0017225353105905672, "loss": 2.5945, "step": 9887 }, { "epoch": 0.27, "learning_rate": 0.0017224751346982812, "loss": 2.5046, "step": 9888 }, { "epoch": 0.27, "learning_rate": 0.0017224149533326526, "loss": 2.4687, "step": 9889 }, { "epoch": 0.27, "learning_rate": 0.0017223547664941376, "loss": 2.7727, "step": 9890 }, { "epoch": 0.27, "learning_rate": 0.0017222945741831922, "loss": 2.5645, "step": 9891 }, { "epoch": 0.27, "learning_rate": 0.001722234376400272, "loss": 3.1599, "step": 9892 }, { "epoch": 0.27, "learning_rate": 0.0017221741731458335, "loss": 2.5428, "step": 9893 }, { "epoch": 0.27, "learning_rate": 0.0017221139644203324, "loss": 2.8504, "step": 9894 }, { "epoch": 0.27, "learning_rate": 0.001722053750224225, "loss": 2.8469, "step": 9895 }, { "epoch": 0.27, "learning_rate": 0.0017219935305579678, "loss": 2.6121, "step": 9896 }, { "epoch": 0.27, "learning_rate": 0.0017219333054220164, "loss": 2.774, "step": 9897 }, { "epoch": 0.27, "learning_rate": 0.0017218730748168275, "loss": 2.7352, "step": 9898 }, { "epoch": 0.27, "learning_rate": 0.001721812838742857, "loss": 2.8674, "step": 9899 }, { "epoch": 0.27, "learning_rate": 0.0017217525972005614, "loss": 2.3967, "step": 9900 }, { "epoch": 0.27, "learning_rate": 0.0017216923501903974, "loss": 3.0808, "step": 9901 }, { "epoch": 0.27, "learning_rate": 0.001721632097712821, "loss": 2.5369, "step": 9902 }, { "epoch": 0.27, "learning_rate": 0.001721571839768289, "loss": 2.652, "step": 9903 }, { "epoch": 0.27, "learning_rate": 0.001721511576357258, "loss": 2.5948, "step": 9904 }, { "epoch": 0.27, "learning_rate": 0.001721451307480184, "loss": 2.5453, "step": 9905 }, { "epoch": 0.27, "learning_rate": 0.0017213910331375238, "loss": 2.9694, "step": 9906 }, { "epoch": 0.27, "learning_rate": 0.0017213307533297342, "loss": 2.5701, "step": 9907 }, { "epoch": 0.27, "learning_rate": 0.0017212704680572718, "loss": 2.455, "step": 9908 }, { "epoch": 0.27, "learning_rate": 0.0017212101773205932, "loss": 2.7028, "step": 9909 }, { "epoch": 0.27, "learning_rate": 0.0017211498811201555, "loss": 2.7526, "step": 9910 }, { "epoch": 0.27, "learning_rate": 0.001721089579456415, "loss": 2.8977, "step": 9911 }, { "epoch": 0.27, "learning_rate": 0.0017210292723298286, "loss": 2.9008, "step": 9912 }, { "epoch": 0.27, "learning_rate": 0.0017209689597408539, "loss": 2.8331, "step": 9913 }, { "epoch": 0.27, "learning_rate": 0.0017209086416899466, "loss": 2.6109, "step": 9914 }, { "epoch": 0.27, "learning_rate": 0.0017208483181775649, "loss": 2.472, "step": 9915 }, { "epoch": 0.27, "learning_rate": 0.0017207879892041649, "loss": 2.5245, "step": 9916 }, { "epoch": 0.27, "learning_rate": 0.001720727654770204, "loss": 2.4213, "step": 9917 }, { "epoch": 0.27, "learning_rate": 0.0017206673148761392, "loss": 2.9101, "step": 9918 }, { "epoch": 0.27, "learning_rate": 0.0017206069695224276, "loss": 2.2937, "step": 9919 }, { "epoch": 0.27, "learning_rate": 0.0017205466187095264, "loss": 2.7037, "step": 9920 }, { "epoch": 0.27, "learning_rate": 0.0017204862624378933, "loss": 2.8141, "step": 9921 }, { "epoch": 0.27, "learning_rate": 0.0017204259007079846, "loss": 2.6444, "step": 9922 }, { "epoch": 0.27, "learning_rate": 0.0017203655335202583, "loss": 2.3758, "step": 9923 }, { "epoch": 0.27, "learning_rate": 0.0017203051608751711, "loss": 2.5581, "step": 9924 }, { "epoch": 0.27, "learning_rate": 0.0017202447827731815, "loss": 2.3833, "step": 9925 }, { "epoch": 0.27, "learning_rate": 0.0017201843992147457, "loss": 2.7433, "step": 9926 }, { "epoch": 0.27, "learning_rate": 0.0017201240102003217, "loss": 2.9135, "step": 9927 }, { "epoch": 0.27, "learning_rate": 0.001720063615730367, "loss": 3.076, "step": 9928 }, { "epoch": 0.27, "learning_rate": 0.0017200032158053392, "loss": 2.9033, "step": 9929 }, { "epoch": 0.27, "learning_rate": 0.0017199428104256956, "loss": 2.4306, "step": 9930 }, { "epoch": 0.27, "learning_rate": 0.001719882399591894, "loss": 2.4274, "step": 9931 }, { "epoch": 0.27, "learning_rate": 0.0017198219833043922, "loss": 2.5904, "step": 9932 }, { "epoch": 0.27, "learning_rate": 0.0017197615615636478, "loss": 2.4198, "step": 9933 }, { "epoch": 0.27, "learning_rate": 0.001719701134370118, "loss": 2.4397, "step": 9934 }, { "epoch": 0.27, "learning_rate": 0.0017196407017242615, "loss": 2.7457, "step": 9935 }, { "epoch": 0.27, "learning_rate": 0.0017195802636265356, "loss": 2.8363, "step": 9936 }, { "epoch": 0.27, "learning_rate": 0.001719519820077398, "loss": 2.9665, "step": 9937 }, { "epoch": 0.27, "learning_rate": 0.0017194593710773073, "loss": 2.5784, "step": 9938 }, { "epoch": 0.27, "learning_rate": 0.001719398916626721, "loss": 2.5304, "step": 9939 }, { "epoch": 0.27, "learning_rate": 0.001719338456726097, "loss": 2.6862, "step": 9940 }, { "epoch": 0.27, "learning_rate": 0.0017192779913758934, "loss": 3.0084, "step": 9941 }, { "epoch": 0.27, "learning_rate": 0.0017192175205765685, "loss": 2.7361, "step": 9942 }, { "epoch": 0.27, "learning_rate": 0.00171915704432858, "loss": 2.2623, "step": 9943 }, { "epoch": 0.27, "learning_rate": 0.0017190965626323865, "loss": 2.4845, "step": 9944 }, { "epoch": 0.27, "learning_rate": 0.001719036075488446, "loss": 2.7347, "step": 9945 }, { "epoch": 0.27, "learning_rate": 0.0017189755828972166, "loss": 2.5458, "step": 9946 }, { "epoch": 0.27, "learning_rate": 0.001718915084859157, "loss": 2.6441, "step": 9947 }, { "epoch": 0.27, "learning_rate": 0.0017188545813747252, "loss": 2.4642, "step": 9948 }, { "epoch": 0.27, "learning_rate": 0.0017187940724443793, "loss": 2.3021, "step": 9949 }, { "epoch": 0.27, "learning_rate": 0.0017187335580685782, "loss": 2.5824, "step": 9950 }, { "epoch": 0.27, "learning_rate": 0.00171867303824778, "loss": 2.7316, "step": 9951 }, { "epoch": 0.27, "learning_rate": 0.0017186125129824434, "loss": 2.7849, "step": 9952 }, { "epoch": 0.27, "learning_rate": 0.001718551982273027, "loss": 2.3702, "step": 9953 }, { "epoch": 0.27, "learning_rate": 0.0017184914461199894, "loss": 3.1216, "step": 9954 }, { "epoch": 0.27, "learning_rate": 0.001718430904523789, "loss": 2.6857, "step": 9955 }, { "epoch": 0.27, "learning_rate": 0.0017183703574848845, "loss": 2.5938, "step": 9956 }, { "epoch": 0.27, "learning_rate": 0.0017183098050037344, "loss": 2.8744, "step": 9957 }, { "epoch": 0.27, "learning_rate": 0.0017182492470807977, "loss": 2.6846, "step": 9958 }, { "epoch": 0.27, "learning_rate": 0.0017181886837165333, "loss": 2.1152, "step": 9959 }, { "epoch": 0.27, "learning_rate": 0.0017181281149113996, "loss": 2.7332, "step": 9960 }, { "epoch": 0.27, "learning_rate": 0.0017180675406658556, "loss": 2.3041, "step": 9961 }, { "epoch": 0.27, "learning_rate": 0.0017180069609803606, "loss": 2.7324, "step": 9962 }, { "epoch": 0.27, "learning_rate": 0.001717946375855373, "loss": 3.0266, "step": 9963 }, { "epoch": 0.27, "learning_rate": 0.0017178857852913523, "loss": 2.4146, "step": 9964 }, { "epoch": 0.27, "learning_rate": 0.0017178251892887568, "loss": 3.3166, "step": 9965 }, { "epoch": 0.27, "learning_rate": 0.0017177645878480466, "loss": 2.6107, "step": 9966 }, { "epoch": 0.27, "learning_rate": 0.0017177039809696795, "loss": 2.6209, "step": 9967 }, { "epoch": 0.27, "learning_rate": 0.001717643368654116, "loss": 2.8219, "step": 9968 }, { "epoch": 0.27, "learning_rate": 0.0017175827509018143, "loss": 2.6884, "step": 9969 }, { "epoch": 0.27, "learning_rate": 0.001717522127713234, "loss": 2.6011, "step": 9970 }, { "epoch": 0.27, "learning_rate": 0.0017174614990888345, "loss": 2.5617, "step": 9971 }, { "epoch": 0.27, "learning_rate": 0.0017174008650290746, "loss": 2.4134, "step": 9972 }, { "epoch": 0.27, "learning_rate": 0.0017173402255344144, "loss": 2.5925, "step": 9973 }, { "epoch": 0.27, "learning_rate": 0.0017172795806053125, "loss": 2.3378, "step": 9974 }, { "epoch": 0.27, "learning_rate": 0.001717218930242229, "loss": 2.8086, "step": 9975 }, { "epoch": 0.27, "learning_rate": 0.001717158274445623, "loss": 2.918, "step": 9976 }, { "epoch": 0.27, "learning_rate": 0.0017170976132159545, "loss": 2.1706, "step": 9977 }, { "epoch": 0.27, "learning_rate": 0.0017170369465536823, "loss": 2.5292, "step": 9978 }, { "epoch": 0.27, "learning_rate": 0.0017169762744592663, "loss": 2.404, "step": 9979 }, { "epoch": 0.27, "learning_rate": 0.0017169155969331664, "loss": 2.4134, "step": 9980 }, { "epoch": 0.27, "learning_rate": 0.0017168549139758424, "loss": 2.4463, "step": 9981 }, { "epoch": 0.27, "learning_rate": 0.0017167942255877531, "loss": 2.6979, "step": 9982 }, { "epoch": 0.27, "learning_rate": 0.0017167335317693593, "loss": 3.0193, "step": 9983 }, { "epoch": 0.27, "learning_rate": 0.0017166728325211204, "loss": 2.9468, "step": 9984 }, { "epoch": 0.27, "learning_rate": 0.0017166121278434964, "loss": 2.391, "step": 9985 }, { "epoch": 0.27, "learning_rate": 0.0017165514177369468, "loss": 2.2443, "step": 9986 }, { "epoch": 0.27, "learning_rate": 0.0017164907022019316, "loss": 3.0599, "step": 9987 }, { "epoch": 0.27, "learning_rate": 0.0017164299812389113, "loss": 2.6763, "step": 9988 }, { "epoch": 0.27, "learning_rate": 0.0017163692548483455, "loss": 2.5517, "step": 9989 }, { "epoch": 0.27, "learning_rate": 0.001716308523030694, "loss": 2.5293, "step": 9990 }, { "epoch": 0.27, "learning_rate": 0.0017162477857864174, "loss": 2.6632, "step": 9991 }, { "epoch": 0.27, "learning_rate": 0.0017161870431159757, "loss": 2.4115, "step": 9992 }, { "epoch": 0.27, "learning_rate": 0.0017161262950198288, "loss": 2.7406, "step": 9993 }, { "epoch": 0.27, "learning_rate": 0.0017160655414984371, "loss": 2.5041, "step": 9994 }, { "epoch": 0.27, "learning_rate": 0.0017160047825522612, "loss": 2.263, "step": 9995 }, { "epoch": 0.27, "learning_rate": 0.0017159440181817608, "loss": 2.5941, "step": 9996 }, { "epoch": 0.27, "learning_rate": 0.0017158832483873967, "loss": 2.9011, "step": 9997 }, { "epoch": 0.27, "learning_rate": 0.001715822473169629, "loss": 2.2305, "step": 9998 }, { "epoch": 0.27, "learning_rate": 0.0017157616925289184, "loss": 2.4482, "step": 9999 }, { "epoch": 0.27, "learning_rate": 0.0017157009064657247, "loss": 2.6127, "step": 10000 }, { "epoch": 0.27, "learning_rate": 0.001715640114980509, "loss": 2.5462, "step": 10001 }, { "epoch": 0.27, "learning_rate": 0.0017155793180737323, "loss": 2.6933, "step": 10002 }, { "epoch": 0.27, "learning_rate": 0.001715518515745854, "loss": 2.7286, "step": 10003 }, { "epoch": 0.27, "learning_rate": 0.0017154577079973358, "loss": 2.7489, "step": 10004 }, { "epoch": 0.27, "learning_rate": 0.0017153968948286375, "loss": 2.9222, "step": 10005 }, { "epoch": 0.27, "learning_rate": 0.0017153360762402205, "loss": 2.7378, "step": 10006 }, { "epoch": 0.27, "learning_rate": 0.0017152752522325452, "loss": 2.4644, "step": 10007 }, { "epoch": 0.27, "learning_rate": 0.0017152144228060723, "loss": 2.5656, "step": 10008 }, { "epoch": 0.27, "learning_rate": 0.0017151535879612633, "loss": 2.5863, "step": 10009 }, { "epoch": 0.27, "learning_rate": 0.0017150927476985783, "loss": 2.6551, "step": 10010 }, { "epoch": 0.27, "learning_rate": 0.0017150319020184785, "loss": 2.7221, "step": 10011 }, { "epoch": 0.27, "learning_rate": 0.0017149710509214247, "loss": 2.5692, "step": 10012 }, { "epoch": 0.27, "learning_rate": 0.001714910194407878, "loss": 2.5321, "step": 10013 }, { "epoch": 0.27, "learning_rate": 0.0017148493324782997, "loss": 2.3467, "step": 10014 }, { "epoch": 0.27, "learning_rate": 0.0017147884651331506, "loss": 2.4017, "step": 10015 }, { "epoch": 0.27, "learning_rate": 0.001714727592372892, "loss": 2.493, "step": 10016 }, { "epoch": 0.27, "learning_rate": 0.0017146667141979845, "loss": 2.5964, "step": 10017 }, { "epoch": 0.27, "learning_rate": 0.0017146058306088904, "loss": 2.808, "step": 10018 }, { "epoch": 0.27, "learning_rate": 0.0017145449416060697, "loss": 2.4571, "step": 10019 }, { "epoch": 0.27, "learning_rate": 0.0017144840471899846, "loss": 3.181, "step": 10020 }, { "epoch": 0.27, "learning_rate": 0.0017144231473610958, "loss": 2.2653, "step": 10021 }, { "epoch": 0.27, "learning_rate": 0.0017143622421198655, "loss": 2.5854, "step": 10022 }, { "epoch": 0.27, "learning_rate": 0.0017143013314667539, "loss": 2.6474, "step": 10023 }, { "epoch": 0.27, "learning_rate": 0.0017142404154022236, "loss": 2.4092, "step": 10024 }, { "epoch": 0.27, "learning_rate": 0.0017141794939267354, "loss": 2.3552, "step": 10025 }, { "epoch": 0.27, "learning_rate": 0.001714118567040751, "loss": 2.4419, "step": 10026 }, { "epoch": 0.27, "learning_rate": 0.0017140576347447322, "loss": 2.8686, "step": 10027 }, { "epoch": 0.27, "learning_rate": 0.0017139966970391406, "loss": 2.4387, "step": 10028 }, { "epoch": 0.27, "learning_rate": 0.0017139357539244374, "loss": 2.2778, "step": 10029 }, { "epoch": 0.27, "learning_rate": 0.0017138748054010841, "loss": 2.2467, "step": 10030 }, { "epoch": 0.27, "learning_rate": 0.0017138138514695435, "loss": 2.9435, "step": 10031 }, { "epoch": 0.27, "learning_rate": 0.0017137528921302768, "loss": 2.4113, "step": 10032 }, { "epoch": 0.27, "learning_rate": 0.0017136919273837458, "loss": 2.1712, "step": 10033 }, { "epoch": 0.27, "learning_rate": 0.001713630957230412, "loss": 3.2182, "step": 10034 }, { "epoch": 0.27, "learning_rate": 0.0017135699816707378, "loss": 2.9538, "step": 10035 }, { "epoch": 0.27, "learning_rate": 0.001713509000705185, "loss": 2.4803, "step": 10036 }, { "epoch": 0.27, "learning_rate": 0.0017134480143342157, "loss": 2.3074, "step": 10037 }, { "epoch": 0.27, "learning_rate": 0.0017133870225582916, "loss": 3.1169, "step": 10038 }, { "epoch": 0.27, "learning_rate": 0.0017133260253778752, "loss": 2.7981, "step": 10039 }, { "epoch": 0.27, "learning_rate": 0.0017132650227934282, "loss": 2.95, "step": 10040 }, { "epoch": 0.27, "learning_rate": 0.001713204014805413, "loss": 2.4848, "step": 10041 }, { "epoch": 0.27, "learning_rate": 0.0017131430014142917, "loss": 3.0041, "step": 10042 }, { "epoch": 0.27, "learning_rate": 0.0017130819826205264, "loss": 2.6371, "step": 10043 }, { "epoch": 0.27, "learning_rate": 0.0017130209584245795, "loss": 2.8672, "step": 10044 }, { "epoch": 0.27, "learning_rate": 0.0017129599288269134, "loss": 2.7766, "step": 10045 }, { "epoch": 0.27, "learning_rate": 0.0017128988938279904, "loss": 3.144, "step": 10046 }, { "epoch": 0.27, "learning_rate": 0.0017128378534282725, "loss": 2.9211, "step": 10047 }, { "epoch": 0.27, "learning_rate": 0.0017127768076282226, "loss": 2.534, "step": 10048 }, { "epoch": 0.27, "learning_rate": 0.0017127157564283033, "loss": 2.5683, "step": 10049 }, { "epoch": 0.27, "learning_rate": 0.0017126546998289768, "loss": 2.7628, "step": 10050 }, { "epoch": 0.27, "learning_rate": 0.0017125936378307052, "loss": 2.7373, "step": 10051 }, { "epoch": 0.27, "learning_rate": 0.0017125325704339521, "loss": 3.3356, "step": 10052 }, { "epoch": 0.27, "learning_rate": 0.0017124714976391796, "loss": 2.3794, "step": 10053 }, { "epoch": 0.27, "learning_rate": 0.0017124104194468504, "loss": 2.0664, "step": 10054 }, { "epoch": 0.27, "learning_rate": 0.0017123493358574269, "loss": 2.4086, "step": 10055 }, { "epoch": 0.27, "learning_rate": 0.0017122882468713725, "loss": 2.8546, "step": 10056 }, { "epoch": 0.27, "learning_rate": 0.0017122271524891498, "loss": 2.2726, "step": 10057 }, { "epoch": 0.27, "learning_rate": 0.0017121660527112212, "loss": 2.5706, "step": 10058 }, { "epoch": 0.27, "learning_rate": 0.00171210494753805, "loss": 2.2509, "step": 10059 }, { "epoch": 0.27, "learning_rate": 0.0017120438369700992, "loss": 2.3075, "step": 10060 }, { "epoch": 0.27, "learning_rate": 0.0017119827210078317, "loss": 2.3675, "step": 10061 }, { "epoch": 0.27, "learning_rate": 0.00171192159965171, "loss": 2.4934, "step": 10062 }, { "epoch": 0.27, "learning_rate": 0.0017118604729021976, "loss": 2.7577, "step": 10063 }, { "epoch": 0.27, "learning_rate": 0.0017117993407597578, "loss": 2.5275, "step": 10064 }, { "epoch": 0.27, "learning_rate": 0.0017117382032248534, "loss": 2.266, "step": 10065 }, { "epoch": 0.27, "learning_rate": 0.0017116770602979474, "loss": 2.5991, "step": 10066 }, { "epoch": 0.27, "learning_rate": 0.001711615911979503, "loss": 3.1169, "step": 10067 }, { "epoch": 0.27, "learning_rate": 0.0017115547582699842, "loss": 2.5025, "step": 10068 }, { "epoch": 0.27, "learning_rate": 0.0017114935991698536, "loss": 2.615, "step": 10069 }, { "epoch": 0.27, "learning_rate": 0.0017114324346795748, "loss": 2.4504, "step": 10070 }, { "epoch": 0.27, "learning_rate": 0.001711371264799611, "loss": 2.3905, "step": 10071 }, { "epoch": 0.27, "learning_rate": 0.0017113100895304253, "loss": 2.6056, "step": 10072 }, { "epoch": 0.27, "learning_rate": 0.0017112489088724821, "loss": 2.8734, "step": 10073 }, { "epoch": 0.27, "learning_rate": 0.001711187722826244, "loss": 2.766, "step": 10074 }, { "epoch": 0.27, "learning_rate": 0.0017111265313921752, "loss": 2.2983, "step": 10075 }, { "epoch": 0.27, "learning_rate": 0.0017110653345707386, "loss": 2.9394, "step": 10076 }, { "epoch": 0.27, "learning_rate": 0.001711004132362398, "loss": 2.649, "step": 10077 }, { "epoch": 0.27, "learning_rate": 0.0017109429247676175, "loss": 2.6055, "step": 10078 }, { "epoch": 0.27, "learning_rate": 0.0017108817117868606, "loss": 2.7983, "step": 10079 }, { "epoch": 0.27, "learning_rate": 0.0017108204934205907, "loss": 2.4993, "step": 10080 }, { "epoch": 0.27, "learning_rate": 0.001710759269669272, "loss": 3.2845, "step": 10081 }, { "epoch": 0.27, "learning_rate": 0.0017106980405333682, "loss": 2.8134, "step": 10082 }, { "epoch": 0.27, "learning_rate": 0.0017106368060133428, "loss": 2.7516, "step": 10083 }, { "epoch": 0.27, "learning_rate": 0.00171057556610966, "loss": 2.7251, "step": 10084 }, { "epoch": 0.27, "learning_rate": 0.0017105143208227841, "loss": 2.991, "step": 10085 }, { "epoch": 0.27, "learning_rate": 0.0017104530701531786, "loss": 2.7814, "step": 10086 }, { "epoch": 0.27, "learning_rate": 0.0017103918141013078, "loss": 2.6658, "step": 10087 }, { "epoch": 0.27, "learning_rate": 0.001710330552667635, "loss": 2.4659, "step": 10088 }, { "epoch": 0.27, "learning_rate": 0.0017102692858526254, "loss": 2.8806, "step": 10089 }, { "epoch": 0.27, "learning_rate": 0.001710208013656743, "loss": 2.6053, "step": 10090 }, { "epoch": 0.27, "learning_rate": 0.0017101467360804512, "loss": 3.3443, "step": 10091 }, { "epoch": 0.27, "learning_rate": 0.0017100854531242147, "loss": 2.6024, "step": 10092 }, { "epoch": 0.27, "learning_rate": 0.0017100241647884978, "loss": 2.8079, "step": 10093 }, { "epoch": 0.27, "learning_rate": 0.001709962871073765, "loss": 2.5612, "step": 10094 }, { "epoch": 0.27, "learning_rate": 0.0017099015719804803, "loss": 2.5795, "step": 10095 }, { "epoch": 0.27, "learning_rate": 0.001709840267509108, "loss": 2.3255, "step": 10096 }, { "epoch": 0.27, "learning_rate": 0.001709778957660113, "loss": 2.8386, "step": 10097 }, { "epoch": 0.27, "learning_rate": 0.0017097176424339592, "loss": 2.4772, "step": 10098 }, { "epoch": 0.27, "learning_rate": 0.0017096563218311118, "loss": 2.5254, "step": 10099 }, { "epoch": 0.27, "learning_rate": 0.0017095949958520348, "loss": 2.3731, "step": 10100 }, { "epoch": 0.27, "learning_rate": 0.0017095336644971928, "loss": 2.7483, "step": 10101 }, { "epoch": 0.27, "learning_rate": 0.001709472327767051, "loss": 2.9515, "step": 10102 }, { "epoch": 0.27, "learning_rate": 0.0017094109856620734, "loss": 2.8677, "step": 10103 }, { "epoch": 0.27, "learning_rate": 0.0017093496381827252, "loss": 2.7418, "step": 10104 }, { "epoch": 0.27, "learning_rate": 0.0017092882853294708, "loss": 2.444, "step": 10105 }, { "epoch": 0.27, "learning_rate": 0.001709226927102775, "loss": 2.4611, "step": 10106 }, { "epoch": 0.27, "learning_rate": 0.0017091655635031032, "loss": 2.3881, "step": 10107 }, { "epoch": 0.27, "learning_rate": 0.0017091041945309197, "loss": 2.5272, "step": 10108 }, { "epoch": 0.27, "learning_rate": 0.0017090428201866894, "loss": 2.6045, "step": 10109 }, { "epoch": 0.27, "learning_rate": 0.0017089814404708777, "loss": 2.7811, "step": 10110 }, { "epoch": 0.27, "learning_rate": 0.0017089200553839494, "loss": 2.6073, "step": 10111 }, { "epoch": 0.27, "learning_rate": 0.0017088586649263693, "loss": 2.3435, "step": 10112 }, { "epoch": 0.27, "learning_rate": 0.001708797269098603, "loss": 2.8082, "step": 10113 }, { "epoch": 0.27, "learning_rate": 0.001708735867901115, "loss": 2.6709, "step": 10114 }, { "epoch": 0.27, "learning_rate": 0.001708674461334371, "loss": 2.7215, "step": 10115 }, { "epoch": 0.27, "learning_rate": 0.0017086130493988358, "loss": 2.59, "step": 10116 }, { "epoch": 0.27, "learning_rate": 0.0017085516320949749, "loss": 2.9174, "step": 10117 }, { "epoch": 0.27, "learning_rate": 0.0017084902094232535, "loss": 2.9781, "step": 10118 }, { "epoch": 0.27, "learning_rate": 0.0017084287813841368, "loss": 2.437, "step": 10119 }, { "epoch": 0.27, "learning_rate": 0.0017083673479780903, "loss": 2.718, "step": 10120 }, { "epoch": 0.27, "learning_rate": 0.0017083059092055798, "loss": 2.8124, "step": 10121 }, { "epoch": 0.27, "learning_rate": 0.00170824446506707, "loss": 2.6572, "step": 10122 }, { "epoch": 0.27, "learning_rate": 0.0017081830155630268, "loss": 2.7211, "step": 10123 }, { "epoch": 0.27, "learning_rate": 0.001708121560693916, "loss": 2.616, "step": 10124 }, { "epoch": 0.27, "learning_rate": 0.0017080601004602026, "loss": 2.5879, "step": 10125 }, { "epoch": 0.27, "learning_rate": 0.0017079986348623524, "loss": 2.696, "step": 10126 }, { "epoch": 0.27, "learning_rate": 0.0017079371639008311, "loss": 2.9941, "step": 10127 }, { "epoch": 0.27, "learning_rate": 0.0017078756875761045, "loss": 2.5787, "step": 10128 }, { "epoch": 0.27, "learning_rate": 0.0017078142058886386, "loss": 2.7575, "step": 10129 }, { "epoch": 0.27, "learning_rate": 0.0017077527188388984, "loss": 2.4065, "step": 10130 }, { "epoch": 0.27, "learning_rate": 0.0017076912264273503, "loss": 2.8006, "step": 10131 }, { "epoch": 0.27, "learning_rate": 0.0017076297286544597, "loss": 2.2181, "step": 10132 }, { "epoch": 0.27, "learning_rate": 0.001707568225520693, "loss": 2.6314, "step": 10133 }, { "epoch": 0.27, "learning_rate": 0.001707506717026516, "loss": 2.7178, "step": 10134 }, { "epoch": 0.27, "learning_rate": 0.0017074452031723944, "loss": 2.6406, "step": 10135 }, { "epoch": 0.27, "learning_rate": 0.0017073836839587946, "loss": 2.2991, "step": 10136 }, { "epoch": 0.27, "learning_rate": 0.0017073221593861825, "loss": 2.562, "step": 10137 }, { "epoch": 0.27, "learning_rate": 0.001707260629455024, "loss": 2.5625, "step": 10138 }, { "epoch": 0.27, "learning_rate": 0.0017071990941657856, "loss": 2.8239, "step": 10139 }, { "epoch": 0.27, "learning_rate": 0.0017071375535189332, "loss": 2.8447, "step": 10140 }, { "epoch": 0.27, "learning_rate": 0.0017070760075149332, "loss": 2.4763, "step": 10141 }, { "epoch": 0.27, "learning_rate": 0.0017070144561542517, "loss": 2.8659, "step": 10142 }, { "epoch": 0.27, "learning_rate": 0.0017069528994373552, "loss": 2.1821, "step": 10143 }, { "epoch": 0.27, "learning_rate": 0.0017068913373647098, "loss": 2.1327, "step": 10144 }, { "epoch": 0.27, "learning_rate": 0.0017068297699367819, "loss": 2.4238, "step": 10145 }, { "epoch": 0.27, "learning_rate": 0.0017067681971540383, "loss": 3.0076, "step": 10146 }, { "epoch": 0.27, "learning_rate": 0.0017067066190169452, "loss": 2.9568, "step": 10147 }, { "epoch": 0.27, "learning_rate": 0.0017066450355259688, "loss": 2.6637, "step": 10148 }, { "epoch": 0.27, "learning_rate": 0.001706583446681576, "loss": 2.7408, "step": 10149 }, { "epoch": 0.27, "learning_rate": 0.0017065218524842337, "loss": 2.27, "step": 10150 }, { "epoch": 0.27, "learning_rate": 0.001706460252934408, "loss": 2.6049, "step": 10151 }, { "epoch": 0.27, "learning_rate": 0.0017063986480325656, "loss": 2.6637, "step": 10152 }, { "epoch": 0.27, "learning_rate": 0.001706337037779173, "loss": 2.6321, "step": 10153 }, { "epoch": 0.27, "learning_rate": 0.001706275422174698, "loss": 2.2535, "step": 10154 }, { "epoch": 0.27, "learning_rate": 0.0017062138012196063, "loss": 2.3612, "step": 10155 }, { "epoch": 0.27, "learning_rate": 0.0017061521749143652, "loss": 2.5877, "step": 10156 }, { "epoch": 0.27, "learning_rate": 0.001706090543259441, "loss": 2.3258, "step": 10157 }, { "epoch": 0.27, "learning_rate": 0.0017060289062553018, "loss": 2.5634, "step": 10158 }, { "epoch": 0.27, "learning_rate": 0.0017059672639024135, "loss": 2.2534, "step": 10159 }, { "epoch": 0.27, "learning_rate": 0.0017059056162012434, "loss": 2.5755, "step": 10160 }, { "epoch": 0.27, "learning_rate": 0.0017058439631522585, "loss": 1.9335, "step": 10161 }, { "epoch": 0.27, "learning_rate": 0.001705782304755926, "loss": 2.5197, "step": 10162 }, { "epoch": 0.27, "learning_rate": 0.0017057206410127132, "loss": 2.8772, "step": 10163 }, { "epoch": 0.27, "learning_rate": 0.0017056589719230866, "loss": 2.5074, "step": 10164 }, { "epoch": 0.27, "learning_rate": 0.0017055972974875141, "loss": 2.3539, "step": 10165 }, { "epoch": 0.27, "learning_rate": 0.0017055356177064624, "loss": 2.6912, "step": 10166 }, { "epoch": 0.27, "learning_rate": 0.001705473932580399, "loss": 2.2901, "step": 10167 }, { "epoch": 0.27, "learning_rate": 0.0017054122421097913, "loss": 2.694, "step": 10168 }, { "epoch": 0.27, "learning_rate": 0.0017053505462951066, "loss": 2.6309, "step": 10169 }, { "epoch": 0.27, "learning_rate": 0.0017052888451368122, "loss": 2.9827, "step": 10170 }, { "epoch": 0.27, "learning_rate": 0.0017052271386353754, "loss": 2.589, "step": 10171 }, { "epoch": 0.27, "learning_rate": 0.0017051654267912642, "loss": 2.459, "step": 10172 }, { "epoch": 0.27, "learning_rate": 0.0017051037096049457, "loss": 2.7055, "step": 10173 }, { "epoch": 0.27, "learning_rate": 0.001705041987076888, "loss": 2.4009, "step": 10174 }, { "epoch": 0.27, "learning_rate": 0.0017049802592075576, "loss": 2.4704, "step": 10175 }, { "epoch": 0.27, "learning_rate": 0.0017049185259974228, "loss": 2.7484, "step": 10176 }, { "epoch": 0.27, "learning_rate": 0.0017048567874469516, "loss": 3.0087, "step": 10177 }, { "epoch": 0.27, "learning_rate": 0.0017047950435566113, "loss": 2.955, "step": 10178 }, { "epoch": 0.27, "learning_rate": 0.0017047332943268697, "loss": 2.8788, "step": 10179 }, { "epoch": 0.27, "learning_rate": 0.0017046715397581946, "loss": 2.4868, "step": 10180 }, { "epoch": 0.27, "learning_rate": 0.0017046097798510541, "loss": 2.4958, "step": 10181 }, { "epoch": 0.27, "learning_rate": 0.0017045480146059158, "loss": 3.0301, "step": 10182 }, { "epoch": 0.27, "learning_rate": 0.0017044862440232476, "loss": 2.4166, "step": 10183 }, { "epoch": 0.27, "learning_rate": 0.0017044244681035177, "loss": 2.3986, "step": 10184 }, { "epoch": 0.27, "learning_rate": 0.001704362686847194, "loss": 2.5033, "step": 10185 }, { "epoch": 0.27, "learning_rate": 0.0017043009002547442, "loss": 2.2452, "step": 10186 }, { "epoch": 0.27, "learning_rate": 0.0017042391083266371, "loss": 3.2087, "step": 10187 }, { "epoch": 0.27, "learning_rate": 0.00170417731106334, "loss": 2.8127, "step": 10188 }, { "epoch": 0.27, "learning_rate": 0.001704115508465322, "loss": 2.6003, "step": 10189 }, { "epoch": 0.27, "learning_rate": 0.0017040537005330503, "loss": 2.6045, "step": 10190 }, { "epoch": 0.27, "learning_rate": 0.001703991887266994, "loss": 2.7256, "step": 10191 }, { "epoch": 0.27, "learning_rate": 0.0017039300686676206, "loss": 2.6428, "step": 10192 }, { "epoch": 0.27, "learning_rate": 0.0017038682447353996, "loss": 2.322, "step": 10193 }, { "epoch": 0.27, "learning_rate": 0.001703806415470798, "loss": 2.2604, "step": 10194 }, { "epoch": 0.27, "learning_rate": 0.0017037445808742852, "loss": 2.3465, "step": 10195 }, { "epoch": 0.27, "learning_rate": 0.0017036827409463284, "loss": 2.4624, "step": 10196 }, { "epoch": 0.27, "learning_rate": 0.001703620895687398, "loss": 2.6879, "step": 10197 }, { "epoch": 0.27, "learning_rate": 0.001703559045097961, "loss": 2.6234, "step": 10198 }, { "epoch": 0.27, "learning_rate": 0.0017034971891784865, "loss": 2.5902, "step": 10199 }, { "epoch": 0.27, "learning_rate": 0.001703435327929443, "loss": 2.6574, "step": 10200 }, { "epoch": 0.27, "learning_rate": 0.0017033734613512994, "loss": 2.5212, "step": 10201 }, { "epoch": 0.27, "learning_rate": 0.0017033115894445243, "loss": 2.362, "step": 10202 }, { "epoch": 0.27, "learning_rate": 0.001703249712209586, "loss": 2.8244, "step": 10203 }, { "epoch": 0.27, "learning_rate": 0.001703187829646954, "loss": 2.8299, "step": 10204 }, { "epoch": 0.27, "learning_rate": 0.0017031259417570963, "loss": 2.4681, "step": 10205 }, { "epoch": 0.27, "learning_rate": 0.0017030640485404826, "loss": 2.3732, "step": 10206 }, { "epoch": 0.27, "learning_rate": 0.001703002149997581, "loss": 2.7298, "step": 10207 }, { "epoch": 0.27, "learning_rate": 0.001702940246128861, "loss": 2.5763, "step": 10208 }, { "epoch": 0.27, "learning_rate": 0.0017028783369347914, "loss": 2.2262, "step": 10209 }, { "epoch": 0.27, "learning_rate": 0.001702816422415841, "loss": 2.471, "step": 10210 }, { "epoch": 0.27, "learning_rate": 0.0017027545025724792, "loss": 2.3801, "step": 10211 }, { "epoch": 0.27, "learning_rate": 0.001702692577405175, "loss": 2.7692, "step": 10212 }, { "epoch": 0.27, "learning_rate": 0.0017026306469143974, "loss": 2.5056, "step": 10213 }, { "epoch": 0.27, "learning_rate": 0.0017025687111006155, "loss": 2.7123, "step": 10214 }, { "epoch": 0.27, "learning_rate": 0.0017025067699642986, "loss": 2.6159, "step": 10215 }, { "epoch": 0.27, "learning_rate": 0.0017024448235059162, "loss": 2.6454, "step": 10216 }, { "epoch": 0.27, "learning_rate": 0.0017023828717259372, "loss": 2.5852, "step": 10217 }, { "epoch": 0.27, "learning_rate": 0.0017023209146248314, "loss": 2.7393, "step": 10218 }, { "epoch": 0.27, "learning_rate": 0.0017022589522030676, "loss": 2.5575, "step": 10219 }, { "epoch": 0.27, "learning_rate": 0.0017021969844611157, "loss": 2.5786, "step": 10220 }, { "epoch": 0.27, "learning_rate": 0.0017021350113994452, "loss": 2.9155, "step": 10221 }, { "epoch": 0.27, "learning_rate": 0.0017020730330185253, "loss": 2.682, "step": 10222 }, { "epoch": 0.27, "learning_rate": 0.0017020110493188253, "loss": 2.4719, "step": 10223 }, { "epoch": 0.27, "learning_rate": 0.0017019490603008155, "loss": 2.5745, "step": 10224 }, { "epoch": 0.27, "learning_rate": 0.0017018870659649648, "loss": 2.4837, "step": 10225 }, { "epoch": 0.27, "learning_rate": 0.0017018250663117431, "loss": 2.7491, "step": 10226 }, { "epoch": 0.27, "learning_rate": 0.0017017630613416204, "loss": 2.6474, "step": 10227 }, { "epoch": 0.27, "learning_rate": 0.0017017010510550663, "loss": 2.4773, "step": 10228 }, { "epoch": 0.27, "learning_rate": 0.0017016390354525504, "loss": 2.4228, "step": 10229 }, { "epoch": 0.27, "learning_rate": 0.0017015770145345425, "loss": 2.5423, "step": 10230 }, { "epoch": 0.27, "learning_rate": 0.0017015149883015126, "loss": 2.4584, "step": 10231 }, { "epoch": 0.27, "learning_rate": 0.0017014529567539304, "loss": 2.1668, "step": 10232 }, { "epoch": 0.27, "learning_rate": 0.0017013909198922664, "loss": 2.9318, "step": 10233 }, { "epoch": 0.28, "learning_rate": 0.00170132887771699, "loss": 2.0966, "step": 10234 }, { "epoch": 0.28, "learning_rate": 0.0017012668302285713, "loss": 2.6896, "step": 10235 }, { "epoch": 0.28, "learning_rate": 0.001701204777427481, "loss": 2.8709, "step": 10236 }, { "epoch": 0.28, "learning_rate": 0.001701142719314188, "loss": 2.3756, "step": 10237 }, { "epoch": 0.28, "learning_rate": 0.001701080655889163, "loss": 2.201, "step": 10238 }, { "epoch": 0.28, "learning_rate": 0.001701018587152877, "loss": 2.5789, "step": 10239 }, { "epoch": 0.28, "learning_rate": 0.0017009565131057994, "loss": 2.7635, "step": 10240 }, { "epoch": 0.28, "learning_rate": 0.0017008944337484001, "loss": 2.5946, "step": 10241 }, { "epoch": 0.28, "learning_rate": 0.00170083234908115, "loss": 2.542, "step": 10242 }, { "epoch": 0.28, "learning_rate": 0.0017007702591045196, "loss": 2.1503, "step": 10243 }, { "epoch": 0.28, "learning_rate": 0.001700708163818979, "loss": 2.536, "step": 10244 }, { "epoch": 0.28, "learning_rate": 0.0017006460632249985, "loss": 2.6577, "step": 10245 }, { "epoch": 0.28, "learning_rate": 0.0017005839573230484, "loss": 2.5305, "step": 10246 }, { "epoch": 0.28, "learning_rate": 0.0017005218461135997, "loss": 2.6642, "step": 10247 }, { "epoch": 0.28, "learning_rate": 0.0017004597295971228, "loss": 2.378, "step": 10248 }, { "epoch": 0.28, "learning_rate": 0.0017003976077740884, "loss": 2.5564, "step": 10249 }, { "epoch": 0.28, "learning_rate": 0.0017003354806449666, "loss": 2.1836, "step": 10250 }, { "epoch": 0.28, "learning_rate": 0.0017002733482102286, "loss": 2.6715, "step": 10251 }, { "epoch": 0.28, "learning_rate": 0.0017002112104703448, "loss": 2.592, "step": 10252 }, { "epoch": 0.28, "learning_rate": 0.0017001490674257865, "loss": 2.7998, "step": 10253 }, { "epoch": 0.28, "learning_rate": 0.0017000869190770232, "loss": 2.6831, "step": 10254 }, { "epoch": 0.28, "learning_rate": 0.0017000247654245274, "loss": 2.9958, "step": 10255 }, { "epoch": 0.28, "learning_rate": 0.0016999626064687686, "loss": 2.8862, "step": 10256 }, { "epoch": 0.28, "learning_rate": 0.0016999004422102184, "loss": 2.6474, "step": 10257 }, { "epoch": 0.28, "learning_rate": 0.0016998382726493475, "loss": 2.6862, "step": 10258 }, { "epoch": 0.28, "learning_rate": 0.001699776097786627, "loss": 2.6363, "step": 10259 }, { "epoch": 0.28, "learning_rate": 0.001699713917622528, "loss": 2.2555, "step": 10260 }, { "epoch": 0.28, "learning_rate": 0.0016996517321575216, "loss": 2.5695, "step": 10261 }, { "epoch": 0.28, "learning_rate": 0.0016995895413920784, "loss": 2.908, "step": 10262 }, { "epoch": 0.28, "learning_rate": 0.00169952734532667, "loss": 2.3474, "step": 10263 }, { "epoch": 0.28, "learning_rate": 0.0016994651439617675, "loss": 2.5562, "step": 10264 }, { "epoch": 0.28, "learning_rate": 0.001699402937297842, "loss": 2.5371, "step": 10265 }, { "epoch": 0.28, "learning_rate": 0.0016993407253353655, "loss": 2.3678, "step": 10266 }, { "epoch": 0.28, "learning_rate": 0.0016992785080748082, "loss": 2.5237, "step": 10267 }, { "epoch": 0.28, "learning_rate": 0.001699216285516642, "loss": 2.8842, "step": 10268 }, { "epoch": 0.28, "learning_rate": 0.0016991540576613382, "loss": 2.7528, "step": 10269 }, { "epoch": 0.28, "learning_rate": 0.0016990918245093681, "loss": 2.1481, "step": 10270 }, { "epoch": 0.28, "learning_rate": 0.0016990295860612036, "loss": 2.873, "step": 10271 }, { "epoch": 0.28, "learning_rate": 0.001698967342317316, "loss": 2.5487, "step": 10272 }, { "epoch": 0.28, "learning_rate": 0.0016989050932781765, "loss": 3.0692, "step": 10273 }, { "epoch": 0.28, "learning_rate": 0.0016988428389442573, "loss": 2.7802, "step": 10274 }, { "epoch": 0.28, "learning_rate": 0.0016987805793160292, "loss": 2.6763, "step": 10275 }, { "epoch": 0.28, "learning_rate": 0.0016987183143939645, "loss": 2.5434, "step": 10276 }, { "epoch": 0.28, "learning_rate": 0.001698656044178535, "loss": 2.5496, "step": 10277 }, { "epoch": 0.28, "learning_rate": 0.001698593768670212, "loss": 2.647, "step": 10278 }, { "epoch": 0.28, "learning_rate": 0.001698531487869468, "loss": 2.4867, "step": 10279 }, { "epoch": 0.28, "learning_rate": 0.0016984692017767739, "loss": 2.4892, "step": 10280 }, { "epoch": 0.28, "learning_rate": 0.0016984069103926022, "loss": 2.5715, "step": 10281 }, { "epoch": 0.28, "learning_rate": 0.0016983446137174242, "loss": 2.994, "step": 10282 }, { "epoch": 0.28, "learning_rate": 0.0016982823117517127, "loss": 2.6055, "step": 10283 }, { "epoch": 0.28, "learning_rate": 0.001698220004495939, "loss": 2.5048, "step": 10284 }, { "epoch": 0.28, "learning_rate": 0.0016981576919505754, "loss": 2.4634, "step": 10285 }, { "epoch": 0.28, "learning_rate": 0.001698095374116094, "loss": 2.9063, "step": 10286 }, { "epoch": 0.28, "learning_rate": 0.0016980330509929668, "loss": 2.3998, "step": 10287 }, { "epoch": 0.28, "learning_rate": 0.0016979707225816662, "loss": 2.4984, "step": 10288 }, { "epoch": 0.28, "learning_rate": 0.0016979083888826638, "loss": 2.817, "step": 10289 }, { "epoch": 0.28, "learning_rate": 0.0016978460498964325, "loss": 2.6802, "step": 10290 }, { "epoch": 0.28, "learning_rate": 0.0016977837056234445, "loss": 2.9226, "step": 10291 }, { "epoch": 0.28, "learning_rate": 0.0016977213560641715, "loss": 2.8377, "step": 10292 }, { "epoch": 0.28, "learning_rate": 0.0016976590012190865, "loss": 2.5317, "step": 10293 }, { "epoch": 0.28, "learning_rate": 0.0016975966410886615, "loss": 3.2641, "step": 10294 }, { "epoch": 0.28, "learning_rate": 0.0016975342756733692, "loss": 2.471, "step": 10295 }, { "epoch": 0.28, "learning_rate": 0.001697471904973682, "loss": 2.6577, "step": 10296 }, { "epoch": 0.28, "learning_rate": 0.0016974095289900722, "loss": 2.4161, "step": 10297 }, { "epoch": 0.28, "learning_rate": 0.0016973471477230123, "loss": 2.6261, "step": 10298 }, { "epoch": 0.28, "learning_rate": 0.0016972847611729754, "loss": 2.5705, "step": 10299 }, { "epoch": 0.28, "learning_rate": 0.0016972223693404336, "loss": 2.2567, "step": 10300 }, { "epoch": 0.28, "learning_rate": 0.0016971599722258599, "loss": 2.6846, "step": 10301 }, { "epoch": 0.28, "learning_rate": 0.0016970975698297269, "loss": 2.1549, "step": 10302 }, { "epoch": 0.28, "learning_rate": 0.001697035162152507, "loss": 2.7216, "step": 10303 }, { "epoch": 0.28, "learning_rate": 0.0016969727491946741, "loss": 2.6581, "step": 10304 }, { "epoch": 0.28, "learning_rate": 0.0016969103309566994, "loss": 2.2713, "step": 10305 }, { "epoch": 0.28, "learning_rate": 0.0016968479074390573, "loss": 2.7578, "step": 10306 }, { "epoch": 0.28, "learning_rate": 0.0016967854786422195, "loss": 2.367, "step": 10307 }, { "epoch": 0.28, "learning_rate": 0.0016967230445666596, "loss": 2.7946, "step": 10308 }, { "epoch": 0.28, "learning_rate": 0.0016966606052128508, "loss": 2.4746, "step": 10309 }, { "epoch": 0.28, "learning_rate": 0.0016965981605812654, "loss": 2.3407, "step": 10310 }, { "epoch": 0.28, "learning_rate": 0.0016965357106723774, "loss": 2.7134, "step": 10311 }, { "epoch": 0.28, "learning_rate": 0.001696473255486659, "loss": 2.4637, "step": 10312 }, { "epoch": 0.28, "learning_rate": 0.0016964107950245837, "loss": 2.7719, "step": 10313 }, { "epoch": 0.28, "learning_rate": 0.0016963483292866252, "loss": 2.592, "step": 10314 }, { "epoch": 0.28, "learning_rate": 0.0016962858582732557, "loss": 2.324, "step": 10315 }, { "epoch": 0.28, "learning_rate": 0.001696223381984949, "loss": 2.5408, "step": 10316 }, { "epoch": 0.28, "learning_rate": 0.0016961609004221788, "loss": 2.7518, "step": 10317 }, { "epoch": 0.28, "learning_rate": 0.0016960984135854181, "loss": 2.9027, "step": 10318 }, { "epoch": 0.28, "learning_rate": 0.00169603592147514, "loss": 2.6784, "step": 10319 }, { "epoch": 0.28, "learning_rate": 0.001695973424091818, "loss": 2.979, "step": 10320 }, { "epoch": 0.28, "learning_rate": 0.0016959109214359264, "loss": 2.751, "step": 10321 }, { "epoch": 0.28, "learning_rate": 0.0016958484135079375, "loss": 2.4424, "step": 10322 }, { "epoch": 0.28, "learning_rate": 0.0016957859003083257, "loss": 2.5917, "step": 10323 }, { "epoch": 0.28, "learning_rate": 0.0016957233818375643, "loss": 2.8455, "step": 10324 }, { "epoch": 0.28, "learning_rate": 0.0016956608580961268, "loss": 2.5971, "step": 10325 }, { "epoch": 0.28, "learning_rate": 0.0016955983290844873, "loss": 2.4841, "step": 10326 }, { "epoch": 0.28, "learning_rate": 0.001695535794803119, "loss": 2.7104, "step": 10327 }, { "epoch": 0.28, "learning_rate": 0.0016954732552524959, "loss": 2.3614, "step": 10328 }, { "epoch": 0.28, "learning_rate": 0.0016954107104330918, "loss": 2.7312, "step": 10329 }, { "epoch": 0.28, "learning_rate": 0.0016953481603453804, "loss": 2.5268, "step": 10330 }, { "epoch": 0.28, "learning_rate": 0.0016952856049898357, "loss": 2.528, "step": 10331 }, { "epoch": 0.28, "learning_rate": 0.0016952230443669316, "loss": 3.1863, "step": 10332 }, { "epoch": 0.28, "learning_rate": 0.001695160478477142, "loss": 2.2418, "step": 10333 }, { "epoch": 0.28, "learning_rate": 0.0016950979073209408, "loss": 2.5887, "step": 10334 }, { "epoch": 0.28, "learning_rate": 0.0016950353308988024, "loss": 2.7042, "step": 10335 }, { "epoch": 0.28, "learning_rate": 0.0016949727492112003, "loss": 2.5916, "step": 10336 }, { "epoch": 0.28, "learning_rate": 0.0016949101622586089, "loss": 2.1766, "step": 10337 }, { "epoch": 0.28, "learning_rate": 0.0016948475700415027, "loss": 2.0501, "step": 10338 }, { "epoch": 0.28, "learning_rate": 0.0016947849725603553, "loss": 2.5043, "step": 10339 }, { "epoch": 0.28, "learning_rate": 0.0016947223698156409, "loss": 2.6699, "step": 10340 }, { "epoch": 0.28, "learning_rate": 0.0016946597618078343, "loss": 2.6883, "step": 10341 }, { "epoch": 0.28, "learning_rate": 0.0016945971485374097, "loss": 2.4937, "step": 10342 }, { "epoch": 0.28, "learning_rate": 0.0016945345300048412, "loss": 2.4515, "step": 10343 }, { "epoch": 0.28, "learning_rate": 0.001694471906210603, "loss": 2.5238, "step": 10344 }, { "epoch": 0.28, "learning_rate": 0.00169440927715517, "loss": 2.472, "step": 10345 }, { "epoch": 0.28, "learning_rate": 0.0016943466428390164, "loss": 2.6982, "step": 10346 }, { "epoch": 0.28, "learning_rate": 0.0016942840032626169, "loss": 2.7814, "step": 10347 }, { "epoch": 0.28, "learning_rate": 0.0016942213584264457, "loss": 3.0847, "step": 10348 }, { "epoch": 0.28, "learning_rate": 0.0016941587083309777, "loss": 2.3371, "step": 10349 }, { "epoch": 0.28, "learning_rate": 0.0016940960529766875, "loss": 2.9813, "step": 10350 }, { "epoch": 0.28, "learning_rate": 0.0016940333923640498, "loss": 2.444, "step": 10351 }, { "epoch": 0.28, "learning_rate": 0.0016939707264935389, "loss": 2.3533, "step": 10352 }, { "epoch": 0.28, "learning_rate": 0.00169390805536563, "loss": 2.5463, "step": 10353 }, { "epoch": 0.28, "learning_rate": 0.001693845378980798, "loss": 2.2604, "step": 10354 }, { "epoch": 0.28, "learning_rate": 0.0016937826973395169, "loss": 2.6218, "step": 10355 }, { "epoch": 0.28, "learning_rate": 0.0016937200104422626, "loss": 2.506, "step": 10356 }, { "epoch": 0.28, "learning_rate": 0.0016936573182895094, "loss": 2.7285, "step": 10357 }, { "epoch": 0.28, "learning_rate": 0.0016935946208817324, "loss": 2.3641, "step": 10358 }, { "epoch": 0.28, "learning_rate": 0.0016935319182194064, "loss": 2.5253, "step": 10359 }, { "epoch": 0.28, "learning_rate": 0.0016934692103030065, "loss": 2.5418, "step": 10360 }, { "epoch": 0.28, "learning_rate": 0.001693406497133008, "loss": 3.1099, "step": 10361 }, { "epoch": 0.28, "learning_rate": 0.001693343778709886, "loss": 2.5123, "step": 10362 }, { "epoch": 0.28, "learning_rate": 0.0016932810550341151, "loss": 2.6255, "step": 10363 }, { "epoch": 0.28, "learning_rate": 0.0016932183261061714, "loss": 2.2183, "step": 10364 }, { "epoch": 0.28, "learning_rate": 0.001693155591926529, "loss": 2.4383, "step": 10365 }, { "epoch": 0.28, "learning_rate": 0.0016930928524956643, "loss": 2.9888, "step": 10366 }, { "epoch": 0.28, "learning_rate": 0.0016930301078140518, "loss": 2.7983, "step": 10367 }, { "epoch": 0.28, "learning_rate": 0.001692967357882167, "loss": 2.7068, "step": 10368 }, { "epoch": 0.28, "learning_rate": 0.0016929046027004855, "loss": 2.3576, "step": 10369 }, { "epoch": 0.28, "learning_rate": 0.0016928418422694827, "loss": 2.8154, "step": 10370 }, { "epoch": 0.28, "learning_rate": 0.0016927790765896339, "loss": 2.5331, "step": 10371 }, { "epoch": 0.28, "learning_rate": 0.0016927163056614147, "loss": 2.4267, "step": 10372 }, { "epoch": 0.28, "learning_rate": 0.0016926535294853006, "loss": 2.8336, "step": 10373 }, { "epoch": 0.28, "learning_rate": 0.0016925907480617674, "loss": 2.5271, "step": 10374 }, { "epoch": 0.28, "learning_rate": 0.00169252796139129, "loss": 2.099, "step": 10375 }, { "epoch": 0.28, "learning_rate": 0.001692465169474345, "loss": 2.5689, "step": 10376 }, { "epoch": 0.28, "learning_rate": 0.0016924023723114076, "loss": 2.43, "step": 10377 }, { "epoch": 0.28, "learning_rate": 0.0016923395699029536, "loss": 2.6023, "step": 10378 }, { "epoch": 0.28, "learning_rate": 0.0016922767622494586, "loss": 2.5625, "step": 10379 }, { "epoch": 0.28, "learning_rate": 0.0016922139493513988, "loss": 2.4978, "step": 10380 }, { "epoch": 0.28, "learning_rate": 0.0016921511312092499, "loss": 2.6787, "step": 10381 }, { "epoch": 0.28, "learning_rate": 0.0016920883078234876, "loss": 2.5297, "step": 10382 }, { "epoch": 0.28, "learning_rate": 0.001692025479194588, "loss": 2.6559, "step": 10383 }, { "epoch": 0.28, "learning_rate": 0.0016919626453230274, "loss": 2.5619, "step": 10384 }, { "epoch": 0.28, "learning_rate": 0.0016918998062092814, "loss": 2.7249, "step": 10385 }, { "epoch": 0.28, "learning_rate": 0.0016918369618538261, "loss": 2.3664, "step": 10386 }, { "epoch": 0.28, "learning_rate": 0.0016917741122571377, "loss": 2.5171, "step": 10387 }, { "epoch": 0.28, "learning_rate": 0.0016917112574196924, "loss": 2.3149, "step": 10388 }, { "epoch": 0.28, "learning_rate": 0.0016916483973419662, "loss": 2.5655, "step": 10389 }, { "epoch": 0.28, "learning_rate": 0.0016915855320244351, "loss": 2.5533, "step": 10390 }, { "epoch": 0.28, "learning_rate": 0.001691522661467576, "loss": 2.8264, "step": 10391 }, { "epoch": 0.28, "learning_rate": 0.001691459785671865, "loss": 2.9082, "step": 10392 }, { "epoch": 0.28, "learning_rate": 0.001691396904637778, "loss": 2.4678, "step": 10393 }, { "epoch": 0.28, "learning_rate": 0.0016913340183657914, "loss": 2.8973, "step": 10394 }, { "epoch": 0.28, "learning_rate": 0.0016912711268563822, "loss": 3.033, "step": 10395 }, { "epoch": 0.28, "learning_rate": 0.0016912082301100268, "loss": 2.5945, "step": 10396 }, { "epoch": 0.28, "learning_rate": 0.0016911453281272012, "loss": 2.618, "step": 10397 }, { "epoch": 0.28, "learning_rate": 0.001691082420908382, "loss": 2.6841, "step": 10398 }, { "epoch": 0.28, "learning_rate": 0.001691019508454046, "loss": 2.6593, "step": 10399 }, { "epoch": 0.28, "learning_rate": 0.00169095659076467, "loss": 2.5426, "step": 10400 }, { "epoch": 0.28, "learning_rate": 0.0016908936678407302, "loss": 2.7525, "step": 10401 }, { "epoch": 0.28, "learning_rate": 0.0016908307396827033, "loss": 2.4699, "step": 10402 }, { "epoch": 0.28, "learning_rate": 0.0016907678062910666, "loss": 2.6505, "step": 10403 }, { "epoch": 0.28, "learning_rate": 0.0016907048676662961, "loss": 2.3874, "step": 10404 }, { "epoch": 0.28, "learning_rate": 0.0016906419238088694, "loss": 2.4427, "step": 10405 }, { "epoch": 0.28, "learning_rate": 0.0016905789747192626, "loss": 2.8498, "step": 10406 }, { "epoch": 0.28, "learning_rate": 0.0016905160203979533, "loss": 2.6859, "step": 10407 }, { "epoch": 0.28, "learning_rate": 0.0016904530608454179, "loss": 2.7227, "step": 10408 }, { "epoch": 0.28, "learning_rate": 0.0016903900960621335, "loss": 2.6429, "step": 10409 }, { "epoch": 0.28, "learning_rate": 0.001690327126048577, "loss": 2.7289, "step": 10410 }, { "epoch": 0.28, "learning_rate": 0.0016902641508052259, "loss": 2.4869, "step": 10411 }, { "epoch": 0.28, "learning_rate": 0.001690201170332557, "loss": 2.2648, "step": 10412 }, { "epoch": 0.28, "learning_rate": 0.0016901381846310475, "loss": 2.5387, "step": 10413 }, { "epoch": 0.28, "learning_rate": 0.001690075193701174, "loss": 2.5301, "step": 10414 }, { "epoch": 0.28, "learning_rate": 0.0016900121975434149, "loss": 2.6892, "step": 10415 }, { "epoch": 0.28, "learning_rate": 0.0016899491961582462, "loss": 2.9281, "step": 10416 }, { "epoch": 0.28, "learning_rate": 0.001689886189546146, "loss": 2.7311, "step": 10417 }, { "epoch": 0.28, "learning_rate": 0.0016898231777075915, "loss": 3.0093, "step": 10418 }, { "epoch": 0.28, "learning_rate": 0.0016897601606430594, "loss": 2.0823, "step": 10419 }, { "epoch": 0.28, "learning_rate": 0.0016896971383530285, "loss": 2.3963, "step": 10420 }, { "epoch": 0.28, "learning_rate": 0.0016896341108379746, "loss": 3.0895, "step": 10421 }, { "epoch": 0.28, "learning_rate": 0.0016895710780983762, "loss": 2.407, "step": 10422 }, { "epoch": 0.28, "learning_rate": 0.0016895080401347108, "loss": 2.8598, "step": 10423 }, { "epoch": 0.28, "learning_rate": 0.0016894449969474556, "loss": 2.4309, "step": 10424 }, { "epoch": 0.28, "learning_rate": 0.0016893819485370883, "loss": 3.1054, "step": 10425 }, { "epoch": 0.28, "learning_rate": 0.0016893188949040868, "loss": 2.4099, "step": 10426 }, { "epoch": 0.28, "learning_rate": 0.0016892558360489286, "loss": 2.4729, "step": 10427 }, { "epoch": 0.28, "learning_rate": 0.0016891927719720912, "loss": 2.7243, "step": 10428 }, { "epoch": 0.28, "learning_rate": 0.0016891297026740526, "loss": 2.5848, "step": 10429 }, { "epoch": 0.28, "learning_rate": 0.0016890666281552907, "loss": 2.6174, "step": 10430 }, { "epoch": 0.28, "learning_rate": 0.0016890035484162832, "loss": 2.089, "step": 10431 }, { "epoch": 0.28, "learning_rate": 0.001688940463457508, "loss": 2.5914, "step": 10432 }, { "epoch": 0.28, "learning_rate": 0.0016888773732794426, "loss": 2.4022, "step": 10433 }, { "epoch": 0.28, "learning_rate": 0.0016888142778825662, "loss": 2.5963, "step": 10434 }, { "epoch": 0.28, "learning_rate": 0.0016887511772673554, "loss": 2.4118, "step": 10435 }, { "epoch": 0.28, "learning_rate": 0.001688688071434289, "loss": 2.3378, "step": 10436 }, { "epoch": 0.28, "learning_rate": 0.0016886249603838448, "loss": 2.8285, "step": 10437 }, { "epoch": 0.28, "learning_rate": 0.0016885618441165012, "loss": 2.5756, "step": 10438 }, { "epoch": 0.28, "learning_rate": 0.001688498722632736, "loss": 2.9913, "step": 10439 }, { "epoch": 0.28, "learning_rate": 0.0016884355959330276, "loss": 2.8125, "step": 10440 }, { "epoch": 0.28, "learning_rate": 0.0016883724640178541, "loss": 2.7539, "step": 10441 }, { "epoch": 0.28, "learning_rate": 0.001688309326887694, "loss": 2.5569, "step": 10442 }, { "epoch": 0.28, "learning_rate": 0.0016882461845430256, "loss": 2.4563, "step": 10443 }, { "epoch": 0.28, "learning_rate": 0.0016881830369843273, "loss": 2.6607, "step": 10444 }, { "epoch": 0.28, "learning_rate": 0.001688119884212077, "loss": 2.5373, "step": 10445 }, { "epoch": 0.28, "learning_rate": 0.0016880567262267535, "loss": 2.4529, "step": 10446 }, { "epoch": 0.28, "learning_rate": 0.0016879935630288352, "loss": 2.573, "step": 10447 }, { "epoch": 0.28, "learning_rate": 0.001687930394618801, "loss": 3.2732, "step": 10448 }, { "epoch": 0.28, "learning_rate": 0.0016878672209971288, "loss": 2.7544, "step": 10449 }, { "epoch": 0.28, "learning_rate": 0.0016878040421642977, "loss": 2.6895, "step": 10450 }, { "epoch": 0.28, "learning_rate": 0.001687740858120786, "loss": 2.8681, "step": 10451 }, { "epoch": 0.28, "learning_rate": 0.0016876776688670727, "loss": 2.6084, "step": 10452 }, { "epoch": 0.28, "learning_rate": 0.0016876144744036362, "loss": 2.6833, "step": 10453 }, { "epoch": 0.28, "learning_rate": 0.0016875512747309555, "loss": 2.8794, "step": 10454 }, { "epoch": 0.28, "learning_rate": 0.001687488069849509, "loss": 2.6869, "step": 10455 }, { "epoch": 0.28, "learning_rate": 0.001687424859759776, "loss": 2.7378, "step": 10456 }, { "epoch": 0.28, "learning_rate": 0.001687361644462235, "loss": 2.6393, "step": 10457 }, { "epoch": 0.28, "learning_rate": 0.0016872984239573654, "loss": 2.737, "step": 10458 }, { "epoch": 0.28, "learning_rate": 0.0016872351982456456, "loss": 2.5315, "step": 10459 }, { "epoch": 0.28, "learning_rate": 0.0016871719673275548, "loss": 2.5137, "step": 10460 }, { "epoch": 0.28, "learning_rate": 0.001687108731203572, "loss": 2.9333, "step": 10461 }, { "epoch": 0.28, "learning_rate": 0.0016870454898741762, "loss": 2.726, "step": 10462 }, { "epoch": 0.28, "learning_rate": 0.001686982243339847, "loss": 2.4825, "step": 10463 }, { "epoch": 0.28, "learning_rate": 0.0016869189916010625, "loss": 2.9365, "step": 10464 }, { "epoch": 0.28, "learning_rate": 0.001686855734658303, "loss": 2.2919, "step": 10465 }, { "epoch": 0.28, "learning_rate": 0.0016867924725120474, "loss": 2.4505, "step": 10466 }, { "epoch": 0.28, "learning_rate": 0.0016867292051627744, "loss": 2.4061, "step": 10467 }, { "epoch": 0.28, "learning_rate": 0.001686665932610964, "loss": 2.6316, "step": 10468 }, { "epoch": 0.28, "learning_rate": 0.0016866026548570951, "loss": 2.4988, "step": 10469 }, { "epoch": 0.28, "learning_rate": 0.0016865393719016474, "loss": 2.306, "step": 10470 }, { "epoch": 0.28, "learning_rate": 0.0016864760837451002, "loss": 2.8692, "step": 10471 }, { "epoch": 0.28, "learning_rate": 0.0016864127903879328, "loss": 2.288, "step": 10472 }, { "epoch": 0.28, "learning_rate": 0.0016863494918306246, "loss": 2.6644, "step": 10473 }, { "epoch": 0.28, "learning_rate": 0.0016862861880736558, "loss": 2.4077, "step": 10474 }, { "epoch": 0.28, "learning_rate": 0.0016862228791175052, "loss": 2.8147, "step": 10475 }, { "epoch": 0.28, "learning_rate": 0.0016861595649626526, "loss": 2.6966, "step": 10476 }, { "epoch": 0.28, "learning_rate": 0.001686096245609578, "loss": 2.384, "step": 10477 }, { "epoch": 0.28, "learning_rate": 0.0016860329210587612, "loss": 2.6607, "step": 10478 }, { "epoch": 0.28, "learning_rate": 0.0016859695913106815, "loss": 2.4129, "step": 10479 }, { "epoch": 0.28, "learning_rate": 0.0016859062563658186, "loss": 2.6707, "step": 10480 }, { "epoch": 0.28, "learning_rate": 0.0016858429162246527, "loss": 2.7062, "step": 10481 }, { "epoch": 0.28, "learning_rate": 0.0016857795708876636, "loss": 2.9792, "step": 10482 }, { "epoch": 0.28, "learning_rate": 0.0016857162203553306, "loss": 2.5968, "step": 10483 }, { "epoch": 0.28, "learning_rate": 0.0016856528646281347, "loss": 2.5503, "step": 10484 }, { "epoch": 0.28, "learning_rate": 0.001685589503706555, "loss": 2.6007, "step": 10485 }, { "epoch": 0.28, "learning_rate": 0.0016855261375910717, "loss": 2.7066, "step": 10486 }, { "epoch": 0.28, "learning_rate": 0.001685462766282165, "loss": 2.5279, "step": 10487 }, { "epoch": 0.28, "learning_rate": 0.001685399389780315, "loss": 2.623, "step": 10488 }, { "epoch": 0.28, "learning_rate": 0.0016853360080860017, "loss": 2.7505, "step": 10489 }, { "epoch": 0.28, "learning_rate": 0.0016852726211997054, "loss": 2.725, "step": 10490 }, { "epoch": 0.28, "learning_rate": 0.0016852092291219061, "loss": 2.4444, "step": 10491 }, { "epoch": 0.28, "learning_rate": 0.0016851458318530841, "loss": 2.5256, "step": 10492 }, { "epoch": 0.28, "learning_rate": 0.00168508242939372, "loss": 2.7566, "step": 10493 }, { "epoch": 0.28, "learning_rate": 0.001685019021744294, "loss": 2.4033, "step": 10494 }, { "epoch": 0.28, "learning_rate": 0.0016849556089052861, "loss": 2.4783, "step": 10495 }, { "epoch": 0.28, "learning_rate": 0.0016848921908771772, "loss": 2.6983, "step": 10496 }, { "epoch": 0.28, "learning_rate": 0.0016848287676604473, "loss": 2.7577, "step": 10497 }, { "epoch": 0.28, "learning_rate": 0.0016847653392555774, "loss": 2.4033, "step": 10498 }, { "epoch": 0.28, "learning_rate": 0.0016847019056630472, "loss": 2.6875, "step": 10499 }, { "epoch": 0.28, "learning_rate": 0.001684638466883338, "loss": 2.4591, "step": 10500 }, { "epoch": 0.28, "learning_rate": 0.0016845750229169303, "loss": 2.4864, "step": 10501 }, { "epoch": 0.28, "learning_rate": 0.0016845115737643046, "loss": 3.1093, "step": 10502 }, { "epoch": 0.28, "learning_rate": 0.0016844481194259419, "loss": 2.9165, "step": 10503 }, { "epoch": 0.28, "learning_rate": 0.001684384659902322, "loss": 2.5932, "step": 10504 }, { "epoch": 0.28, "learning_rate": 0.0016843211951939265, "loss": 2.3753, "step": 10505 }, { "epoch": 0.28, "learning_rate": 0.0016842577253012362, "loss": 2.1674, "step": 10506 }, { "epoch": 0.28, "learning_rate": 0.0016841942502247313, "loss": 2.8451, "step": 10507 }, { "epoch": 0.28, "learning_rate": 0.0016841307699648933, "loss": 2.5956, "step": 10508 }, { "epoch": 0.28, "learning_rate": 0.001684067284522203, "loss": 2.3098, "step": 10509 }, { "epoch": 0.28, "learning_rate": 0.001684003793897141, "loss": 2.4096, "step": 10510 }, { "epoch": 0.28, "learning_rate": 0.0016839402980901887, "loss": 2.4845, "step": 10511 }, { "epoch": 0.28, "learning_rate": 0.001683876797101827, "loss": 2.648, "step": 10512 }, { "epoch": 0.28, "learning_rate": 0.001683813290932537, "loss": 2.5485, "step": 10513 }, { "epoch": 0.28, "learning_rate": 0.0016837497795827998, "loss": 2.8422, "step": 10514 }, { "epoch": 0.28, "learning_rate": 0.0016836862630530962, "loss": 2.166, "step": 10515 }, { "epoch": 0.28, "learning_rate": 0.001683622741343908, "loss": 2.8346, "step": 10516 }, { "epoch": 0.28, "learning_rate": 0.001683559214455716, "loss": 2.9126, "step": 10517 }, { "epoch": 0.28, "learning_rate": 0.0016834956823890018, "loss": 2.5683, "step": 10518 }, { "epoch": 0.28, "learning_rate": 0.0016834321451442463, "loss": 2.4813, "step": 10519 }, { "epoch": 0.28, "learning_rate": 0.0016833686027219311, "loss": 2.2524, "step": 10520 }, { "epoch": 0.28, "learning_rate": 0.0016833050551225376, "loss": 2.4512, "step": 10521 }, { "epoch": 0.28, "learning_rate": 0.0016832415023465472, "loss": 2.461, "step": 10522 }, { "epoch": 0.28, "learning_rate": 0.001683177944394441, "loss": 2.4319, "step": 10523 }, { "epoch": 0.28, "learning_rate": 0.001683114381266701, "loss": 2.8193, "step": 10524 }, { "epoch": 0.28, "learning_rate": 0.0016830508129638089, "loss": 2.3676, "step": 10525 }, { "epoch": 0.28, "learning_rate": 0.0016829872394862459, "loss": 2.4141, "step": 10526 }, { "epoch": 0.28, "learning_rate": 0.001682923660834493, "loss": 2.1417, "step": 10527 }, { "epoch": 0.28, "learning_rate": 0.0016828600770090333, "loss": 2.83, "step": 10528 }, { "epoch": 0.28, "learning_rate": 0.0016827964880103475, "loss": 2.388, "step": 10529 }, { "epoch": 0.28, "learning_rate": 0.0016827328938389175, "loss": 2.8125, "step": 10530 }, { "epoch": 0.28, "learning_rate": 0.001682669294495225, "loss": 2.336, "step": 10531 }, { "epoch": 0.28, "learning_rate": 0.0016826056899797524, "loss": 2.5291, "step": 10532 }, { "epoch": 0.28, "learning_rate": 0.001682542080292981, "loss": 2.7793, "step": 10533 }, { "epoch": 0.28, "learning_rate": 0.0016824784654353925, "loss": 2.4199, "step": 10534 }, { "epoch": 0.28, "learning_rate": 0.0016824148454074694, "loss": 2.8538, "step": 10535 }, { "epoch": 0.28, "learning_rate": 0.0016823512202096933, "loss": 2.85, "step": 10536 }, { "epoch": 0.28, "learning_rate": 0.001682287589842547, "loss": 2.5521, "step": 10537 }, { "epoch": 0.28, "learning_rate": 0.001682223954306511, "loss": 2.7281, "step": 10538 }, { "epoch": 0.28, "learning_rate": 0.0016821603136020688, "loss": 2.3042, "step": 10539 }, { "epoch": 0.28, "learning_rate": 0.0016820966677297017, "loss": 2.6714, "step": 10540 }, { "epoch": 0.28, "learning_rate": 0.0016820330166898926, "loss": 2.157, "step": 10541 }, { "epoch": 0.28, "learning_rate": 0.001681969360483123, "loss": 2.2446, "step": 10542 }, { "epoch": 0.28, "learning_rate": 0.0016819056991098755, "loss": 2.4453, "step": 10543 }, { "epoch": 0.28, "learning_rate": 0.0016818420325706324, "loss": 2.8109, "step": 10544 }, { "epoch": 0.28, "learning_rate": 0.0016817783608658761, "loss": 2.9851, "step": 10545 }, { "epoch": 0.28, "learning_rate": 0.0016817146839960887, "loss": 2.634, "step": 10546 }, { "epoch": 0.28, "learning_rate": 0.0016816510019617525, "loss": 2.4875, "step": 10547 }, { "epoch": 0.28, "learning_rate": 0.0016815873147633504, "loss": 2.3242, "step": 10548 }, { "epoch": 0.28, "learning_rate": 0.001681523622401365, "loss": 2.7317, "step": 10549 }, { "epoch": 0.28, "learning_rate": 0.001681459924876278, "loss": 2.7371, "step": 10550 }, { "epoch": 0.28, "learning_rate": 0.0016813962221885724, "loss": 2.4116, "step": 10551 }, { "epoch": 0.28, "learning_rate": 0.0016813325143387311, "loss": 2.6136, "step": 10552 }, { "epoch": 0.28, "learning_rate": 0.0016812688013272364, "loss": 2.6238, "step": 10553 }, { "epoch": 0.28, "learning_rate": 0.0016812050831545712, "loss": 2.5407, "step": 10554 }, { "epoch": 0.28, "learning_rate": 0.0016811413598212177, "loss": 2.77, "step": 10555 }, { "epoch": 0.28, "learning_rate": 0.0016810776313276592, "loss": 2.1331, "step": 10556 }, { "epoch": 0.28, "learning_rate": 0.0016810138976743785, "loss": 2.3007, "step": 10557 }, { "epoch": 0.28, "learning_rate": 0.0016809501588618582, "loss": 2.4796, "step": 10558 }, { "epoch": 0.28, "learning_rate": 0.0016808864148905812, "loss": 2.4861, "step": 10559 }, { "epoch": 0.28, "learning_rate": 0.0016808226657610303, "loss": 2.4686, "step": 10560 }, { "epoch": 0.28, "learning_rate": 0.001680758911473689, "loss": 2.7591, "step": 10561 }, { "epoch": 0.28, "learning_rate": 0.0016806951520290396, "loss": 2.7831, "step": 10562 }, { "epoch": 0.28, "learning_rate": 0.0016806313874275654, "loss": 2.5572, "step": 10563 }, { "epoch": 0.28, "learning_rate": 0.0016805676176697495, "loss": 2.8021, "step": 10564 }, { "epoch": 0.28, "learning_rate": 0.0016805038427560753, "loss": 2.6703, "step": 10565 }, { "epoch": 0.28, "learning_rate": 0.0016804400626870253, "loss": 2.8299, "step": 10566 }, { "epoch": 0.28, "learning_rate": 0.001680376277463083, "loss": 2.4071, "step": 10567 }, { "epoch": 0.28, "learning_rate": 0.001680312487084732, "loss": 2.7623, "step": 10568 }, { "epoch": 0.28, "learning_rate": 0.0016802486915524551, "loss": 2.6659, "step": 10569 }, { "epoch": 0.28, "learning_rate": 0.0016801848908667356, "loss": 2.8424, "step": 10570 }, { "epoch": 0.28, "learning_rate": 0.001680121085028057, "loss": 2.5519, "step": 10571 }, { "epoch": 0.28, "learning_rate": 0.0016800572740369028, "loss": 2.7307, "step": 10572 }, { "epoch": 0.28, "learning_rate": 0.001679993457893756, "loss": 2.7002, "step": 10573 }, { "epoch": 0.28, "learning_rate": 0.0016799296365991006, "loss": 2.7388, "step": 10574 }, { "epoch": 0.28, "learning_rate": 0.0016798658101534198, "loss": 2.4174, "step": 10575 }, { "epoch": 0.28, "learning_rate": 0.001679801978557197, "loss": 2.9827, "step": 10576 }, { "epoch": 0.28, "learning_rate": 0.0016797381418109162, "loss": 2.7025, "step": 10577 }, { "epoch": 0.28, "learning_rate": 0.0016796742999150608, "loss": 2.2544, "step": 10578 }, { "epoch": 0.28, "learning_rate": 0.0016796104528701142, "loss": 2.6196, "step": 10579 }, { "epoch": 0.28, "learning_rate": 0.0016795466006765602, "loss": 2.5926, "step": 10580 }, { "epoch": 0.28, "learning_rate": 0.0016794827433348827, "loss": 2.7946, "step": 10581 }, { "epoch": 0.28, "learning_rate": 0.0016794188808455656, "loss": 2.7769, "step": 10582 }, { "epoch": 0.28, "learning_rate": 0.0016793550132090925, "loss": 2.6899, "step": 10583 }, { "epoch": 0.28, "learning_rate": 0.0016792911404259472, "loss": 2.8229, "step": 10584 }, { "epoch": 0.28, "learning_rate": 0.0016792272624966136, "loss": 2.891, "step": 10585 }, { "epoch": 0.28, "learning_rate": 0.001679163379421576, "loss": 2.7574, "step": 10586 }, { "epoch": 0.28, "learning_rate": 0.0016790994912013178, "loss": 2.9504, "step": 10587 }, { "epoch": 0.28, "learning_rate": 0.0016790355978363234, "loss": 2.8555, "step": 10588 }, { "epoch": 0.28, "learning_rate": 0.0016789716993270765, "loss": 1.9101, "step": 10589 }, { "epoch": 0.28, "learning_rate": 0.0016789077956740615, "loss": 3.0115, "step": 10590 }, { "epoch": 0.28, "learning_rate": 0.0016788438868777624, "loss": 2.6773, "step": 10591 }, { "epoch": 0.28, "learning_rate": 0.0016787799729386635, "loss": 2.8765, "step": 10592 }, { "epoch": 0.28, "learning_rate": 0.0016787160538572485, "loss": 2.6328, "step": 10593 }, { "epoch": 0.28, "learning_rate": 0.0016786521296340024, "loss": 2.4433, "step": 10594 }, { "epoch": 0.28, "learning_rate": 0.001678588200269409, "loss": 2.6048, "step": 10595 }, { "epoch": 0.28, "learning_rate": 0.001678524265763953, "loss": 2.6091, "step": 10596 }, { "epoch": 0.28, "learning_rate": 0.001678460326118118, "loss": 2.3051, "step": 10597 }, { "epoch": 0.28, "learning_rate": 0.001678396381332389, "loss": 2.7692, "step": 10598 }, { "epoch": 0.28, "learning_rate": 0.0016783324314072505, "loss": 3.1345, "step": 10599 }, { "epoch": 0.28, "learning_rate": 0.0016782684763431868, "loss": 3.2315, "step": 10600 }, { "epoch": 0.28, "learning_rate": 0.001678204516140682, "loss": 2.792, "step": 10601 }, { "epoch": 0.28, "learning_rate": 0.0016781405508002215, "loss": 2.6175, "step": 10602 }, { "epoch": 0.28, "learning_rate": 0.001678076580322289, "loss": 2.8587, "step": 10603 }, { "epoch": 0.28, "learning_rate": 0.0016780126047073699, "loss": 2.2352, "step": 10604 }, { "epoch": 0.28, "learning_rate": 0.001677948623955948, "loss": 2.8531, "step": 10605 }, { "epoch": 0.29, "learning_rate": 0.0016778846380685092, "loss": 2.1661, "step": 10606 }, { "epoch": 0.29, "learning_rate": 0.0016778206470455374, "loss": 2.6295, "step": 10607 }, { "epoch": 0.29, "learning_rate": 0.0016777566508875174, "loss": 2.8714, "step": 10608 }, { "epoch": 0.29, "learning_rate": 0.0016776926495949338, "loss": 2.387, "step": 10609 }, { "epoch": 0.29, "learning_rate": 0.0016776286431682723, "loss": 2.7164, "step": 10610 }, { "epoch": 0.29, "learning_rate": 0.0016775646316080177, "loss": 2.5402, "step": 10611 }, { "epoch": 0.29, "learning_rate": 0.0016775006149146539, "loss": 2.7974, "step": 10612 }, { "epoch": 0.29, "learning_rate": 0.001677436593088667, "loss": 2.5729, "step": 10613 }, { "epoch": 0.29, "learning_rate": 0.0016773725661305414, "loss": 2.4866, "step": 10614 }, { "epoch": 0.29, "learning_rate": 0.0016773085340407623, "loss": 2.2996, "step": 10615 }, { "epoch": 0.29, "learning_rate": 0.0016772444968198151, "loss": 2.6752, "step": 10616 }, { "epoch": 0.29, "learning_rate": 0.0016771804544681843, "loss": 2.6697, "step": 10617 }, { "epoch": 0.29, "learning_rate": 0.001677116406986356, "loss": 2.6795, "step": 10618 }, { "epoch": 0.29, "learning_rate": 0.0016770523543748145, "loss": 2.0767, "step": 10619 }, { "epoch": 0.29, "learning_rate": 0.0016769882966340454, "loss": 2.5212, "step": 10620 }, { "epoch": 0.29, "learning_rate": 0.001676924233764534, "loss": 2.4684, "step": 10621 }, { "epoch": 0.29, "learning_rate": 0.0016768601657667656, "loss": 2.5946, "step": 10622 }, { "epoch": 0.29, "learning_rate": 0.0016767960926412256, "loss": 2.6985, "step": 10623 }, { "epoch": 0.29, "learning_rate": 0.0016767320143883993, "loss": 2.7007, "step": 10624 }, { "epoch": 0.29, "learning_rate": 0.0016766679310087724, "loss": 2.4936, "step": 10625 }, { "epoch": 0.29, "learning_rate": 0.0016766038425028303, "loss": 2.3994, "step": 10626 }, { "epoch": 0.29, "learning_rate": 0.0016765397488710586, "loss": 2.1576, "step": 10627 }, { "epoch": 0.29, "learning_rate": 0.0016764756501139423, "loss": 2.5711, "step": 10628 }, { "epoch": 0.29, "learning_rate": 0.0016764115462319675, "loss": 2.6435, "step": 10629 }, { "epoch": 0.29, "learning_rate": 0.00167634743722562, "loss": 2.2119, "step": 10630 }, { "epoch": 0.29, "learning_rate": 0.0016762833230953853, "loss": 2.3256, "step": 10631 }, { "epoch": 0.29, "learning_rate": 0.0016762192038417484, "loss": 2.2982, "step": 10632 }, { "epoch": 0.29, "learning_rate": 0.0016761550794651965, "loss": 2.6809, "step": 10633 }, { "epoch": 0.29, "learning_rate": 0.0016760909499662143, "loss": 2.378, "step": 10634 }, { "epoch": 0.29, "learning_rate": 0.001676026815345288, "loss": 2.2476, "step": 10635 }, { "epoch": 0.29, "learning_rate": 0.001675962675602903, "loss": 2.1468, "step": 10636 }, { "epoch": 0.29, "learning_rate": 0.001675898530739546, "loss": 2.51, "step": 10637 }, { "epoch": 0.29, "learning_rate": 0.0016758343807557025, "loss": 2.6937, "step": 10638 }, { "epoch": 0.29, "learning_rate": 0.0016757702256518588, "loss": 2.5878, "step": 10639 }, { "epoch": 0.29, "learning_rate": 0.0016757060654285004, "loss": 3.1159, "step": 10640 }, { "epoch": 0.29, "learning_rate": 0.0016756419000861136, "loss": 2.6618, "step": 10641 }, { "epoch": 0.29, "learning_rate": 0.0016755777296251848, "loss": 2.8403, "step": 10642 }, { "epoch": 0.29, "learning_rate": 0.0016755135540461995, "loss": 2.5396, "step": 10643 }, { "epoch": 0.29, "learning_rate": 0.0016754493733496445, "loss": 2.4652, "step": 10644 }, { "epoch": 0.29, "learning_rate": 0.001675385187536006, "loss": 2.7595, "step": 10645 }, { "epoch": 0.29, "learning_rate": 0.00167532099660577, "loss": 2.6935, "step": 10646 }, { "epoch": 0.29, "learning_rate": 0.0016752568005594225, "loss": 2.3783, "step": 10647 }, { "epoch": 0.29, "learning_rate": 0.0016751925993974508, "loss": 2.5107, "step": 10648 }, { "epoch": 0.29, "learning_rate": 0.0016751283931203402, "loss": 2.3395, "step": 10649 }, { "epoch": 0.29, "learning_rate": 0.001675064181728578, "loss": 2.3425, "step": 10650 }, { "epoch": 0.29, "learning_rate": 0.00167499996522265, "loss": 2.4108, "step": 10651 }, { "epoch": 0.29, "learning_rate": 0.0016749357436030429, "loss": 2.6567, "step": 10652 }, { "epoch": 0.29, "learning_rate": 0.0016748715168702433, "loss": 2.6925, "step": 10653 }, { "epoch": 0.29, "learning_rate": 0.0016748072850247377, "loss": 2.6071, "step": 10654 }, { "epoch": 0.29, "learning_rate": 0.0016747430480670128, "loss": 2.2557, "step": 10655 }, { "epoch": 0.29, "learning_rate": 0.0016746788059975553, "loss": 2.302, "step": 10656 }, { "epoch": 0.29, "learning_rate": 0.0016746145588168518, "loss": 2.7356, "step": 10657 }, { "epoch": 0.29, "learning_rate": 0.001674550306525389, "loss": 2.8669, "step": 10658 }, { "epoch": 0.29, "learning_rate": 0.0016744860491236535, "loss": 2.8394, "step": 10659 }, { "epoch": 0.29, "learning_rate": 0.0016744217866121324, "loss": 2.9507, "step": 10660 }, { "epoch": 0.29, "learning_rate": 0.0016743575189913122, "loss": 2.9143, "step": 10661 }, { "epoch": 0.29, "learning_rate": 0.0016742932462616804, "loss": 2.5421, "step": 10662 }, { "epoch": 0.29, "learning_rate": 0.0016742289684237232, "loss": 2.4723, "step": 10663 }, { "epoch": 0.29, "learning_rate": 0.001674164685477928, "loss": 2.601, "step": 10664 }, { "epoch": 0.29, "learning_rate": 0.0016741003974247816, "loss": 2.809, "step": 10665 }, { "epoch": 0.29, "learning_rate": 0.0016740361042647714, "loss": 2.8168, "step": 10666 }, { "epoch": 0.29, "learning_rate": 0.001673971805998384, "loss": 2.0656, "step": 10667 }, { "epoch": 0.29, "learning_rate": 0.0016739075026261064, "loss": 2.4231, "step": 10668 }, { "epoch": 0.29, "learning_rate": 0.0016738431941484264, "loss": 2.6283, "step": 10669 }, { "epoch": 0.29, "learning_rate": 0.0016737788805658309, "loss": 2.2933, "step": 10670 }, { "epoch": 0.29, "learning_rate": 0.0016737145618788067, "loss": 2.5299, "step": 10671 }, { "epoch": 0.29, "learning_rate": 0.0016736502380878418, "loss": 2.5628, "step": 10672 }, { "epoch": 0.29, "learning_rate": 0.0016735859091934228, "loss": 2.3754, "step": 10673 }, { "epoch": 0.29, "learning_rate": 0.0016735215751960376, "loss": 2.7537, "step": 10674 }, { "epoch": 0.29, "learning_rate": 0.0016734572360961734, "loss": 2.1017, "step": 10675 }, { "epoch": 0.29, "learning_rate": 0.0016733928918943174, "loss": 3.0275, "step": 10676 }, { "epoch": 0.29, "learning_rate": 0.0016733285425909572, "loss": 2.3917, "step": 10677 }, { "epoch": 0.29, "learning_rate": 0.0016732641881865807, "loss": 2.4969, "step": 10678 }, { "epoch": 0.29, "learning_rate": 0.0016731998286816747, "loss": 2.9961, "step": 10679 }, { "epoch": 0.29, "learning_rate": 0.0016731354640767272, "loss": 2.4156, "step": 10680 }, { "epoch": 0.29, "learning_rate": 0.001673071094372226, "loss": 2.77, "step": 10681 }, { "epoch": 0.29, "learning_rate": 0.0016730067195686582, "loss": 2.9187, "step": 10682 }, { "epoch": 0.29, "learning_rate": 0.001672942339666512, "loss": 1.9575, "step": 10683 }, { "epoch": 0.29, "learning_rate": 0.0016728779546662752, "loss": 2.8575, "step": 10684 }, { "epoch": 0.29, "learning_rate": 0.0016728135645684347, "loss": 2.7714, "step": 10685 }, { "epoch": 0.29, "learning_rate": 0.0016727491693734793, "loss": 2.3255, "step": 10686 }, { "epoch": 0.29, "learning_rate": 0.0016726847690818967, "loss": 2.1434, "step": 10687 }, { "epoch": 0.29, "learning_rate": 0.001672620363694174, "loss": 2.4304, "step": 10688 }, { "epoch": 0.29, "learning_rate": 0.0016725559532108, "loss": 2.4629, "step": 10689 }, { "epoch": 0.29, "learning_rate": 0.0016724915376322622, "loss": 2.7845, "step": 10690 }, { "epoch": 0.29, "learning_rate": 0.001672427116959049, "loss": 2.4468, "step": 10691 }, { "epoch": 0.29, "learning_rate": 0.0016723626911916481, "loss": 2.6931, "step": 10692 }, { "epoch": 0.29, "learning_rate": 0.001672298260330548, "loss": 2.2591, "step": 10693 }, { "epoch": 0.29, "learning_rate": 0.0016722338243762356, "loss": 2.3671, "step": 10694 }, { "epoch": 0.29, "learning_rate": 0.0016721693833292007, "loss": 2.7104, "step": 10695 }, { "epoch": 0.29, "learning_rate": 0.0016721049371899303, "loss": 2.6306, "step": 10696 }, { "epoch": 0.29, "learning_rate": 0.0016720404859589132, "loss": 3.0381, "step": 10697 }, { "epoch": 0.29, "learning_rate": 0.0016719760296366375, "loss": 2.5739, "step": 10698 }, { "epoch": 0.29, "learning_rate": 0.0016719115682235915, "loss": 2.9339, "step": 10699 }, { "epoch": 0.29, "learning_rate": 0.001671847101720264, "loss": 2.7113, "step": 10700 }, { "epoch": 0.29, "learning_rate": 0.0016717826301271424, "loss": 2.7824, "step": 10701 }, { "epoch": 0.29, "learning_rate": 0.001671718153444716, "loss": 2.7313, "step": 10702 }, { "epoch": 0.29, "learning_rate": 0.0016716536716734726, "loss": 2.5285, "step": 10703 }, { "epoch": 0.29, "learning_rate": 0.0016715891848139016, "loss": 2.581, "step": 10704 }, { "epoch": 0.29, "learning_rate": 0.0016715246928664907, "loss": 2.6267, "step": 10705 }, { "epoch": 0.29, "learning_rate": 0.0016714601958317285, "loss": 2.2097, "step": 10706 }, { "epoch": 0.29, "learning_rate": 0.0016713956937101045, "loss": 2.9222, "step": 10707 }, { "epoch": 0.29, "learning_rate": 0.0016713311865021066, "loss": 2.5857, "step": 10708 }, { "epoch": 0.29, "learning_rate": 0.0016712666742082233, "loss": 2.4906, "step": 10709 }, { "epoch": 0.29, "learning_rate": 0.001671202156828944, "loss": 2.3989, "step": 10710 }, { "epoch": 0.29, "learning_rate": 0.0016711376343647572, "loss": 2.8254, "step": 10711 }, { "epoch": 0.29, "learning_rate": 0.0016710731068161513, "loss": 2.433, "step": 10712 }, { "epoch": 0.29, "learning_rate": 0.0016710085741836159, "loss": 2.7728, "step": 10713 }, { "epoch": 0.29, "learning_rate": 0.0016709440364676394, "loss": 2.4453, "step": 10714 }, { "epoch": 0.29, "learning_rate": 0.0016708794936687108, "loss": 2.757, "step": 10715 }, { "epoch": 0.29, "learning_rate": 0.0016708149457873192, "loss": 2.7371, "step": 10716 }, { "epoch": 0.29, "learning_rate": 0.0016707503928239534, "loss": 2.4535, "step": 10717 }, { "epoch": 0.29, "learning_rate": 0.0016706858347791025, "loss": 2.6297, "step": 10718 }, { "epoch": 0.29, "learning_rate": 0.0016706212716532556, "loss": 3.2479, "step": 10719 }, { "epoch": 0.29, "learning_rate": 0.001670556703446902, "loss": 2.5559, "step": 10720 }, { "epoch": 0.29, "learning_rate": 0.0016704921301605306, "loss": 3.0687, "step": 10721 }, { "epoch": 0.29, "learning_rate": 0.0016704275517946305, "loss": 2.4717, "step": 10722 }, { "epoch": 0.29, "learning_rate": 0.0016703629683496916, "loss": 2.3781, "step": 10723 }, { "epoch": 0.29, "learning_rate": 0.0016702983798262024, "loss": 2.5887, "step": 10724 }, { "epoch": 0.29, "learning_rate": 0.0016702337862246526, "loss": 3.0988, "step": 10725 }, { "epoch": 0.29, "learning_rate": 0.0016701691875455314, "loss": 2.3373, "step": 10726 }, { "epoch": 0.29, "learning_rate": 0.0016701045837893282, "loss": 2.2528, "step": 10727 }, { "epoch": 0.29, "learning_rate": 0.0016700399749565327, "loss": 2.2678, "step": 10728 }, { "epoch": 0.29, "learning_rate": 0.001669975361047634, "loss": 2.4171, "step": 10729 }, { "epoch": 0.29, "learning_rate": 0.0016699107420631216, "loss": 2.879, "step": 10730 }, { "epoch": 0.29, "learning_rate": 0.0016698461180034855, "loss": 2.0872, "step": 10731 }, { "epoch": 0.29, "learning_rate": 0.0016697814888692146, "loss": 2.7238, "step": 10732 }, { "epoch": 0.29, "learning_rate": 0.001669716854660799, "loss": 2.4206, "step": 10733 }, { "epoch": 0.29, "learning_rate": 0.0016696522153787283, "loss": 2.9171, "step": 10734 }, { "epoch": 0.29, "learning_rate": 0.0016695875710234925, "loss": 3.0632, "step": 10735 }, { "epoch": 0.29, "learning_rate": 0.0016695229215955806, "loss": 2.3857, "step": 10736 }, { "epoch": 0.29, "learning_rate": 0.0016694582670954826, "loss": 2.3038, "step": 10737 }, { "epoch": 0.29, "learning_rate": 0.0016693936075236886, "loss": 2.8217, "step": 10738 }, { "epoch": 0.29, "learning_rate": 0.0016693289428806883, "loss": 2.6506, "step": 10739 }, { "epoch": 0.29, "learning_rate": 0.0016692642731669718, "loss": 2.5269, "step": 10740 }, { "epoch": 0.29, "learning_rate": 0.0016691995983830284, "loss": 2.2851, "step": 10741 }, { "epoch": 0.29, "learning_rate": 0.001669134918529349, "loss": 2.5348, "step": 10742 }, { "epoch": 0.29, "learning_rate": 0.0016690702336064228, "loss": 2.6794, "step": 10743 }, { "epoch": 0.29, "learning_rate": 0.0016690055436147401, "loss": 2.7917, "step": 10744 }, { "epoch": 0.29, "learning_rate": 0.001668940848554791, "loss": 3.0801, "step": 10745 }, { "epoch": 0.29, "learning_rate": 0.001668876148427066, "loss": 2.6016, "step": 10746 }, { "epoch": 0.29, "learning_rate": 0.0016688114432320542, "loss": 2.3967, "step": 10747 }, { "epoch": 0.29, "learning_rate": 0.001668746732970247, "loss": 2.5715, "step": 10748 }, { "epoch": 0.29, "learning_rate": 0.0016686820176421337, "loss": 2.2069, "step": 10749 }, { "epoch": 0.29, "learning_rate": 0.0016686172972482055, "loss": 2.7778, "step": 10750 }, { "epoch": 0.29, "learning_rate": 0.001668552571788952, "loss": 2.374, "step": 10751 }, { "epoch": 0.29, "learning_rate": 0.0016684878412648637, "loss": 2.7699, "step": 10752 }, { "epoch": 0.29, "learning_rate": 0.001668423105676431, "loss": 2.6158, "step": 10753 }, { "epoch": 0.29, "learning_rate": 0.0016683583650241444, "loss": 2.7023, "step": 10754 }, { "epoch": 0.29, "learning_rate": 0.0016682936193084942, "loss": 2.4203, "step": 10755 }, { "epoch": 0.29, "learning_rate": 0.001668228868529971, "loss": 2.2517, "step": 10756 }, { "epoch": 0.29, "learning_rate": 0.0016681641126890655, "loss": 2.7517, "step": 10757 }, { "epoch": 0.29, "learning_rate": 0.001668099351786268, "loss": 2.7903, "step": 10758 }, { "epoch": 0.29, "learning_rate": 0.0016680345858220696, "loss": 2.869, "step": 10759 }, { "epoch": 0.29, "learning_rate": 0.00166796981479696, "loss": 2.1836, "step": 10760 }, { "epoch": 0.29, "learning_rate": 0.001667905038711431, "loss": 2.478, "step": 10761 }, { "epoch": 0.29, "learning_rate": 0.0016678402575659725, "loss": 2.5991, "step": 10762 }, { "epoch": 0.29, "learning_rate": 0.0016677754713610763, "loss": 2.8677, "step": 10763 }, { "epoch": 0.29, "learning_rate": 0.0016677106800972318, "loss": 2.3533, "step": 10764 }, { "epoch": 0.29, "learning_rate": 0.0016676458837749308, "loss": 2.7708, "step": 10765 }, { "epoch": 0.29, "learning_rate": 0.001667581082394664, "loss": 2.3196, "step": 10766 }, { "epoch": 0.29, "learning_rate": 0.0016675162759569222, "loss": 2.3919, "step": 10767 }, { "epoch": 0.29, "learning_rate": 0.0016674514644621963, "loss": 2.4606, "step": 10768 }, { "epoch": 0.29, "learning_rate": 0.0016673866479109776, "loss": 2.4858, "step": 10769 }, { "epoch": 0.29, "learning_rate": 0.001667321826303757, "loss": 2.2862, "step": 10770 }, { "epoch": 0.29, "learning_rate": 0.0016672569996410255, "loss": 2.6743, "step": 10771 }, { "epoch": 0.29, "learning_rate": 0.0016671921679232743, "loss": 2.6192, "step": 10772 }, { "epoch": 0.29, "learning_rate": 0.0016671273311509944, "loss": 2.3468, "step": 10773 }, { "epoch": 0.29, "learning_rate": 0.0016670624893246773, "loss": 2.5957, "step": 10774 }, { "epoch": 0.29, "learning_rate": 0.001666997642444814, "loss": 2.4061, "step": 10775 }, { "epoch": 0.29, "learning_rate": 0.0016669327905118956, "loss": 2.591, "step": 10776 }, { "epoch": 0.29, "learning_rate": 0.0016668679335264138, "loss": 2.5466, "step": 10777 }, { "epoch": 0.29, "learning_rate": 0.00166680307148886, "loss": 2.8213, "step": 10778 }, { "epoch": 0.29, "learning_rate": 0.0016667382043997249, "loss": 2.6505, "step": 10779 }, { "epoch": 0.29, "learning_rate": 0.0016666733322595005, "loss": 2.5338, "step": 10780 }, { "epoch": 0.29, "learning_rate": 0.0016666084550686782, "loss": 2.5852, "step": 10781 }, { "epoch": 0.29, "learning_rate": 0.0016665435728277494, "loss": 2.6427, "step": 10782 }, { "epoch": 0.29, "learning_rate": 0.0016664786855372057, "loss": 3.0527, "step": 10783 }, { "epoch": 0.29, "learning_rate": 0.0016664137931975383, "loss": 2.9225, "step": 10784 }, { "epoch": 0.29, "learning_rate": 0.0016663488958092395, "loss": 2.3415, "step": 10785 }, { "epoch": 0.29, "learning_rate": 0.0016662839933728006, "loss": 2.9203, "step": 10786 }, { "epoch": 0.29, "learning_rate": 0.0016662190858887135, "loss": 2.8597, "step": 10787 }, { "epoch": 0.29, "learning_rate": 0.001666154173357469, "loss": 2.5012, "step": 10788 }, { "epoch": 0.29, "learning_rate": 0.0016660892557795602, "loss": 2.4358, "step": 10789 }, { "epoch": 0.29, "learning_rate": 0.0016660243331554781, "loss": 2.6471, "step": 10790 }, { "epoch": 0.29, "learning_rate": 0.0016659594054857147, "loss": 2.4178, "step": 10791 }, { "epoch": 0.29, "learning_rate": 0.0016658944727707618, "loss": 2.4973, "step": 10792 }, { "epoch": 0.29, "learning_rate": 0.0016658295350111115, "loss": 2.5889, "step": 10793 }, { "epoch": 0.29, "learning_rate": 0.001665764592207256, "loss": 2.2809, "step": 10794 }, { "epoch": 0.29, "learning_rate": 0.0016656996443596866, "loss": 2.3583, "step": 10795 }, { "epoch": 0.29, "learning_rate": 0.0016656346914688959, "loss": 2.5805, "step": 10796 }, { "epoch": 0.29, "learning_rate": 0.0016655697335353754, "loss": 2.9142, "step": 10797 }, { "epoch": 0.29, "learning_rate": 0.001665504770559618, "loss": 2.6312, "step": 10798 }, { "epoch": 0.29, "learning_rate": 0.0016654398025421151, "loss": 2.6328, "step": 10799 }, { "epoch": 0.29, "learning_rate": 0.0016653748294833597, "loss": 2.33, "step": 10800 }, { "epoch": 0.29, "learning_rate": 0.0016653098513838432, "loss": 2.4053, "step": 10801 }, { "epoch": 0.29, "learning_rate": 0.0016652448682440584, "loss": 2.7442, "step": 10802 }, { "epoch": 0.29, "learning_rate": 0.0016651798800644973, "loss": 2.5017, "step": 10803 }, { "epoch": 0.29, "learning_rate": 0.0016651148868456526, "loss": 2.6919, "step": 10804 }, { "epoch": 0.29, "learning_rate": 0.001665049888588016, "loss": 2.7752, "step": 10805 }, { "epoch": 0.29, "learning_rate": 0.0016649848852920805, "loss": 2.2618, "step": 10806 }, { "epoch": 0.29, "learning_rate": 0.0016649198769583381, "loss": 2.196, "step": 10807 }, { "epoch": 0.29, "learning_rate": 0.0016648548635872823, "loss": 2.5298, "step": 10808 }, { "epoch": 0.29, "learning_rate": 0.0016647898451794046, "loss": 2.2009, "step": 10809 }, { "epoch": 0.29, "learning_rate": 0.0016647248217351977, "loss": 2.6708, "step": 10810 }, { "epoch": 0.29, "learning_rate": 0.0016646597932551547, "loss": 2.4042, "step": 10811 }, { "epoch": 0.29, "learning_rate": 0.0016645947597397678, "loss": 2.4768, "step": 10812 }, { "epoch": 0.29, "learning_rate": 0.0016645297211895296, "loss": 2.153, "step": 10813 }, { "epoch": 0.29, "learning_rate": 0.0016644646776049331, "loss": 2.5335, "step": 10814 }, { "epoch": 0.29, "learning_rate": 0.0016643996289864714, "loss": 3.215, "step": 10815 }, { "epoch": 0.29, "learning_rate": 0.0016643345753346367, "loss": 3.0296, "step": 10816 }, { "epoch": 0.29, "learning_rate": 0.0016642695166499218, "loss": 2.9115, "step": 10817 }, { "epoch": 0.29, "learning_rate": 0.00166420445293282, "loss": 2.6298, "step": 10818 }, { "epoch": 0.29, "learning_rate": 0.0016641393841838239, "loss": 3.0633, "step": 10819 }, { "epoch": 0.29, "learning_rate": 0.0016640743104034265, "loss": 2.658, "step": 10820 }, { "epoch": 0.29, "learning_rate": 0.001664009231592121, "loss": 2.3717, "step": 10821 }, { "epoch": 0.29, "learning_rate": 0.0016639441477504003, "loss": 2.819, "step": 10822 }, { "epoch": 0.29, "learning_rate": 0.0016638790588787574, "loss": 2.8666, "step": 10823 }, { "epoch": 0.29, "learning_rate": 0.0016638139649776855, "loss": 2.9136, "step": 10824 }, { "epoch": 0.29, "learning_rate": 0.0016637488660476776, "loss": 2.5403, "step": 10825 }, { "epoch": 0.29, "learning_rate": 0.0016636837620892268, "loss": 2.489, "step": 10826 }, { "epoch": 0.29, "learning_rate": 0.0016636186531028265, "loss": 2.5385, "step": 10827 }, { "epoch": 0.29, "learning_rate": 0.0016635535390889702, "loss": 2.615, "step": 10828 }, { "epoch": 0.29, "learning_rate": 0.001663488420048151, "loss": 3.0174, "step": 10829 }, { "epoch": 0.29, "learning_rate": 0.0016634232959808618, "loss": 2.5515, "step": 10830 }, { "epoch": 0.29, "learning_rate": 0.0016633581668875964, "loss": 2.6171, "step": 10831 }, { "epoch": 0.29, "learning_rate": 0.0016632930327688483, "loss": 2.8094, "step": 10832 }, { "epoch": 0.29, "learning_rate": 0.0016632278936251105, "loss": 2.8756, "step": 10833 }, { "epoch": 0.29, "learning_rate": 0.001663162749456877, "loss": 2.7354, "step": 10834 }, { "epoch": 0.29, "learning_rate": 0.001663097600264641, "loss": 2.4424, "step": 10835 }, { "epoch": 0.29, "learning_rate": 0.0016630324460488962, "loss": 3.1285, "step": 10836 }, { "epoch": 0.29, "learning_rate": 0.001662967286810136, "loss": 2.1288, "step": 10837 }, { "epoch": 0.29, "learning_rate": 0.001662902122548854, "loss": 2.4914, "step": 10838 }, { "epoch": 0.29, "learning_rate": 0.0016628369532655442, "loss": 1.8698, "step": 10839 }, { "epoch": 0.29, "learning_rate": 0.0016627717789607002, "loss": 2.3125, "step": 10840 }, { "epoch": 0.29, "learning_rate": 0.0016627065996348159, "loss": 2.8216, "step": 10841 }, { "epoch": 0.29, "learning_rate": 0.0016626414152883845, "loss": 2.4962, "step": 10842 }, { "epoch": 0.29, "learning_rate": 0.0016625762259219004, "loss": 3.1005, "step": 10843 }, { "epoch": 0.29, "learning_rate": 0.0016625110315358575, "loss": 2.6582, "step": 10844 }, { "epoch": 0.29, "learning_rate": 0.0016624458321307489, "loss": 2.4052, "step": 10845 }, { "epoch": 0.29, "learning_rate": 0.0016623806277070695, "loss": 2.7704, "step": 10846 }, { "epoch": 0.29, "learning_rate": 0.0016623154182653127, "loss": 2.6625, "step": 10847 }, { "epoch": 0.29, "learning_rate": 0.0016622502038059728, "loss": 2.4682, "step": 10848 }, { "epoch": 0.29, "learning_rate": 0.001662184984329544, "loss": 2.8011, "step": 10849 }, { "epoch": 0.29, "learning_rate": 0.0016621197598365195, "loss": 2.3911, "step": 10850 }, { "epoch": 0.29, "learning_rate": 0.0016620545303273947, "loss": 2.0257, "step": 10851 }, { "epoch": 0.29, "learning_rate": 0.001661989295802663, "loss": 2.9005, "step": 10852 }, { "epoch": 0.29, "learning_rate": 0.0016619240562628186, "loss": 2.7717, "step": 10853 }, { "epoch": 0.29, "learning_rate": 0.001661858811708356, "loss": 2.4159, "step": 10854 }, { "epoch": 0.29, "learning_rate": 0.0016617935621397694, "loss": 2.3249, "step": 10855 }, { "epoch": 0.29, "learning_rate": 0.001661728307557553, "loss": 2.7006, "step": 10856 }, { "epoch": 0.29, "learning_rate": 0.0016616630479622013, "loss": 2.5745, "step": 10857 }, { "epoch": 0.29, "learning_rate": 0.0016615977833542084, "loss": 2.7469, "step": 10858 }, { "epoch": 0.29, "learning_rate": 0.0016615325137340692, "loss": 2.8377, "step": 10859 }, { "epoch": 0.29, "learning_rate": 0.0016614672391022781, "loss": 2.7008, "step": 10860 }, { "epoch": 0.29, "learning_rate": 0.0016614019594593293, "loss": 2.8149, "step": 10861 }, { "epoch": 0.29, "learning_rate": 0.0016613366748057174, "loss": 2.7961, "step": 10862 }, { "epoch": 0.29, "learning_rate": 0.0016612713851419372, "loss": 2.9059, "step": 10863 }, { "epoch": 0.29, "learning_rate": 0.001661206090468483, "loss": 2.4801, "step": 10864 }, { "epoch": 0.29, "learning_rate": 0.0016611407907858502, "loss": 2.344, "step": 10865 }, { "epoch": 0.29, "learning_rate": 0.0016610754860945326, "loss": 2.5755, "step": 10866 }, { "epoch": 0.29, "learning_rate": 0.0016610101763950252, "loss": 2.728, "step": 10867 }, { "epoch": 0.29, "learning_rate": 0.001660944861687823, "loss": 2.7008, "step": 10868 }, { "epoch": 0.29, "learning_rate": 0.0016608795419734209, "loss": 2.6034, "step": 10869 }, { "epoch": 0.29, "learning_rate": 0.0016608142172523134, "loss": 2.4629, "step": 10870 }, { "epoch": 0.29, "learning_rate": 0.0016607488875249952, "loss": 2.6608, "step": 10871 }, { "epoch": 0.29, "learning_rate": 0.0016606835527919622, "loss": 2.4731, "step": 10872 }, { "epoch": 0.29, "learning_rate": 0.001660618213053708, "loss": 2.4788, "step": 10873 }, { "epoch": 0.29, "learning_rate": 0.0016605528683107287, "loss": 2.4157, "step": 10874 }, { "epoch": 0.29, "learning_rate": 0.0016604875185635192, "loss": 2.8027, "step": 10875 }, { "epoch": 0.29, "learning_rate": 0.0016604221638125741, "loss": 2.4106, "step": 10876 }, { "epoch": 0.29, "learning_rate": 0.0016603568040583884, "loss": 2.6739, "step": 10877 }, { "epoch": 0.29, "learning_rate": 0.0016602914393014582, "loss": 2.4727, "step": 10878 }, { "epoch": 0.29, "learning_rate": 0.0016602260695422779, "loss": 2.9395, "step": 10879 }, { "epoch": 0.29, "learning_rate": 0.001660160694781343, "loss": 2.2689, "step": 10880 }, { "epoch": 0.29, "learning_rate": 0.0016600953150191485, "loss": 2.9776, "step": 10881 }, { "epoch": 0.29, "learning_rate": 0.0016600299302561902, "loss": 2.4865, "step": 10882 }, { "epoch": 0.29, "learning_rate": 0.0016599645404929628, "loss": 2.3038, "step": 10883 }, { "epoch": 0.29, "learning_rate": 0.0016598991457299622, "loss": 2.814, "step": 10884 }, { "epoch": 0.29, "learning_rate": 0.0016598337459676836, "loss": 2.4566, "step": 10885 }, { "epoch": 0.29, "learning_rate": 0.0016597683412066227, "loss": 2.4657, "step": 10886 }, { "epoch": 0.29, "learning_rate": 0.0016597029314472747, "loss": 2.2652, "step": 10887 }, { "epoch": 0.29, "learning_rate": 0.0016596375166901352, "loss": 2.6494, "step": 10888 }, { "epoch": 0.29, "learning_rate": 0.0016595720969356997, "loss": 2.6014, "step": 10889 }, { "epoch": 0.29, "learning_rate": 0.001659506672184464, "loss": 2.4254, "step": 10890 }, { "epoch": 0.29, "learning_rate": 0.0016594412424369238, "loss": 3.0045, "step": 10891 }, { "epoch": 0.29, "learning_rate": 0.0016593758076935746, "loss": 2.986, "step": 10892 }, { "epoch": 0.29, "learning_rate": 0.001659310367954912, "loss": 2.1794, "step": 10893 }, { "epoch": 0.29, "learning_rate": 0.0016592449232214319, "loss": 2.6552, "step": 10894 }, { "epoch": 0.29, "learning_rate": 0.0016591794734936306, "loss": 2.2801, "step": 10895 }, { "epoch": 0.29, "learning_rate": 0.0016591140187720028, "loss": 2.3946, "step": 10896 }, { "epoch": 0.29, "learning_rate": 0.0016590485590570454, "loss": 2.597, "step": 10897 }, { "epoch": 0.29, "learning_rate": 0.0016589830943492538, "loss": 2.9431, "step": 10898 }, { "epoch": 0.29, "learning_rate": 0.0016589176246491243, "loss": 2.4325, "step": 10899 }, { "epoch": 0.29, "learning_rate": 0.0016588521499571528, "loss": 3.0313, "step": 10900 }, { "epoch": 0.29, "learning_rate": 0.0016587866702738347, "loss": 2.7026, "step": 10901 }, { "epoch": 0.29, "learning_rate": 0.0016587211855996669, "loss": 2.3675, "step": 10902 }, { "epoch": 0.29, "learning_rate": 0.001658655695935145, "loss": 2.4577, "step": 10903 }, { "epoch": 0.29, "learning_rate": 0.0016585902012807654, "loss": 2.7528, "step": 10904 }, { "epoch": 0.29, "learning_rate": 0.0016585247016370243, "loss": 3.1535, "step": 10905 }, { "epoch": 0.29, "learning_rate": 0.0016584591970044177, "loss": 2.741, "step": 10906 }, { "epoch": 0.29, "learning_rate": 0.0016583936873834418, "loss": 2.6327, "step": 10907 }, { "epoch": 0.29, "learning_rate": 0.001658328172774593, "loss": 2.9838, "step": 10908 }, { "epoch": 0.29, "learning_rate": 0.001658262653178368, "loss": 2.6343, "step": 10909 }, { "epoch": 0.29, "learning_rate": 0.0016581971285952626, "loss": 2.4497, "step": 10910 }, { "epoch": 0.29, "learning_rate": 0.0016581315990257734, "loss": 2.4674, "step": 10911 }, { "epoch": 0.29, "learning_rate": 0.0016580660644703968, "loss": 2.8241, "step": 10912 }, { "epoch": 0.29, "learning_rate": 0.0016580005249296295, "loss": 2.4662, "step": 10913 }, { "epoch": 0.29, "learning_rate": 0.0016579349804039679, "loss": 2.1283, "step": 10914 }, { "epoch": 0.29, "learning_rate": 0.0016578694308939086, "loss": 2.3843, "step": 10915 }, { "epoch": 0.29, "learning_rate": 0.0016578038763999479, "loss": 2.3141, "step": 10916 }, { "epoch": 0.29, "learning_rate": 0.0016577383169225825, "loss": 2.4966, "step": 10917 }, { "epoch": 0.29, "learning_rate": 0.0016576727524623097, "loss": 2.722, "step": 10918 }, { "epoch": 0.29, "learning_rate": 0.0016576071830196252, "loss": 2.6763, "step": 10919 }, { "epoch": 0.29, "learning_rate": 0.0016575416085950266, "loss": 2.5372, "step": 10920 }, { "epoch": 0.29, "learning_rate": 0.0016574760291890103, "loss": 2.5151, "step": 10921 }, { "epoch": 0.29, "learning_rate": 0.001657410444802073, "loss": 2.7417, "step": 10922 }, { "epoch": 0.29, "learning_rate": 0.0016573448554347116, "loss": 2.9085, "step": 10923 }, { "epoch": 0.29, "learning_rate": 0.0016572792610874232, "loss": 2.3873, "step": 10924 }, { "epoch": 0.29, "learning_rate": 0.001657213661760705, "loss": 2.4545, "step": 10925 }, { "epoch": 0.29, "learning_rate": 0.001657148057455053, "loss": 2.5985, "step": 10926 }, { "epoch": 0.29, "learning_rate": 0.0016570824481709652, "loss": 1.9736, "step": 10927 }, { "epoch": 0.29, "learning_rate": 0.001657016833908938, "loss": 2.6804, "step": 10928 }, { "epoch": 0.29, "learning_rate": 0.0016569512146694687, "loss": 2.3592, "step": 10929 }, { "epoch": 0.29, "learning_rate": 0.0016568855904530548, "loss": 2.7802, "step": 10930 }, { "epoch": 0.29, "learning_rate": 0.0016568199612601929, "loss": 2.7804, "step": 10931 }, { "epoch": 0.29, "learning_rate": 0.0016567543270913805, "loss": 2.6767, "step": 10932 }, { "epoch": 0.29, "learning_rate": 0.0016566886879471146, "loss": 2.1644, "step": 10933 }, { "epoch": 0.29, "learning_rate": 0.0016566230438278926, "loss": 2.3954, "step": 10934 }, { "epoch": 0.29, "learning_rate": 0.0016565573947342118, "loss": 2.8358, "step": 10935 }, { "epoch": 0.29, "learning_rate": 0.00165649174066657, "loss": 2.621, "step": 10936 }, { "epoch": 0.29, "learning_rate": 0.0016564260816254635, "loss": 2.4216, "step": 10937 }, { "epoch": 0.29, "learning_rate": 0.0016563604176113907, "loss": 2.7518, "step": 10938 }, { "epoch": 0.29, "learning_rate": 0.0016562947486248487, "loss": 2.3643, "step": 10939 }, { "epoch": 0.29, "learning_rate": 0.001656229074666335, "loss": 2.8576, "step": 10940 }, { "epoch": 0.29, "learning_rate": 0.0016561633957363471, "loss": 2.7781, "step": 10941 }, { "epoch": 0.29, "learning_rate": 0.0016560977118353826, "loss": 2.7612, "step": 10942 }, { "epoch": 0.29, "learning_rate": 0.001656032022963939, "loss": 2.3604, "step": 10943 }, { "epoch": 0.29, "learning_rate": 0.0016559663291225144, "loss": 2.4773, "step": 10944 }, { "epoch": 0.29, "learning_rate": 0.001655900630311606, "loss": 2.2139, "step": 10945 }, { "epoch": 0.29, "learning_rate": 0.001655834926531712, "loss": 2.4495, "step": 10946 }, { "epoch": 0.29, "learning_rate": 0.0016557692177833292, "loss": 2.7314, "step": 10947 }, { "epoch": 0.29, "learning_rate": 0.0016557035040669565, "loss": 2.7366, "step": 10948 }, { "epoch": 0.29, "learning_rate": 0.001655637785383091, "loss": 2.5539, "step": 10949 }, { "epoch": 0.29, "learning_rate": 0.0016555720617322312, "loss": 2.653, "step": 10950 }, { "epoch": 0.29, "learning_rate": 0.0016555063331148746, "loss": 2.677, "step": 10951 }, { "epoch": 0.29, "learning_rate": 0.0016554405995315193, "loss": 2.9229, "step": 10952 }, { "epoch": 0.29, "learning_rate": 0.0016553748609826628, "loss": 2.4576, "step": 10953 }, { "epoch": 0.29, "learning_rate": 0.001655309117468804, "loss": 2.3124, "step": 10954 }, { "epoch": 0.29, "learning_rate": 0.00165524336899044, "loss": 2.5283, "step": 10955 }, { "epoch": 0.29, "learning_rate": 0.0016551776155480696, "loss": 2.7002, "step": 10956 }, { "epoch": 0.29, "learning_rate": 0.001655111857142191, "loss": 2.8362, "step": 10957 }, { "epoch": 0.29, "learning_rate": 0.0016550460937733017, "loss": 2.654, "step": 10958 }, { "epoch": 0.29, "learning_rate": 0.0016549803254419003, "loss": 2.938, "step": 10959 }, { "epoch": 0.29, "learning_rate": 0.001654914552148485, "loss": 2.1694, "step": 10960 }, { "epoch": 0.29, "learning_rate": 0.0016548487738935545, "loss": 2.4701, "step": 10961 }, { "epoch": 0.29, "learning_rate": 0.0016547829906776066, "loss": 2.1934, "step": 10962 }, { "epoch": 0.29, "learning_rate": 0.00165471720250114, "loss": 2.6062, "step": 10963 }, { "epoch": 0.29, "learning_rate": 0.0016546514093646527, "loss": 2.5114, "step": 10964 }, { "epoch": 0.29, "learning_rate": 0.0016545856112686432, "loss": 2.3831, "step": 10965 }, { "epoch": 0.29, "learning_rate": 0.0016545198082136105, "loss": 2.719, "step": 10966 }, { "epoch": 0.29, "learning_rate": 0.0016544540002000525, "loss": 2.3732, "step": 10967 }, { "epoch": 0.29, "learning_rate": 0.0016543881872284683, "loss": 2.9247, "step": 10968 }, { "epoch": 0.29, "learning_rate": 0.001654322369299356, "loss": 2.3964, "step": 10969 }, { "epoch": 0.29, "learning_rate": 0.0016542565464132144, "loss": 2.4506, "step": 10970 }, { "epoch": 0.29, "learning_rate": 0.001654190718570542, "loss": 2.3114, "step": 10971 }, { "epoch": 0.29, "learning_rate": 0.0016541248857718381, "loss": 2.5956, "step": 10972 }, { "epoch": 0.29, "learning_rate": 0.0016540590480176008, "loss": 2.4376, "step": 10973 }, { "epoch": 0.29, "learning_rate": 0.0016539932053083288, "loss": 3.1353, "step": 10974 }, { "epoch": 0.29, "learning_rate": 0.0016539273576445216, "loss": 2.2895, "step": 10975 }, { "epoch": 0.29, "learning_rate": 0.0016538615050266773, "loss": 2.9083, "step": 10976 }, { "epoch": 0.29, "learning_rate": 0.0016537956474552953, "loss": 2.7532, "step": 10977 }, { "epoch": 0.3, "learning_rate": 0.0016537297849308743, "loss": 2.4382, "step": 10978 }, { "epoch": 0.3, "learning_rate": 0.0016536639174539137, "loss": 2.5872, "step": 10979 }, { "epoch": 0.3, "learning_rate": 0.001653598045024912, "loss": 2.481, "step": 10980 }, { "epoch": 0.3, "learning_rate": 0.0016535321676443679, "loss": 2.3344, "step": 10981 }, { "epoch": 0.3, "learning_rate": 0.0016534662853127814, "loss": 2.5015, "step": 10982 }, { "epoch": 0.3, "learning_rate": 0.0016534003980306512, "loss": 2.5714, "step": 10983 }, { "epoch": 0.3, "learning_rate": 0.001653334505798476, "loss": 2.1755, "step": 10984 }, { "epoch": 0.3, "learning_rate": 0.0016532686086167556, "loss": 2.4764, "step": 10985 }, { "epoch": 0.3, "learning_rate": 0.001653202706485989, "loss": 2.5207, "step": 10986 }, { "epoch": 0.3, "learning_rate": 0.0016531367994066755, "loss": 2.351, "step": 10987 }, { "epoch": 0.3, "learning_rate": 0.0016530708873793143, "loss": 2.4833, "step": 10988 }, { "epoch": 0.3, "learning_rate": 0.001653004970404405, "loss": 2.7471, "step": 10989 }, { "epoch": 0.3, "learning_rate": 0.0016529390484824465, "loss": 2.4131, "step": 10990 }, { "epoch": 0.3, "learning_rate": 0.0016528731216139388, "loss": 2.8349, "step": 10991 }, { "epoch": 0.3, "learning_rate": 0.001652807189799381, "loss": 2.4093, "step": 10992 }, { "epoch": 0.3, "learning_rate": 0.0016527412530392724, "loss": 2.1521, "step": 10993 }, { "epoch": 0.3, "learning_rate": 0.0016526753113341132, "loss": 2.5289, "step": 10994 }, { "epoch": 0.3, "learning_rate": 0.001652609364684402, "loss": 3.086, "step": 10995 }, { "epoch": 0.3, "learning_rate": 0.0016525434130906392, "loss": 2.7943, "step": 10996 }, { "epoch": 0.3, "learning_rate": 0.0016524774565533243, "loss": 2.5386, "step": 10997 }, { "epoch": 0.3, "learning_rate": 0.0016524114950729567, "loss": 2.5513, "step": 10998 }, { "epoch": 0.3, "learning_rate": 0.0016523455286500362, "loss": 2.8775, "step": 10999 }, { "epoch": 0.3, "learning_rate": 0.0016522795572850627, "loss": 3.0918, "step": 11000 }, { "epoch": 0.3, "learning_rate": 0.0016522135809785357, "loss": 2.7048, "step": 11001 }, { "epoch": 0.3, "learning_rate": 0.0016521475997309555, "loss": 2.5066, "step": 11002 }, { "epoch": 0.3, "learning_rate": 0.0016520816135428215, "loss": 2.3227, "step": 11003 }, { "epoch": 0.3, "learning_rate": 0.0016520156224146339, "loss": 2.377, "step": 11004 }, { "epoch": 0.3, "learning_rate": 0.0016519496263468923, "loss": 2.6249, "step": 11005 }, { "epoch": 0.3, "learning_rate": 0.001651883625340097, "loss": 2.5808, "step": 11006 }, { "epoch": 0.3, "learning_rate": 0.0016518176193947478, "loss": 2.6238, "step": 11007 }, { "epoch": 0.3, "learning_rate": 0.0016517516085113452, "loss": 2.3464, "step": 11008 }, { "epoch": 0.3, "learning_rate": 0.001651685592690389, "loss": 2.7388, "step": 11009 }, { "epoch": 0.3, "learning_rate": 0.0016516195719323786, "loss": 2.7181, "step": 11010 }, { "epoch": 0.3, "learning_rate": 0.0016515535462378152, "loss": 2.5761, "step": 11011 }, { "epoch": 0.3, "learning_rate": 0.0016514875156071987, "loss": 3.1104, "step": 11012 }, { "epoch": 0.3, "learning_rate": 0.0016514214800410292, "loss": 2.1539, "step": 11013 }, { "epoch": 0.3, "learning_rate": 0.0016513554395398069, "loss": 2.698, "step": 11014 }, { "epoch": 0.3, "learning_rate": 0.0016512893941040324, "loss": 2.6107, "step": 11015 }, { "epoch": 0.3, "learning_rate": 0.0016512233437342057, "loss": 2.6225, "step": 11016 }, { "epoch": 0.3, "learning_rate": 0.0016511572884308275, "loss": 2.4165, "step": 11017 }, { "epoch": 0.3, "learning_rate": 0.0016510912281943982, "loss": 2.4986, "step": 11018 }, { "epoch": 0.3, "learning_rate": 0.0016510251630254178, "loss": 2.4605, "step": 11019 }, { "epoch": 0.3, "learning_rate": 0.0016509590929243876, "loss": 2.6427, "step": 11020 }, { "epoch": 0.3, "learning_rate": 0.0016508930178918077, "loss": 2.8683, "step": 11021 }, { "epoch": 0.3, "learning_rate": 0.0016508269379281783, "loss": 2.4546, "step": 11022 }, { "epoch": 0.3, "learning_rate": 0.0016507608530340005, "loss": 2.1496, "step": 11023 }, { "epoch": 0.3, "learning_rate": 0.0016506947632097748, "loss": 2.5933, "step": 11024 }, { "epoch": 0.3, "learning_rate": 0.0016506286684560018, "loss": 2.5669, "step": 11025 }, { "epoch": 0.3, "learning_rate": 0.0016505625687731826, "loss": 2.5596, "step": 11026 }, { "epoch": 0.3, "learning_rate": 0.001650496464161818, "loss": 2.4812, "step": 11027 }, { "epoch": 0.3, "learning_rate": 0.001650430354622408, "loss": 2.7891, "step": 11028 }, { "epoch": 0.3, "learning_rate": 0.001650364240155454, "loss": 2.6499, "step": 11029 }, { "epoch": 0.3, "learning_rate": 0.0016502981207614567, "loss": 2.4536, "step": 11030 }, { "epoch": 0.3, "learning_rate": 0.0016502319964409172, "loss": 2.7041, "step": 11031 }, { "epoch": 0.3, "learning_rate": 0.0016501658671943362, "loss": 2.8369, "step": 11032 }, { "epoch": 0.3, "learning_rate": 0.001650099733022215, "loss": 2.0733, "step": 11033 }, { "epoch": 0.3, "learning_rate": 0.0016500335939250545, "loss": 2.6684, "step": 11034 }, { "epoch": 0.3, "learning_rate": 0.0016499674499033557, "loss": 2.6621, "step": 11035 }, { "epoch": 0.3, "learning_rate": 0.0016499013009576196, "loss": 2.7914, "step": 11036 }, { "epoch": 0.3, "learning_rate": 0.0016498351470883472, "loss": 2.2289, "step": 11037 }, { "epoch": 0.3, "learning_rate": 0.0016497689882960405, "loss": 2.4593, "step": 11038 }, { "epoch": 0.3, "learning_rate": 0.0016497028245811996, "loss": 2.4823, "step": 11039 }, { "epoch": 0.3, "learning_rate": 0.0016496366559443265, "loss": 2.6217, "step": 11040 }, { "epoch": 0.3, "learning_rate": 0.0016495704823859222, "loss": 2.5122, "step": 11041 }, { "epoch": 0.3, "learning_rate": 0.0016495043039064879, "loss": 2.7445, "step": 11042 }, { "epoch": 0.3, "learning_rate": 0.0016494381205065251, "loss": 2.7774, "step": 11043 }, { "epoch": 0.3, "learning_rate": 0.0016493719321865354, "loss": 2.4508, "step": 11044 }, { "epoch": 0.3, "learning_rate": 0.0016493057389470201, "loss": 2.5912, "step": 11045 }, { "epoch": 0.3, "learning_rate": 0.0016492395407884807, "loss": 2.6075, "step": 11046 }, { "epoch": 0.3, "learning_rate": 0.0016491733377114184, "loss": 2.0927, "step": 11047 }, { "epoch": 0.3, "learning_rate": 0.0016491071297163348, "loss": 2.6952, "step": 11048 }, { "epoch": 0.3, "learning_rate": 0.001649040916803732, "loss": 2.506, "step": 11049 }, { "epoch": 0.3, "learning_rate": 0.0016489746989741111, "loss": 2.4117, "step": 11050 }, { "epoch": 0.3, "learning_rate": 0.0016489084762279737, "loss": 3.1084, "step": 11051 }, { "epoch": 0.3, "learning_rate": 0.001648842248565822, "loss": 2.891, "step": 11052 }, { "epoch": 0.3, "learning_rate": 0.001648776015988157, "loss": 2.6288, "step": 11053 }, { "epoch": 0.3, "learning_rate": 0.0016487097784954811, "loss": 2.6969, "step": 11054 }, { "epoch": 0.3, "learning_rate": 0.0016486435360882964, "loss": 2.582, "step": 11055 }, { "epoch": 0.3, "learning_rate": 0.0016485772887671036, "loss": 2.9408, "step": 11056 }, { "epoch": 0.3, "learning_rate": 0.0016485110365324054, "loss": 3.0282, "step": 11057 }, { "epoch": 0.3, "learning_rate": 0.0016484447793847035, "loss": 2.6808, "step": 11058 }, { "epoch": 0.3, "learning_rate": 0.0016483785173245001, "loss": 3.152, "step": 11059 }, { "epoch": 0.3, "learning_rate": 0.0016483122503522967, "loss": 2.3761, "step": 11060 }, { "epoch": 0.3, "learning_rate": 0.0016482459784685956, "loss": 2.5072, "step": 11061 }, { "epoch": 0.3, "learning_rate": 0.0016481797016738994, "loss": 2.4989, "step": 11062 }, { "epoch": 0.3, "learning_rate": 0.0016481134199687092, "loss": 2.7459, "step": 11063 }, { "epoch": 0.3, "learning_rate": 0.0016480471333535274, "loss": 2.3812, "step": 11064 }, { "epoch": 0.3, "learning_rate": 0.0016479808418288567, "loss": 2.3604, "step": 11065 }, { "epoch": 0.3, "learning_rate": 0.001647914545395199, "loss": 2.6369, "step": 11066 }, { "epoch": 0.3, "learning_rate": 0.0016478482440530561, "loss": 2.5954, "step": 11067 }, { "epoch": 0.3, "learning_rate": 0.001647781937802931, "loss": 2.3671, "step": 11068 }, { "epoch": 0.3, "learning_rate": 0.0016477156266453262, "loss": 2.9462, "step": 11069 }, { "epoch": 0.3, "learning_rate": 0.0016476493105807434, "loss": 3.105, "step": 11070 }, { "epoch": 0.3, "learning_rate": 0.0016475829896096849, "loss": 2.4879, "step": 11071 }, { "epoch": 0.3, "learning_rate": 0.0016475166637326536, "loss": 2.5136, "step": 11072 }, { "epoch": 0.3, "learning_rate": 0.0016474503329501516, "loss": 2.6116, "step": 11073 }, { "epoch": 0.3, "learning_rate": 0.0016473839972626818, "loss": 2.9535, "step": 11074 }, { "epoch": 0.3, "learning_rate": 0.0016473176566707468, "loss": 2.2694, "step": 11075 }, { "epoch": 0.3, "learning_rate": 0.0016472513111748489, "loss": 2.6074, "step": 11076 }, { "epoch": 0.3, "learning_rate": 0.0016471849607754905, "loss": 2.2763, "step": 11077 }, { "epoch": 0.3, "learning_rate": 0.0016471186054731748, "loss": 2.9134, "step": 11078 }, { "epoch": 0.3, "learning_rate": 0.0016470522452684043, "loss": 2.6112, "step": 11079 }, { "epoch": 0.3, "learning_rate": 0.0016469858801616813, "loss": 3.1237, "step": 11080 }, { "epoch": 0.3, "learning_rate": 0.0016469195101535092, "loss": 2.8721, "step": 11081 }, { "epoch": 0.3, "learning_rate": 0.0016468531352443905, "loss": 2.5695, "step": 11082 }, { "epoch": 0.3, "learning_rate": 0.001646786755434828, "loss": 2.7188, "step": 11083 }, { "epoch": 0.3, "learning_rate": 0.001646720370725325, "loss": 2.9748, "step": 11084 }, { "epoch": 0.3, "learning_rate": 0.001646653981116384, "loss": 2.3258, "step": 11085 }, { "epoch": 0.3, "learning_rate": 0.0016465875866085078, "loss": 2.3056, "step": 11086 }, { "epoch": 0.3, "learning_rate": 0.0016465211872021999, "loss": 2.2357, "step": 11087 }, { "epoch": 0.3, "learning_rate": 0.0016464547828979627, "loss": 2.6137, "step": 11088 }, { "epoch": 0.3, "learning_rate": 0.0016463883736963002, "loss": 2.7642, "step": 11089 }, { "epoch": 0.3, "learning_rate": 0.0016463219595977145, "loss": 3.0375, "step": 11090 }, { "epoch": 0.3, "learning_rate": 0.0016462555406027094, "loss": 2.6561, "step": 11091 }, { "epoch": 0.3, "learning_rate": 0.0016461891167117877, "loss": 2.7319, "step": 11092 }, { "epoch": 0.3, "learning_rate": 0.0016461226879254528, "loss": 2.0803, "step": 11093 }, { "epoch": 0.3, "learning_rate": 0.001646056254244208, "loss": 2.8204, "step": 11094 }, { "epoch": 0.3, "learning_rate": 0.0016459898156685564, "loss": 2.3645, "step": 11095 }, { "epoch": 0.3, "learning_rate": 0.0016459233721990017, "loss": 2.7666, "step": 11096 }, { "epoch": 0.3, "learning_rate": 0.001645856923836047, "loss": 2.5137, "step": 11097 }, { "epoch": 0.3, "learning_rate": 0.0016457904705801955, "loss": 2.1091, "step": 11098 }, { "epoch": 0.3, "learning_rate": 0.0016457240124319508, "loss": 2.4415, "step": 11099 }, { "epoch": 0.3, "learning_rate": 0.0016456575493918168, "loss": 2.8178, "step": 11100 }, { "epoch": 0.3, "learning_rate": 0.0016455910814602963, "loss": 2.4701, "step": 11101 }, { "epoch": 0.3, "learning_rate": 0.0016455246086378935, "loss": 2.9037, "step": 11102 }, { "epoch": 0.3, "learning_rate": 0.0016454581309251113, "loss": 2.4675, "step": 11103 }, { "epoch": 0.3, "learning_rate": 0.0016453916483224538, "loss": 2.8382, "step": 11104 }, { "epoch": 0.3, "learning_rate": 0.0016453251608304247, "loss": 2.7611, "step": 11105 }, { "epoch": 0.3, "learning_rate": 0.0016452586684495274, "loss": 2.3961, "step": 11106 }, { "epoch": 0.3, "learning_rate": 0.0016451921711802657, "loss": 2.4093, "step": 11107 }, { "epoch": 0.3, "learning_rate": 0.0016451256690231438, "loss": 2.5601, "step": 11108 }, { "epoch": 0.3, "learning_rate": 0.001645059161978665, "loss": 2.4946, "step": 11109 }, { "epoch": 0.3, "learning_rate": 0.0016449926500473335, "loss": 2.3581, "step": 11110 }, { "epoch": 0.3, "learning_rate": 0.0016449261332296525, "loss": 2.5721, "step": 11111 }, { "epoch": 0.3, "learning_rate": 0.0016448596115261269, "loss": 2.5464, "step": 11112 }, { "epoch": 0.3, "learning_rate": 0.00164479308493726, "loss": 2.5159, "step": 11113 }, { "epoch": 0.3, "learning_rate": 0.001644726553463556, "loss": 2.6174, "step": 11114 }, { "epoch": 0.3, "learning_rate": 0.0016446600171055189, "loss": 2.4577, "step": 11115 }, { "epoch": 0.3, "learning_rate": 0.0016445934758636527, "loss": 2.7196, "step": 11116 }, { "epoch": 0.3, "learning_rate": 0.0016445269297384617, "loss": 2.4794, "step": 11117 }, { "epoch": 0.3, "learning_rate": 0.0016444603787304497, "loss": 2.6097, "step": 11118 }, { "epoch": 0.3, "learning_rate": 0.0016443938228401212, "loss": 2.635, "step": 11119 }, { "epoch": 0.3, "learning_rate": 0.0016443272620679803, "loss": 2.7208, "step": 11120 }, { "epoch": 0.3, "learning_rate": 0.0016442606964145315, "loss": 2.5067, "step": 11121 }, { "epoch": 0.3, "learning_rate": 0.0016441941258802783, "loss": 2.2847, "step": 11122 }, { "epoch": 0.3, "learning_rate": 0.001644127550465726, "loss": 2.2566, "step": 11123 }, { "epoch": 0.3, "learning_rate": 0.0016440609701713785, "loss": 2.9373, "step": 11124 }, { "epoch": 0.3, "learning_rate": 0.00164399438499774, "loss": 2.367, "step": 11125 }, { "epoch": 0.3, "learning_rate": 0.0016439277949453156, "loss": 2.2927, "step": 11126 }, { "epoch": 0.3, "learning_rate": 0.0016438612000146088, "loss": 2.5274, "step": 11127 }, { "epoch": 0.3, "learning_rate": 0.001643794600206125, "loss": 2.3442, "step": 11128 }, { "epoch": 0.3, "learning_rate": 0.0016437279955203686, "loss": 2.4215, "step": 11129 }, { "epoch": 0.3, "learning_rate": 0.0016436613859578436, "loss": 2.9664, "step": 11130 }, { "epoch": 0.3, "learning_rate": 0.0016435947715190552, "loss": 2.5347, "step": 11131 }, { "epoch": 0.3, "learning_rate": 0.0016435281522045077, "loss": 2.4704, "step": 11132 }, { "epoch": 0.3, "learning_rate": 0.001643461528014706, "loss": 2.8496, "step": 11133 }, { "epoch": 0.3, "learning_rate": 0.001643394898950155, "loss": 2.6712, "step": 11134 }, { "epoch": 0.3, "learning_rate": 0.001643328265011359, "loss": 2.4014, "step": 11135 }, { "epoch": 0.3, "learning_rate": 0.0016432616261988233, "loss": 2.3892, "step": 11136 }, { "epoch": 0.3, "learning_rate": 0.0016431949825130526, "loss": 2.6095, "step": 11137 }, { "epoch": 0.3, "learning_rate": 0.0016431283339545515, "loss": 2.5098, "step": 11138 }, { "epoch": 0.3, "learning_rate": 0.0016430616805238251, "loss": 2.4667, "step": 11139 }, { "epoch": 0.3, "learning_rate": 0.0016429950222213788, "loss": 2.4004, "step": 11140 }, { "epoch": 0.3, "learning_rate": 0.0016429283590477168, "loss": 2.4944, "step": 11141 }, { "epoch": 0.3, "learning_rate": 0.0016428616910033444, "loss": 3.0168, "step": 11142 }, { "epoch": 0.3, "learning_rate": 0.001642795018088767, "loss": 2.6895, "step": 11143 }, { "epoch": 0.3, "learning_rate": 0.0016427283403044894, "loss": 2.2677, "step": 11144 }, { "epoch": 0.3, "learning_rate": 0.0016426616576510169, "loss": 2.8502, "step": 11145 }, { "epoch": 0.3, "learning_rate": 0.0016425949701288545, "loss": 2.7021, "step": 11146 }, { "epoch": 0.3, "learning_rate": 0.0016425282777385074, "loss": 2.2919, "step": 11147 }, { "epoch": 0.3, "learning_rate": 0.001642461580480481, "loss": 2.3635, "step": 11148 }, { "epoch": 0.3, "learning_rate": 0.0016423948783552804, "loss": 2.7529, "step": 11149 }, { "epoch": 0.3, "learning_rate": 0.0016423281713634113, "loss": 2.8033, "step": 11150 }, { "epoch": 0.3, "learning_rate": 0.0016422614595053787, "loss": 2.7354, "step": 11151 }, { "epoch": 0.3, "learning_rate": 0.0016421947427816882, "loss": 2.4696, "step": 11152 }, { "epoch": 0.3, "learning_rate": 0.0016421280211928449, "loss": 2.3855, "step": 11153 }, { "epoch": 0.3, "learning_rate": 0.0016420612947393547, "loss": 2.9811, "step": 11154 }, { "epoch": 0.3, "learning_rate": 0.0016419945634217228, "loss": 2.1989, "step": 11155 }, { "epoch": 0.3, "learning_rate": 0.0016419278272404552, "loss": 2.3086, "step": 11156 }, { "epoch": 0.3, "learning_rate": 0.0016418610861960567, "loss": 2.7147, "step": 11157 }, { "epoch": 0.3, "learning_rate": 0.0016417943402890333, "loss": 2.8115, "step": 11158 }, { "epoch": 0.3, "learning_rate": 0.0016417275895198912, "loss": 2.923, "step": 11159 }, { "epoch": 0.3, "learning_rate": 0.0016416608338891356, "loss": 2.414, "step": 11160 }, { "epoch": 0.3, "learning_rate": 0.001641594073397272, "loss": 2.7836, "step": 11161 }, { "epoch": 0.3, "learning_rate": 0.001641527308044806, "loss": 2.4368, "step": 11162 }, { "epoch": 0.3, "learning_rate": 0.0016414605378322444, "loss": 2.8768, "step": 11163 }, { "epoch": 0.3, "learning_rate": 0.0016413937627600924, "loss": 2.2096, "step": 11164 }, { "epoch": 0.3, "learning_rate": 0.0016413269828288557, "loss": 2.5054, "step": 11165 }, { "epoch": 0.3, "learning_rate": 0.0016412601980390407, "loss": 2.2422, "step": 11166 }, { "epoch": 0.3, "learning_rate": 0.001641193408391153, "loss": 2.4955, "step": 11167 }, { "epoch": 0.3, "learning_rate": 0.0016411266138856987, "loss": 2.8095, "step": 11168 }, { "epoch": 0.3, "learning_rate": 0.0016410598145231833, "loss": 2.4186, "step": 11169 }, { "epoch": 0.3, "learning_rate": 0.001640993010304114, "loss": 2.618, "step": 11170 }, { "epoch": 0.3, "learning_rate": 0.0016409262012289962, "loss": 2.3441, "step": 11171 }, { "epoch": 0.3, "learning_rate": 0.0016408593872983357, "loss": 2.4758, "step": 11172 }, { "epoch": 0.3, "learning_rate": 0.001640792568512639, "loss": 2.4651, "step": 11173 }, { "epoch": 0.3, "learning_rate": 0.0016407257448724129, "loss": 2.4063, "step": 11174 }, { "epoch": 0.3, "learning_rate": 0.001640658916378163, "loss": 3.1288, "step": 11175 }, { "epoch": 0.3, "learning_rate": 0.0016405920830303952, "loss": 2.6015, "step": 11176 }, { "epoch": 0.3, "learning_rate": 0.0016405252448296165, "loss": 2.697, "step": 11177 }, { "epoch": 0.3, "learning_rate": 0.0016404584017763334, "loss": 2.2229, "step": 11178 }, { "epoch": 0.3, "learning_rate": 0.0016403915538710518, "loss": 2.6928, "step": 11179 }, { "epoch": 0.3, "learning_rate": 0.001640324701114278, "loss": 2.6381, "step": 11180 }, { "epoch": 0.3, "learning_rate": 0.001640257843506519, "loss": 3.1476, "step": 11181 }, { "epoch": 0.3, "learning_rate": 0.001640190981048281, "loss": 2.1515, "step": 11182 }, { "epoch": 0.3, "learning_rate": 0.0016401241137400707, "loss": 3.0432, "step": 11183 }, { "epoch": 0.3, "learning_rate": 0.0016400572415823944, "loss": 2.534, "step": 11184 }, { "epoch": 0.3, "learning_rate": 0.0016399903645757587, "loss": 2.3969, "step": 11185 }, { "epoch": 0.3, "learning_rate": 0.0016399234827206707, "loss": 2.3773, "step": 11186 }, { "epoch": 0.3, "learning_rate": 0.0016398565960176368, "loss": 2.4454, "step": 11187 }, { "epoch": 0.3, "learning_rate": 0.0016397897044671636, "loss": 2.0339, "step": 11188 }, { "epoch": 0.3, "learning_rate": 0.0016397228080697582, "loss": 2.3456, "step": 11189 }, { "epoch": 0.3, "learning_rate": 0.001639655906825927, "loss": 2.5629, "step": 11190 }, { "epoch": 0.3, "learning_rate": 0.0016395890007361769, "loss": 2.5092, "step": 11191 }, { "epoch": 0.3, "learning_rate": 0.001639522089801015, "loss": 2.8148, "step": 11192 }, { "epoch": 0.3, "learning_rate": 0.001639455174020948, "loss": 2.8296, "step": 11193 }, { "epoch": 0.3, "learning_rate": 0.0016393882533964831, "loss": 2.4396, "step": 11194 }, { "epoch": 0.3, "learning_rate": 0.0016393213279281272, "loss": 2.65, "step": 11195 }, { "epoch": 0.3, "learning_rate": 0.001639254397616387, "loss": 2.4926, "step": 11196 }, { "epoch": 0.3, "learning_rate": 0.0016391874624617695, "loss": 2.419, "step": 11197 }, { "epoch": 0.3, "learning_rate": 0.0016391205224647826, "loss": 2.4371, "step": 11198 }, { "epoch": 0.3, "learning_rate": 0.0016390535776259325, "loss": 2.2566, "step": 11199 }, { "epoch": 0.3, "learning_rate": 0.0016389866279457271, "loss": 2.7534, "step": 11200 }, { "epoch": 0.3, "learning_rate": 0.001638919673424673, "loss": 2.9595, "step": 11201 }, { "epoch": 0.3, "learning_rate": 0.0016388527140632778, "loss": 2.5802, "step": 11202 }, { "epoch": 0.3, "learning_rate": 0.0016387857498620483, "loss": 2.7782, "step": 11203 }, { "epoch": 0.3, "learning_rate": 0.0016387187808214927, "loss": 2.7723, "step": 11204 }, { "epoch": 0.3, "learning_rate": 0.0016386518069421174, "loss": 2.4913, "step": 11205 }, { "epoch": 0.3, "learning_rate": 0.0016385848282244304, "loss": 2.6535, "step": 11206 }, { "epoch": 0.3, "learning_rate": 0.001638517844668939, "loss": 2.553, "step": 11207 }, { "epoch": 0.3, "learning_rate": 0.0016384508562761503, "loss": 2.4616, "step": 11208 }, { "epoch": 0.3, "learning_rate": 0.0016383838630465721, "loss": 3.0596, "step": 11209 }, { "epoch": 0.3, "learning_rate": 0.0016383168649807122, "loss": 2.9953, "step": 11210 }, { "epoch": 0.3, "learning_rate": 0.0016382498620790777, "loss": 2.8415, "step": 11211 }, { "epoch": 0.3, "learning_rate": 0.001638182854342176, "loss": 2.7792, "step": 11212 }, { "epoch": 0.3, "learning_rate": 0.0016381158417705154, "loss": 2.7066, "step": 11213 }, { "epoch": 0.3, "learning_rate": 0.0016380488243646033, "loss": 2.2593, "step": 11214 }, { "epoch": 0.3, "learning_rate": 0.0016379818021249474, "loss": 2.7699, "step": 11215 }, { "epoch": 0.3, "learning_rate": 0.0016379147750520552, "loss": 2.6587, "step": 11216 }, { "epoch": 0.3, "learning_rate": 0.001637847743146435, "loss": 2.4845, "step": 11217 }, { "epoch": 0.3, "learning_rate": 0.001637780706408594, "loss": 2.4864, "step": 11218 }, { "epoch": 0.3, "learning_rate": 0.0016377136648390404, "loss": 2.6349, "step": 11219 }, { "epoch": 0.3, "learning_rate": 0.0016376466184382823, "loss": 2.5483, "step": 11220 }, { "epoch": 0.3, "learning_rate": 0.0016375795672068274, "loss": 2.6927, "step": 11221 }, { "epoch": 0.3, "learning_rate": 0.001637512511145184, "loss": 2.7144, "step": 11222 }, { "epoch": 0.3, "learning_rate": 0.0016374454502538591, "loss": 2.9026, "step": 11223 }, { "epoch": 0.3, "learning_rate": 0.001637378384533362, "loss": 2.4574, "step": 11224 }, { "epoch": 0.3, "learning_rate": 0.0016373113139842, "loss": 2.547, "step": 11225 }, { "epoch": 0.3, "learning_rate": 0.0016372442386068814, "loss": 2.5725, "step": 11226 }, { "epoch": 0.3, "learning_rate": 0.0016371771584019145, "loss": 2.1711, "step": 11227 }, { "epoch": 0.3, "learning_rate": 0.001637110073369807, "loss": 2.4671, "step": 11228 }, { "epoch": 0.3, "learning_rate": 0.0016370429835110677, "loss": 2.5405, "step": 11229 }, { "epoch": 0.3, "learning_rate": 0.001636975888826205, "loss": 2.1459, "step": 11230 }, { "epoch": 0.3, "learning_rate": 0.0016369087893157266, "loss": 2.8579, "step": 11231 }, { "epoch": 0.3, "learning_rate": 0.001636841684980141, "loss": 2.4372, "step": 11232 }, { "epoch": 0.3, "learning_rate": 0.0016367745758199565, "loss": 2.7119, "step": 11233 }, { "epoch": 0.3, "learning_rate": 0.0016367074618356822, "loss": 2.6747, "step": 11234 }, { "epoch": 0.3, "learning_rate": 0.0016366403430278255, "loss": 2.3627, "step": 11235 }, { "epoch": 0.3, "learning_rate": 0.0016365732193968955, "loss": 2.8993, "step": 11236 }, { "epoch": 0.3, "learning_rate": 0.0016365060909434006, "loss": 2.77, "step": 11237 }, { "epoch": 0.3, "learning_rate": 0.0016364389576678496, "loss": 2.7775, "step": 11238 }, { "epoch": 0.3, "learning_rate": 0.0016363718195707504, "loss": 2.4811, "step": 11239 }, { "epoch": 0.3, "learning_rate": 0.001636304676652612, "loss": 2.4978, "step": 11240 }, { "epoch": 0.3, "learning_rate": 0.0016362375289139437, "loss": 2.3163, "step": 11241 }, { "epoch": 0.3, "learning_rate": 0.0016361703763552533, "loss": 2.6191, "step": 11242 }, { "epoch": 0.3, "learning_rate": 0.0016361032189770497, "loss": 2.5301, "step": 11243 }, { "epoch": 0.3, "learning_rate": 0.0016360360567798423, "loss": 3.0276, "step": 11244 }, { "epoch": 0.3, "learning_rate": 0.0016359688897641393, "loss": 2.3808, "step": 11245 }, { "epoch": 0.3, "learning_rate": 0.0016359017179304494, "loss": 2.1248, "step": 11246 }, { "epoch": 0.3, "learning_rate": 0.0016358345412792819, "loss": 2.7114, "step": 11247 }, { "epoch": 0.3, "learning_rate": 0.0016357673598111457, "loss": 2.6297, "step": 11248 }, { "epoch": 0.3, "learning_rate": 0.0016357001735265498, "loss": 2.6129, "step": 11249 }, { "epoch": 0.3, "learning_rate": 0.001635632982426003, "loss": 2.4442, "step": 11250 }, { "epoch": 0.3, "learning_rate": 0.0016355657865100136, "loss": 2.6861, "step": 11251 }, { "epoch": 0.3, "learning_rate": 0.0016354985857790925, "loss": 2.4812, "step": 11252 }, { "epoch": 0.3, "learning_rate": 0.0016354313802337472, "loss": 2.4526, "step": 11253 }, { "epoch": 0.3, "learning_rate": 0.0016353641698744874, "loss": 2.366, "step": 11254 }, { "epoch": 0.3, "learning_rate": 0.0016352969547018224, "loss": 2.7265, "step": 11255 }, { "epoch": 0.3, "learning_rate": 0.0016352297347162611, "loss": 2.6608, "step": 11256 }, { "epoch": 0.3, "learning_rate": 0.0016351625099183128, "loss": 2.2334, "step": 11257 }, { "epoch": 0.3, "learning_rate": 0.0016350952803084872, "loss": 2.9797, "step": 11258 }, { "epoch": 0.3, "learning_rate": 0.0016350280458872928, "loss": 2.5112, "step": 11259 }, { "epoch": 0.3, "learning_rate": 0.00163496080665524, "loss": 2.6177, "step": 11260 }, { "epoch": 0.3, "learning_rate": 0.0016348935626128373, "loss": 2.5776, "step": 11261 }, { "epoch": 0.3, "learning_rate": 0.0016348263137605948, "loss": 2.674, "step": 11262 }, { "epoch": 0.3, "learning_rate": 0.0016347590600990212, "loss": 2.5101, "step": 11263 }, { "epoch": 0.3, "learning_rate": 0.0016346918016286267, "loss": 2.6702, "step": 11264 }, { "epoch": 0.3, "learning_rate": 0.0016346245383499207, "loss": 1.9974, "step": 11265 }, { "epoch": 0.3, "learning_rate": 0.0016345572702634126, "loss": 2.8875, "step": 11266 }, { "epoch": 0.3, "learning_rate": 0.0016344899973696116, "loss": 2.3033, "step": 11267 }, { "epoch": 0.3, "learning_rate": 0.0016344227196690285, "loss": 2.7391, "step": 11268 }, { "epoch": 0.3, "learning_rate": 0.001634355437162172, "loss": 2.5122, "step": 11269 }, { "epoch": 0.3, "learning_rate": 0.001634288149849552, "loss": 2.83, "step": 11270 }, { "epoch": 0.3, "learning_rate": 0.0016342208577316787, "loss": 2.444, "step": 11271 }, { "epoch": 0.3, "learning_rate": 0.0016341535608090613, "loss": 2.6489, "step": 11272 }, { "epoch": 0.3, "learning_rate": 0.0016340862590822098, "loss": 2.1543, "step": 11273 }, { "epoch": 0.3, "learning_rate": 0.0016340189525516347, "loss": 2.6527, "step": 11274 }, { "epoch": 0.3, "learning_rate": 0.0016339516412178447, "loss": 2.4217, "step": 11275 }, { "epoch": 0.3, "learning_rate": 0.0016338843250813509, "loss": 2.8921, "step": 11276 }, { "epoch": 0.3, "learning_rate": 0.0016338170041426626, "loss": 2.926, "step": 11277 }, { "epoch": 0.3, "learning_rate": 0.0016337496784022897, "loss": 2.6521, "step": 11278 }, { "epoch": 0.3, "learning_rate": 0.001633682347860743, "loss": 2.6083, "step": 11279 }, { "epoch": 0.3, "learning_rate": 0.001633615012518532, "loss": 2.893, "step": 11280 }, { "epoch": 0.3, "learning_rate": 0.0016335476723761668, "loss": 2.4406, "step": 11281 }, { "epoch": 0.3, "learning_rate": 0.0016334803274341576, "loss": 3.0592, "step": 11282 }, { "epoch": 0.3, "learning_rate": 0.0016334129776930152, "loss": 2.4242, "step": 11283 }, { "epoch": 0.3, "learning_rate": 0.0016333456231532489, "loss": 2.4858, "step": 11284 }, { "epoch": 0.3, "learning_rate": 0.0016332782638153697, "loss": 3.0449, "step": 11285 }, { "epoch": 0.3, "learning_rate": 0.0016332108996798872, "loss": 2.7623, "step": 11286 }, { "epoch": 0.3, "learning_rate": 0.0016331435307473123, "loss": 2.659, "step": 11287 }, { "epoch": 0.3, "learning_rate": 0.0016330761570181554, "loss": 2.9183, "step": 11288 }, { "epoch": 0.3, "learning_rate": 0.0016330087784929264, "loss": 2.6132, "step": 11289 }, { "epoch": 0.3, "learning_rate": 0.001632941395172136, "loss": 2.4377, "step": 11290 }, { "epoch": 0.3, "learning_rate": 0.0016328740070562953, "loss": 2.8383, "step": 11291 }, { "epoch": 0.3, "learning_rate": 0.001632806614145914, "loss": 2.7122, "step": 11292 }, { "epoch": 0.3, "learning_rate": 0.001632739216441503, "loss": 2.5783, "step": 11293 }, { "epoch": 0.3, "learning_rate": 0.0016326718139435723, "loss": 2.6811, "step": 11294 }, { "epoch": 0.3, "learning_rate": 0.0016326044066526336, "loss": 2.7008, "step": 11295 }, { "epoch": 0.3, "learning_rate": 0.0016325369945691967, "loss": 2.8279, "step": 11296 }, { "epoch": 0.3, "learning_rate": 0.0016324695776937727, "loss": 2.6334, "step": 11297 }, { "epoch": 0.3, "learning_rate": 0.0016324021560268724, "loss": 2.5603, "step": 11298 }, { "epoch": 0.3, "learning_rate": 0.0016323347295690064, "loss": 2.8788, "step": 11299 }, { "epoch": 0.3, "learning_rate": 0.0016322672983206856, "loss": 2.3023, "step": 11300 }, { "epoch": 0.3, "learning_rate": 0.0016321998622824206, "loss": 2.906, "step": 11301 }, { "epoch": 0.3, "learning_rate": 0.0016321324214547226, "loss": 2.6776, "step": 11302 }, { "epoch": 0.3, "learning_rate": 0.0016320649758381023, "loss": 2.583, "step": 11303 }, { "epoch": 0.3, "learning_rate": 0.0016319975254330708, "loss": 2.2128, "step": 11304 }, { "epoch": 0.3, "learning_rate": 0.0016319300702401392, "loss": 2.4409, "step": 11305 }, { "epoch": 0.3, "learning_rate": 0.001631862610259818, "loss": 2.7217, "step": 11306 }, { "epoch": 0.3, "learning_rate": 0.0016317951454926187, "loss": 2.6921, "step": 11307 }, { "epoch": 0.3, "learning_rate": 0.0016317276759390525, "loss": 2.86, "step": 11308 }, { "epoch": 0.3, "learning_rate": 0.0016316602015996305, "loss": 2.6885, "step": 11309 }, { "epoch": 0.3, "learning_rate": 0.0016315927224748634, "loss": 2.6209, "step": 11310 }, { "epoch": 0.3, "learning_rate": 0.001631525238565263, "loss": 3.0585, "step": 11311 }, { "epoch": 0.3, "learning_rate": 0.0016314577498713404, "loss": 2.8294, "step": 11312 }, { "epoch": 0.3, "learning_rate": 0.0016313902563936064, "loss": 2.322, "step": 11313 }, { "epoch": 0.3, "learning_rate": 0.0016313227581325727, "loss": 2.4578, "step": 11314 }, { "epoch": 0.3, "learning_rate": 0.001631255255088751, "loss": 2.4575, "step": 11315 }, { "epoch": 0.3, "learning_rate": 0.0016311877472626525, "loss": 2.8144, "step": 11316 }, { "epoch": 0.3, "learning_rate": 0.0016311202346547878, "loss": 2.6982, "step": 11317 }, { "epoch": 0.3, "learning_rate": 0.0016310527172656694, "loss": 2.194, "step": 11318 }, { "epoch": 0.3, "learning_rate": 0.0016309851950958086, "loss": 2.6005, "step": 11319 }, { "epoch": 0.3, "learning_rate": 0.0016309176681457164, "loss": 2.6516, "step": 11320 }, { "epoch": 0.3, "learning_rate": 0.001630850136415905, "loss": 2.322, "step": 11321 }, { "epoch": 0.3, "learning_rate": 0.0016307825999068858, "loss": 2.4677, "step": 11322 }, { "epoch": 0.3, "learning_rate": 0.0016307150586191703, "loss": 2.2405, "step": 11323 }, { "epoch": 0.3, "learning_rate": 0.0016306475125532703, "loss": 2.7766, "step": 11324 }, { "epoch": 0.3, "learning_rate": 0.0016305799617096972, "loss": 2.6795, "step": 11325 }, { "epoch": 0.3, "learning_rate": 0.0016305124060889636, "loss": 2.2646, "step": 11326 }, { "epoch": 0.3, "learning_rate": 0.0016304448456915803, "loss": 2.5993, "step": 11327 }, { "epoch": 0.3, "learning_rate": 0.0016303772805180596, "loss": 2.8924, "step": 11328 }, { "epoch": 0.3, "learning_rate": 0.0016303097105689135, "loss": 2.7385, "step": 11329 }, { "epoch": 0.3, "learning_rate": 0.0016302421358446537, "loss": 2.4787, "step": 11330 }, { "epoch": 0.3, "learning_rate": 0.0016301745563457924, "loss": 2.8806, "step": 11331 }, { "epoch": 0.3, "learning_rate": 0.001630106972072841, "loss": 2.2231, "step": 11332 }, { "epoch": 0.3, "learning_rate": 0.0016300393830263116, "loss": 2.2211, "step": 11333 }, { "epoch": 0.3, "learning_rate": 0.0016299717892067167, "loss": 2.5317, "step": 11334 }, { "epoch": 0.3, "learning_rate": 0.0016299041906145683, "loss": 2.6564, "step": 11335 }, { "epoch": 0.3, "learning_rate": 0.0016298365872503785, "loss": 2.4298, "step": 11336 }, { "epoch": 0.3, "learning_rate": 0.0016297689791146591, "loss": 2.9621, "step": 11337 }, { "epoch": 0.3, "learning_rate": 0.0016297013662079224, "loss": 2.2131, "step": 11338 }, { "epoch": 0.3, "learning_rate": 0.0016296337485306807, "loss": 2.196, "step": 11339 }, { "epoch": 0.3, "learning_rate": 0.0016295661260834465, "loss": 2.5282, "step": 11340 }, { "epoch": 0.3, "learning_rate": 0.0016294984988667318, "loss": 2.4575, "step": 11341 }, { "epoch": 0.3, "learning_rate": 0.001629430866881049, "loss": 2.8804, "step": 11342 }, { "epoch": 0.3, "learning_rate": 0.0016293632301269106, "loss": 2.2978, "step": 11343 }, { "epoch": 0.3, "learning_rate": 0.001629295588604829, "loss": 2.3798, "step": 11344 }, { "epoch": 0.3, "learning_rate": 0.001629227942315316, "loss": 2.6446, "step": 11345 }, { "epoch": 0.3, "learning_rate": 0.001629160291258885, "loss": 2.509, "step": 11346 }, { "epoch": 0.3, "learning_rate": 0.001629092635436048, "loss": 2.3668, "step": 11347 }, { "epoch": 0.3, "learning_rate": 0.0016290249748473179, "loss": 2.5118, "step": 11348 }, { "epoch": 0.3, "learning_rate": 0.0016289573094932066, "loss": 2.6481, "step": 11349 }, { "epoch": 0.31, "learning_rate": 0.0016288896393742275, "loss": 3.1162, "step": 11350 }, { "epoch": 0.31, "learning_rate": 0.0016288219644908929, "loss": 2.413, "step": 11351 }, { "epoch": 0.31, "learning_rate": 0.0016287542848437153, "loss": 2.6961, "step": 11352 }, { "epoch": 0.31, "learning_rate": 0.0016286866004332078, "loss": 2.7863, "step": 11353 }, { "epoch": 0.31, "learning_rate": 0.001628618911259883, "loss": 2.6091, "step": 11354 }, { "epoch": 0.31, "learning_rate": 0.001628551217324254, "loss": 2.577, "step": 11355 }, { "epoch": 0.31, "learning_rate": 0.001628483518626833, "loss": 2.6825, "step": 11356 }, { "epoch": 0.31, "learning_rate": 0.0016284158151681333, "loss": 2.2176, "step": 11357 }, { "epoch": 0.31, "learning_rate": 0.0016283481069486675, "loss": 2.7882, "step": 11358 }, { "epoch": 0.31, "learning_rate": 0.0016282803939689492, "loss": 2.8074, "step": 11359 }, { "epoch": 0.31, "learning_rate": 0.0016282126762294908, "loss": 2.5497, "step": 11360 }, { "epoch": 0.31, "learning_rate": 0.0016281449537308055, "loss": 2.562, "step": 11361 }, { "epoch": 0.31, "learning_rate": 0.0016280772264734066, "loss": 2.2345, "step": 11362 }, { "epoch": 0.31, "learning_rate": 0.0016280094944578067, "loss": 2.8546, "step": 11363 }, { "epoch": 0.31, "learning_rate": 0.0016279417576845188, "loss": 2.7033, "step": 11364 }, { "epoch": 0.31, "learning_rate": 0.0016278740161540567, "loss": 2.5307, "step": 11365 }, { "epoch": 0.31, "learning_rate": 0.0016278062698669334, "loss": 2.5545, "step": 11366 }, { "epoch": 0.31, "learning_rate": 0.0016277385188236619, "loss": 2.3067, "step": 11367 }, { "epoch": 0.31, "learning_rate": 0.0016276707630247557, "loss": 2.6332, "step": 11368 }, { "epoch": 0.31, "learning_rate": 0.0016276030024707279, "loss": 2.7704, "step": 11369 }, { "epoch": 0.31, "learning_rate": 0.001627535237162092, "loss": 2.1523, "step": 11370 }, { "epoch": 0.31, "learning_rate": 0.0016274674670993614, "loss": 2.3128, "step": 11371 }, { "epoch": 0.31, "learning_rate": 0.001627399692283049, "loss": 2.9812, "step": 11372 }, { "epoch": 0.31, "learning_rate": 0.0016273319127136695, "loss": 3.0632, "step": 11373 }, { "epoch": 0.31, "learning_rate": 0.0016272641283917354, "loss": 2.9452, "step": 11374 }, { "epoch": 0.31, "learning_rate": 0.0016271963393177603, "loss": 2.8242, "step": 11375 }, { "epoch": 0.31, "learning_rate": 0.0016271285454922575, "loss": 2.4689, "step": 11376 }, { "epoch": 0.31, "learning_rate": 0.0016270607469157413, "loss": 2.5665, "step": 11377 }, { "epoch": 0.31, "learning_rate": 0.001626992943588725, "loss": 2.8335, "step": 11378 }, { "epoch": 0.31, "learning_rate": 0.001626925135511722, "loss": 2.8428, "step": 11379 }, { "epoch": 0.31, "learning_rate": 0.0016268573226852464, "loss": 2.6752, "step": 11380 }, { "epoch": 0.31, "learning_rate": 0.0016267895051098118, "loss": 2.03, "step": 11381 }, { "epoch": 0.31, "learning_rate": 0.0016267216827859322, "loss": 2.4884, "step": 11382 }, { "epoch": 0.31, "learning_rate": 0.001626653855714121, "loss": 2.7536, "step": 11383 }, { "epoch": 0.31, "learning_rate": 0.0016265860238948919, "loss": 2.6572, "step": 11384 }, { "epoch": 0.31, "learning_rate": 0.0016265181873287595, "loss": 2.9776, "step": 11385 }, { "epoch": 0.31, "learning_rate": 0.0016264503460162371, "loss": 2.6373, "step": 11386 }, { "epoch": 0.31, "learning_rate": 0.0016263824999578392, "loss": 2.5547, "step": 11387 }, { "epoch": 0.31, "learning_rate": 0.0016263146491540792, "loss": 2.5409, "step": 11388 }, { "epoch": 0.31, "learning_rate": 0.0016262467936054715, "loss": 2.5983, "step": 11389 }, { "epoch": 0.31, "learning_rate": 0.0016261789333125302, "loss": 2.8686, "step": 11390 }, { "epoch": 0.31, "learning_rate": 0.0016261110682757687, "loss": 2.541, "step": 11391 }, { "epoch": 0.31, "learning_rate": 0.0016260431984957023, "loss": 2.5396, "step": 11392 }, { "epoch": 0.31, "learning_rate": 0.001625975323972844, "loss": 2.8116, "step": 11393 }, { "epoch": 0.31, "learning_rate": 0.001625907444707709, "loss": 2.4178, "step": 11394 }, { "epoch": 0.31, "learning_rate": 0.0016258395607008109, "loss": 2.5382, "step": 11395 }, { "epoch": 0.31, "learning_rate": 0.0016257716719526645, "loss": 2.7719, "step": 11396 }, { "epoch": 0.31, "learning_rate": 0.0016257037784637833, "loss": 3.0923, "step": 11397 }, { "epoch": 0.31, "learning_rate": 0.0016256358802346825, "loss": 2.4851, "step": 11398 }, { "epoch": 0.31, "learning_rate": 0.001625567977265876, "loss": 2.8522, "step": 11399 }, { "epoch": 0.31, "learning_rate": 0.0016255000695578783, "loss": 2.8135, "step": 11400 }, { "epoch": 0.31, "learning_rate": 0.001625432157111204, "loss": 2.3842, "step": 11401 }, { "epoch": 0.31, "learning_rate": 0.0016253642399263674, "loss": 2.3686, "step": 11402 }, { "epoch": 0.31, "learning_rate": 0.001625296318003883, "loss": 2.6613, "step": 11403 }, { "epoch": 0.31, "learning_rate": 0.0016252283913442658, "loss": 2.5503, "step": 11404 }, { "epoch": 0.31, "learning_rate": 0.00162516045994803, "loss": 2.4529, "step": 11405 }, { "epoch": 0.31, "learning_rate": 0.0016250925238156903, "loss": 2.4232, "step": 11406 }, { "epoch": 0.31, "learning_rate": 0.0016250245829477615, "loss": 2.6498, "step": 11407 }, { "epoch": 0.31, "learning_rate": 0.001624956637344758, "loss": 3.0719, "step": 11408 }, { "epoch": 0.31, "learning_rate": 0.0016248886870071945, "loss": 2.5528, "step": 11409 }, { "epoch": 0.31, "learning_rate": 0.0016248207319355865, "loss": 2.8561, "step": 11410 }, { "epoch": 0.31, "learning_rate": 0.001624752772130448, "loss": 2.7091, "step": 11411 }, { "epoch": 0.31, "learning_rate": 0.0016246848075922946, "loss": 2.3267, "step": 11412 }, { "epoch": 0.31, "learning_rate": 0.0016246168383216406, "loss": 2.5068, "step": 11413 }, { "epoch": 0.31, "learning_rate": 0.001624548864319001, "loss": 2.414, "step": 11414 }, { "epoch": 0.31, "learning_rate": 0.001624480885584891, "loss": 2.3354, "step": 11415 }, { "epoch": 0.31, "learning_rate": 0.0016244129021198252, "loss": 2.4396, "step": 11416 }, { "epoch": 0.31, "learning_rate": 0.0016243449139243193, "loss": 2.5967, "step": 11417 }, { "epoch": 0.31, "learning_rate": 0.0016242769209988876, "loss": 2.6858, "step": 11418 }, { "epoch": 0.31, "learning_rate": 0.0016242089233440456, "loss": 2.1027, "step": 11419 }, { "epoch": 0.31, "learning_rate": 0.0016241409209603087, "loss": 2.5218, "step": 11420 }, { "epoch": 0.31, "learning_rate": 0.0016240729138481914, "loss": 2.3715, "step": 11421 }, { "epoch": 0.31, "learning_rate": 0.0016240049020082095, "loss": 2.6773, "step": 11422 }, { "epoch": 0.31, "learning_rate": 0.0016239368854408778, "loss": 2.2305, "step": 11423 }, { "epoch": 0.31, "learning_rate": 0.001623868864146712, "loss": 2.1546, "step": 11424 }, { "epoch": 0.31, "learning_rate": 0.0016238008381262272, "loss": 2.6402, "step": 11425 }, { "epoch": 0.31, "learning_rate": 0.0016237328073799386, "loss": 2.6733, "step": 11426 }, { "epoch": 0.31, "learning_rate": 0.001623664771908362, "loss": 2.4827, "step": 11427 }, { "epoch": 0.31, "learning_rate": 0.0016235967317120125, "loss": 2.5201, "step": 11428 }, { "epoch": 0.31, "learning_rate": 0.0016235286867914058, "loss": 2.412, "step": 11429 }, { "epoch": 0.31, "learning_rate": 0.001623460637147057, "loss": 2.5447, "step": 11430 }, { "epoch": 0.31, "learning_rate": 0.001623392582779482, "loss": 3.1493, "step": 11431 }, { "epoch": 0.31, "learning_rate": 0.0016233245236891962, "loss": 2.8676, "step": 11432 }, { "epoch": 0.31, "learning_rate": 0.0016232564598767155, "loss": 2.6455, "step": 11433 }, { "epoch": 0.31, "learning_rate": 0.0016231883913425547, "loss": 2.5763, "step": 11434 }, { "epoch": 0.31, "learning_rate": 0.0016231203180872304, "loss": 2.2612, "step": 11435 }, { "epoch": 0.31, "learning_rate": 0.001623052240111258, "loss": 2.6087, "step": 11436 }, { "epoch": 0.31, "learning_rate": 0.0016229841574151535, "loss": 3.1568, "step": 11437 }, { "epoch": 0.31, "learning_rate": 0.0016229160699994319, "loss": 2.4946, "step": 11438 }, { "epoch": 0.31, "learning_rate": 0.0016228479778646098, "loss": 2.5708, "step": 11439 }, { "epoch": 0.31, "learning_rate": 0.0016227798810112028, "loss": 2.477, "step": 11440 }, { "epoch": 0.31, "learning_rate": 0.0016227117794397265, "loss": 3.03, "step": 11441 }, { "epoch": 0.31, "learning_rate": 0.001622643673150697, "loss": 2.8007, "step": 11442 }, { "epoch": 0.31, "learning_rate": 0.0016225755621446308, "loss": 2.7339, "step": 11443 }, { "epoch": 0.31, "learning_rate": 0.0016225074464220435, "loss": 2.686, "step": 11444 }, { "epoch": 0.31, "learning_rate": 0.001622439325983451, "loss": 2.5952, "step": 11445 }, { "epoch": 0.31, "learning_rate": 0.001622371200829369, "loss": 2.6765, "step": 11446 }, { "epoch": 0.31, "learning_rate": 0.001622303070960314, "loss": 2.9653, "step": 11447 }, { "epoch": 0.31, "learning_rate": 0.0016222349363768029, "loss": 2.7549, "step": 11448 }, { "epoch": 0.31, "learning_rate": 0.001622166797079351, "loss": 2.7707, "step": 11449 }, { "epoch": 0.31, "learning_rate": 0.0016220986530684743, "loss": 2.0739, "step": 11450 }, { "epoch": 0.31, "learning_rate": 0.0016220305043446897, "loss": 2.5755, "step": 11451 }, { "epoch": 0.31, "learning_rate": 0.0016219623509085128, "loss": 2.3581, "step": 11452 }, { "epoch": 0.31, "learning_rate": 0.0016218941927604606, "loss": 2.7694, "step": 11453 }, { "epoch": 0.31, "learning_rate": 0.0016218260299010491, "loss": 2.9004, "step": 11454 }, { "epoch": 0.31, "learning_rate": 0.0016217578623307952, "loss": 2.8551, "step": 11455 }, { "epoch": 0.31, "learning_rate": 0.0016216896900502146, "loss": 2.289, "step": 11456 }, { "epoch": 0.31, "learning_rate": 0.0016216215130598242, "loss": 2.8226, "step": 11457 }, { "epoch": 0.31, "learning_rate": 0.0016215533313601398, "loss": 2.7883, "step": 11458 }, { "epoch": 0.31, "learning_rate": 0.001621485144951679, "loss": 2.737, "step": 11459 }, { "epoch": 0.31, "learning_rate": 0.0016214169538349577, "loss": 2.363, "step": 11460 }, { "epoch": 0.31, "learning_rate": 0.0016213487580104928, "loss": 2.5264, "step": 11461 }, { "epoch": 0.31, "learning_rate": 0.0016212805574788004, "loss": 2.7616, "step": 11462 }, { "epoch": 0.31, "learning_rate": 0.001621212352240398, "loss": 2.3312, "step": 11463 }, { "epoch": 0.31, "learning_rate": 0.001621144142295802, "loss": 2.2647, "step": 11464 }, { "epoch": 0.31, "learning_rate": 0.0016210759276455288, "loss": 2.7446, "step": 11465 }, { "epoch": 0.31, "learning_rate": 0.0016210077082900952, "loss": 2.8227, "step": 11466 }, { "epoch": 0.31, "learning_rate": 0.0016209394842300183, "loss": 2.9444, "step": 11467 }, { "epoch": 0.31, "learning_rate": 0.001620871255465815, "loss": 2.621, "step": 11468 }, { "epoch": 0.31, "learning_rate": 0.001620803021998002, "loss": 2.7826, "step": 11469 }, { "epoch": 0.31, "learning_rate": 0.0016207347838270963, "loss": 2.4342, "step": 11470 }, { "epoch": 0.31, "learning_rate": 0.0016206665409536152, "loss": 2.6292, "step": 11471 }, { "epoch": 0.31, "learning_rate": 0.0016205982933780749, "loss": 2.6567, "step": 11472 }, { "epoch": 0.31, "learning_rate": 0.0016205300411009929, "loss": 2.579, "step": 11473 }, { "epoch": 0.31, "learning_rate": 0.0016204617841228863, "loss": 2.8612, "step": 11474 }, { "epoch": 0.31, "learning_rate": 0.0016203935224442722, "loss": 2.6955, "step": 11475 }, { "epoch": 0.31, "learning_rate": 0.001620325256065668, "loss": 2.6473, "step": 11476 }, { "epoch": 0.31, "learning_rate": 0.00162025698498759, "loss": 2.5606, "step": 11477 }, { "epoch": 0.31, "learning_rate": 0.0016201887092105564, "loss": 2.3364, "step": 11478 }, { "epoch": 0.31, "learning_rate": 0.001620120428735084, "loss": 2.6096, "step": 11479 }, { "epoch": 0.31, "learning_rate": 0.00162005214356169, "loss": 2.6264, "step": 11480 }, { "epoch": 0.31, "learning_rate": 0.0016199838536908918, "loss": 2.8015, "step": 11481 }, { "epoch": 0.31, "learning_rate": 0.0016199155591232067, "loss": 2.2255, "step": 11482 }, { "epoch": 0.31, "learning_rate": 0.001619847259859152, "loss": 2.6752, "step": 11483 }, { "epoch": 0.31, "learning_rate": 0.0016197789558992457, "loss": 3.1804, "step": 11484 }, { "epoch": 0.31, "learning_rate": 0.0016197106472440046, "loss": 2.5106, "step": 11485 }, { "epoch": 0.31, "learning_rate": 0.0016196423338939465, "loss": 2.8091, "step": 11486 }, { "epoch": 0.31, "learning_rate": 0.001619574015849589, "loss": 2.4944, "step": 11487 }, { "epoch": 0.31, "learning_rate": 0.0016195056931114491, "loss": 2.5459, "step": 11488 }, { "epoch": 0.31, "learning_rate": 0.0016194373656800449, "loss": 2.2878, "step": 11489 }, { "epoch": 0.31, "learning_rate": 0.0016193690335558945, "loss": 2.7574, "step": 11490 }, { "epoch": 0.31, "learning_rate": 0.0016193006967395146, "loss": 2.3934, "step": 11491 }, { "epoch": 0.31, "learning_rate": 0.0016192323552314234, "loss": 2.8488, "step": 11492 }, { "epoch": 0.31, "learning_rate": 0.0016191640090321387, "loss": 2.3147, "step": 11493 }, { "epoch": 0.31, "learning_rate": 0.0016190956581421778, "loss": 2.292, "step": 11494 }, { "epoch": 0.31, "learning_rate": 0.0016190273025620593, "loss": 2.7514, "step": 11495 }, { "epoch": 0.31, "learning_rate": 0.0016189589422923004, "loss": 2.5912, "step": 11496 }, { "epoch": 0.31, "learning_rate": 0.0016188905773334194, "loss": 2.6981, "step": 11497 }, { "epoch": 0.31, "learning_rate": 0.0016188222076859336, "loss": 2.5077, "step": 11498 }, { "epoch": 0.31, "learning_rate": 0.001618753833350362, "loss": 2.4708, "step": 11499 }, { "epoch": 0.31, "learning_rate": 0.0016186854543272214, "loss": 2.51, "step": 11500 }, { "epoch": 0.31, "learning_rate": 0.0016186170706170308, "loss": 2.6962, "step": 11501 }, { "epoch": 0.31, "learning_rate": 0.0016185486822203078, "loss": 2.4532, "step": 11502 }, { "epoch": 0.31, "learning_rate": 0.0016184802891375705, "loss": 2.585, "step": 11503 }, { "epoch": 0.31, "learning_rate": 0.001618411891369337, "loss": 2.5665, "step": 11504 }, { "epoch": 0.31, "learning_rate": 0.0016183434889161256, "loss": 2.6496, "step": 11505 }, { "epoch": 0.31, "learning_rate": 0.0016182750817784548, "loss": 2.2275, "step": 11506 }, { "epoch": 0.31, "learning_rate": 0.0016182066699568422, "loss": 2.8281, "step": 11507 }, { "epoch": 0.31, "learning_rate": 0.0016181382534518067, "loss": 2.3727, "step": 11508 }, { "epoch": 0.31, "learning_rate": 0.001618069832263866, "loss": 2.4244, "step": 11509 }, { "epoch": 0.31, "learning_rate": 0.0016180014063935388, "loss": 2.4628, "step": 11510 }, { "epoch": 0.31, "learning_rate": 0.0016179329758413434, "loss": 2.4275, "step": 11511 }, { "epoch": 0.31, "learning_rate": 0.0016178645406077984, "loss": 2.4418, "step": 11512 }, { "epoch": 0.31, "learning_rate": 0.001617796100693422, "loss": 2.6808, "step": 11513 }, { "epoch": 0.31, "learning_rate": 0.001617727656098733, "loss": 2.7146, "step": 11514 }, { "epoch": 0.31, "learning_rate": 0.0016176592068242496, "loss": 2.5413, "step": 11515 }, { "epoch": 0.31, "learning_rate": 0.0016175907528704903, "loss": 2.6289, "step": 11516 }, { "epoch": 0.31, "learning_rate": 0.0016175222942379742, "loss": 2.5166, "step": 11517 }, { "epoch": 0.31, "learning_rate": 0.0016174538309272192, "loss": 2.8999, "step": 11518 }, { "epoch": 0.31, "learning_rate": 0.0016173853629387444, "loss": 2.5885, "step": 11519 }, { "epoch": 0.31, "learning_rate": 0.0016173168902730687, "loss": 2.4711, "step": 11520 }, { "epoch": 0.31, "learning_rate": 0.0016172484129307106, "loss": 2.6201, "step": 11521 }, { "epoch": 0.31, "learning_rate": 0.0016171799309121888, "loss": 3.0912, "step": 11522 }, { "epoch": 0.31, "learning_rate": 0.0016171114442180225, "loss": 2.8992, "step": 11523 }, { "epoch": 0.31, "learning_rate": 0.0016170429528487298, "loss": 2.6755, "step": 11524 }, { "epoch": 0.31, "learning_rate": 0.0016169744568048298, "loss": 2.4537, "step": 11525 }, { "epoch": 0.31, "learning_rate": 0.0016169059560868422, "loss": 2.7185, "step": 11526 }, { "epoch": 0.31, "learning_rate": 0.0016168374506952852, "loss": 2.9018, "step": 11527 }, { "epoch": 0.31, "learning_rate": 0.0016167689406306777, "loss": 2.2711, "step": 11528 }, { "epoch": 0.31, "learning_rate": 0.0016167004258935394, "loss": 3.0819, "step": 11529 }, { "epoch": 0.31, "learning_rate": 0.0016166319064843883, "loss": 2.4551, "step": 11530 }, { "epoch": 0.31, "learning_rate": 0.0016165633824037449, "loss": 2.2312, "step": 11531 }, { "epoch": 0.31, "learning_rate": 0.0016164948536521269, "loss": 2.7585, "step": 11532 }, { "epoch": 0.31, "learning_rate": 0.0016164263202300545, "loss": 2.6759, "step": 11533 }, { "epoch": 0.31, "learning_rate": 0.001616357782138046, "loss": 2.8222, "step": 11534 }, { "epoch": 0.31, "learning_rate": 0.0016162892393766217, "loss": 2.6039, "step": 11535 }, { "epoch": 0.31, "learning_rate": 0.0016162206919463, "loss": 2.3147, "step": 11536 }, { "epoch": 0.31, "learning_rate": 0.0016161521398476008, "loss": 2.4722, "step": 11537 }, { "epoch": 0.31, "learning_rate": 0.001616083583081043, "loss": 2.6371, "step": 11538 }, { "epoch": 0.31, "learning_rate": 0.0016160150216471458, "loss": 2.8701, "step": 11539 }, { "epoch": 0.31, "learning_rate": 0.0016159464555464294, "loss": 2.5312, "step": 11540 }, { "epoch": 0.31, "learning_rate": 0.0016158778847794127, "loss": 2.6797, "step": 11541 }, { "epoch": 0.31, "learning_rate": 0.0016158093093466151, "loss": 2.8064, "step": 11542 }, { "epoch": 0.31, "learning_rate": 0.001615740729248556, "loss": 2.8242, "step": 11543 }, { "epoch": 0.31, "learning_rate": 0.001615672144485756, "loss": 2.2373, "step": 11544 }, { "epoch": 0.31, "learning_rate": 0.001615603555058733, "loss": 2.2803, "step": 11545 }, { "epoch": 0.31, "learning_rate": 0.0016155349609680081, "loss": 2.6521, "step": 11546 }, { "epoch": 0.31, "learning_rate": 0.0016154663622141002, "loss": 2.2962, "step": 11547 }, { "epoch": 0.31, "learning_rate": 0.0016153977587975291, "loss": 2.9109, "step": 11548 }, { "epoch": 0.31, "learning_rate": 0.0016153291507188148, "loss": 2.4291, "step": 11549 }, { "epoch": 0.31, "learning_rate": 0.001615260537978477, "loss": 2.3644, "step": 11550 }, { "epoch": 0.31, "learning_rate": 0.001615191920577035, "loss": 2.883, "step": 11551 }, { "epoch": 0.31, "learning_rate": 0.0016151232985150091, "loss": 2.5433, "step": 11552 }, { "epoch": 0.31, "learning_rate": 0.0016150546717929191, "loss": 2.3235, "step": 11553 }, { "epoch": 0.31, "learning_rate": 0.0016149860404112849, "loss": 2.7437, "step": 11554 }, { "epoch": 0.31, "learning_rate": 0.0016149174043706262, "loss": 2.6535, "step": 11555 }, { "epoch": 0.31, "learning_rate": 0.0016148487636714632, "loss": 2.4598, "step": 11556 }, { "epoch": 0.31, "learning_rate": 0.0016147801183143164, "loss": 2.3853, "step": 11557 }, { "epoch": 0.31, "learning_rate": 0.001614711468299705, "loss": 2.6059, "step": 11558 }, { "epoch": 0.31, "learning_rate": 0.0016146428136281493, "loss": 2.3158, "step": 11559 }, { "epoch": 0.31, "learning_rate": 0.0016145741543001698, "loss": 2.9243, "step": 11560 }, { "epoch": 0.31, "learning_rate": 0.001614505490316286, "loss": 2.8047, "step": 11561 }, { "epoch": 0.31, "learning_rate": 0.0016144368216770189, "loss": 2.3381, "step": 11562 }, { "epoch": 0.31, "learning_rate": 0.0016143681483828877, "loss": 2.6264, "step": 11563 }, { "epoch": 0.31, "learning_rate": 0.0016142994704344137, "loss": 2.6702, "step": 11564 }, { "epoch": 0.31, "learning_rate": 0.001614230787832117, "loss": 2.5964, "step": 11565 }, { "epoch": 0.31, "learning_rate": 0.0016141621005765173, "loss": 2.4904, "step": 11566 }, { "epoch": 0.31, "learning_rate": 0.0016140934086681352, "loss": 2.5754, "step": 11567 }, { "epoch": 0.31, "learning_rate": 0.0016140247121074914, "loss": 2.3542, "step": 11568 }, { "epoch": 0.31, "learning_rate": 0.0016139560108951062, "loss": 2.5481, "step": 11569 }, { "epoch": 0.31, "learning_rate": 0.0016138873050314999, "loss": 2.7143, "step": 11570 }, { "epoch": 0.31, "learning_rate": 0.001613818594517193, "loss": 2.5804, "step": 11571 }, { "epoch": 0.31, "learning_rate": 0.0016137498793527066, "loss": 2.6028, "step": 11572 }, { "epoch": 0.31, "learning_rate": 0.0016136811595385606, "loss": 2.4633, "step": 11573 }, { "epoch": 0.31, "learning_rate": 0.0016136124350752757, "loss": 2.6825, "step": 11574 }, { "epoch": 0.31, "learning_rate": 0.0016135437059633729, "loss": 2.4031, "step": 11575 }, { "epoch": 0.31, "learning_rate": 0.0016134749722033727, "loss": 2.4075, "step": 11576 }, { "epoch": 0.31, "learning_rate": 0.0016134062337957956, "loss": 2.7054, "step": 11577 }, { "epoch": 0.31, "learning_rate": 0.0016133374907411624, "loss": 2.3435, "step": 11578 }, { "epoch": 0.31, "learning_rate": 0.0016132687430399943, "loss": 2.5343, "step": 11579 }, { "epoch": 0.31, "learning_rate": 0.0016131999906928121, "loss": 2.9964, "step": 11580 }, { "epoch": 0.31, "learning_rate": 0.0016131312337001361, "loss": 2.5734, "step": 11581 }, { "epoch": 0.31, "learning_rate": 0.0016130624720624876, "loss": 2.7144, "step": 11582 }, { "epoch": 0.31, "learning_rate": 0.001612993705780387, "loss": 2.5442, "step": 11583 }, { "epoch": 0.31, "learning_rate": 0.0016129249348543562, "loss": 2.2232, "step": 11584 }, { "epoch": 0.31, "learning_rate": 0.0016128561592849155, "loss": 2.6144, "step": 11585 }, { "epoch": 0.31, "learning_rate": 0.001612787379072586, "loss": 2.1142, "step": 11586 }, { "epoch": 0.31, "learning_rate": 0.001612718594217889, "loss": 2.4053, "step": 11587 }, { "epoch": 0.31, "learning_rate": 0.0016126498047213454, "loss": 2.276, "step": 11588 }, { "epoch": 0.31, "learning_rate": 0.0016125810105834765, "loss": 2.6773, "step": 11589 }, { "epoch": 0.31, "learning_rate": 0.0016125122118048033, "loss": 2.0405, "step": 11590 }, { "epoch": 0.31, "learning_rate": 0.0016124434083858471, "loss": 2.6874, "step": 11591 }, { "epoch": 0.31, "learning_rate": 0.0016123746003271291, "loss": 2.2165, "step": 11592 }, { "epoch": 0.31, "learning_rate": 0.001612305787629171, "loss": 2.5906, "step": 11593 }, { "epoch": 0.31, "learning_rate": 0.001612236970292493, "loss": 2.2547, "step": 11594 }, { "epoch": 0.31, "learning_rate": 0.0016121681483176177, "loss": 2.6471, "step": 11595 }, { "epoch": 0.31, "learning_rate": 0.0016120993217050659, "loss": 2.3914, "step": 11596 }, { "epoch": 0.31, "learning_rate": 0.0016120304904553588, "loss": 2.4508, "step": 11597 }, { "epoch": 0.31, "learning_rate": 0.0016119616545690184, "loss": 2.4728, "step": 11598 }, { "epoch": 0.31, "learning_rate": 0.0016118928140465658, "loss": 2.727, "step": 11599 }, { "epoch": 0.31, "learning_rate": 0.0016118239688885227, "loss": 2.5725, "step": 11600 }, { "epoch": 0.31, "learning_rate": 0.0016117551190954105, "loss": 2.5978, "step": 11601 }, { "epoch": 0.31, "learning_rate": 0.001611686264667751, "loss": 2.5498, "step": 11602 }, { "epoch": 0.31, "learning_rate": 0.0016116174056060655, "loss": 2.9393, "step": 11603 }, { "epoch": 0.31, "learning_rate": 0.0016115485419108762, "loss": 2.3058, "step": 11604 }, { "epoch": 0.31, "learning_rate": 0.0016114796735827045, "loss": 2.4129, "step": 11605 }, { "epoch": 0.31, "learning_rate": 0.0016114108006220716, "loss": 2.4011, "step": 11606 }, { "epoch": 0.31, "learning_rate": 0.0016113419230295001, "loss": 2.5334, "step": 11607 }, { "epoch": 0.31, "learning_rate": 0.0016112730408055116, "loss": 2.3146, "step": 11608 }, { "epoch": 0.31, "learning_rate": 0.0016112041539506276, "loss": 2.5797, "step": 11609 }, { "epoch": 0.31, "learning_rate": 0.0016111352624653703, "loss": 2.2733, "step": 11610 }, { "epoch": 0.31, "learning_rate": 0.0016110663663502617, "loss": 2.5516, "step": 11611 }, { "epoch": 0.31, "learning_rate": 0.0016109974656058235, "loss": 2.5056, "step": 11612 }, { "epoch": 0.31, "learning_rate": 0.0016109285602325775, "loss": 2.7613, "step": 11613 }, { "epoch": 0.31, "learning_rate": 0.0016108596502310462, "loss": 2.2135, "step": 11614 }, { "epoch": 0.31, "learning_rate": 0.0016107907356017514, "loss": 2.8247, "step": 11615 }, { "epoch": 0.31, "learning_rate": 0.001610721816345215, "loss": 2.3528, "step": 11616 }, { "epoch": 0.31, "learning_rate": 0.0016106528924619593, "loss": 2.3775, "step": 11617 }, { "epoch": 0.31, "learning_rate": 0.0016105839639525066, "loss": 2.7092, "step": 11618 }, { "epoch": 0.31, "learning_rate": 0.001610515030817379, "loss": 2.7177, "step": 11619 }, { "epoch": 0.31, "learning_rate": 0.0016104460930570985, "loss": 2.4634, "step": 11620 }, { "epoch": 0.31, "learning_rate": 0.0016103771506721877, "loss": 2.4885, "step": 11621 }, { "epoch": 0.31, "learning_rate": 0.0016103082036631685, "loss": 2.0643, "step": 11622 }, { "epoch": 0.31, "learning_rate": 0.0016102392520305638, "loss": 2.6067, "step": 11623 }, { "epoch": 0.31, "learning_rate": 0.0016101702957748954, "loss": 2.8833, "step": 11624 }, { "epoch": 0.31, "learning_rate": 0.0016101013348966858, "loss": 2.7386, "step": 11625 }, { "epoch": 0.31, "learning_rate": 0.0016100323693964578, "loss": 2.8454, "step": 11626 }, { "epoch": 0.31, "learning_rate": 0.0016099633992747336, "loss": 2.4674, "step": 11627 }, { "epoch": 0.31, "learning_rate": 0.0016098944245320358, "loss": 2.7604, "step": 11628 }, { "epoch": 0.31, "learning_rate": 0.0016098254451688866, "loss": 2.6689, "step": 11629 }, { "epoch": 0.31, "learning_rate": 0.001609756461185809, "loss": 2.9819, "step": 11630 }, { "epoch": 0.31, "learning_rate": 0.0016096874725833254, "loss": 2.57, "step": 11631 }, { "epoch": 0.31, "learning_rate": 0.001609618479361959, "loss": 2.519, "step": 11632 }, { "epoch": 0.31, "learning_rate": 0.0016095494815222314, "loss": 2.6217, "step": 11633 }, { "epoch": 0.31, "learning_rate": 0.0016094804790646661, "loss": 2.4896, "step": 11634 }, { "epoch": 0.31, "learning_rate": 0.0016094114719897856, "loss": 2.7533, "step": 11635 }, { "epoch": 0.31, "learning_rate": 0.001609342460298113, "loss": 2.3126, "step": 11636 }, { "epoch": 0.31, "learning_rate": 0.0016092734439901704, "loss": 1.9686, "step": 11637 }, { "epoch": 0.31, "learning_rate": 0.0016092044230664815, "loss": 2.9294, "step": 11638 }, { "epoch": 0.31, "learning_rate": 0.0016091353975275686, "loss": 2.4713, "step": 11639 }, { "epoch": 0.31, "learning_rate": 0.001609066367373955, "loss": 2.7511, "step": 11640 }, { "epoch": 0.31, "learning_rate": 0.0016089973326061633, "loss": 2.7374, "step": 11641 }, { "epoch": 0.31, "learning_rate": 0.0016089282932247168, "loss": 2.7127, "step": 11642 }, { "epoch": 0.31, "learning_rate": 0.0016088592492301385, "loss": 2.6669, "step": 11643 }, { "epoch": 0.31, "learning_rate": 0.0016087902006229513, "loss": 2.3892, "step": 11644 }, { "epoch": 0.31, "learning_rate": 0.0016087211474036783, "loss": 2.8, "step": 11645 }, { "epoch": 0.31, "learning_rate": 0.0016086520895728428, "loss": 2.5205, "step": 11646 }, { "epoch": 0.31, "learning_rate": 0.001608583027130968, "loss": 2.8579, "step": 11647 }, { "epoch": 0.31, "learning_rate": 0.0016085139600785768, "loss": 2.4493, "step": 11648 }, { "epoch": 0.31, "learning_rate": 0.0016084448884161927, "loss": 2.4335, "step": 11649 }, { "epoch": 0.31, "learning_rate": 0.0016083758121443388, "loss": 2.7888, "step": 11650 }, { "epoch": 0.31, "learning_rate": 0.001608306731263539, "loss": 2.7675, "step": 11651 }, { "epoch": 0.31, "learning_rate": 0.0016082376457743153, "loss": 2.899, "step": 11652 }, { "epoch": 0.31, "learning_rate": 0.0016081685556771925, "loss": 2.9373, "step": 11653 }, { "epoch": 0.31, "learning_rate": 0.0016080994609726936, "loss": 2.3269, "step": 11654 }, { "epoch": 0.31, "learning_rate": 0.0016080303616613416, "loss": 2.6594, "step": 11655 }, { "epoch": 0.31, "learning_rate": 0.0016079612577436602, "loss": 2.2792, "step": 11656 }, { "epoch": 0.31, "learning_rate": 0.0016078921492201732, "loss": 2.5063, "step": 11657 }, { "epoch": 0.31, "learning_rate": 0.001607823036091404, "loss": 2.3335, "step": 11658 }, { "epoch": 0.31, "learning_rate": 0.001607753918357876, "loss": 2.7565, "step": 11659 }, { "epoch": 0.31, "learning_rate": 0.001607684796020113, "loss": 2.7302, "step": 11660 }, { "epoch": 0.31, "learning_rate": 0.0016076156690786388, "loss": 2.3503, "step": 11661 }, { "epoch": 0.31, "learning_rate": 0.0016075465375339766, "loss": 2.4925, "step": 11662 }, { "epoch": 0.31, "learning_rate": 0.0016074774013866506, "loss": 2.3297, "step": 11663 }, { "epoch": 0.31, "learning_rate": 0.0016074082606371844, "loss": 2.5626, "step": 11664 }, { "epoch": 0.31, "learning_rate": 0.0016073391152861018, "loss": 1.9847, "step": 11665 }, { "epoch": 0.31, "learning_rate": 0.0016072699653339269, "loss": 2.5264, "step": 11666 }, { "epoch": 0.31, "learning_rate": 0.0016072008107811833, "loss": 2.968, "step": 11667 }, { "epoch": 0.31, "learning_rate": 0.0016071316516283944, "loss": 2.5219, "step": 11668 }, { "epoch": 0.31, "learning_rate": 0.001607062487876085, "loss": 2.6601, "step": 11669 }, { "epoch": 0.31, "learning_rate": 0.0016069933195247787, "loss": 2.6031, "step": 11670 }, { "epoch": 0.31, "learning_rate": 0.0016069241465749998, "loss": 2.6158, "step": 11671 }, { "epoch": 0.31, "learning_rate": 0.0016068549690272716, "loss": 2.7596, "step": 11672 }, { "epoch": 0.31, "learning_rate": 0.001606785786882119, "loss": 2.5152, "step": 11673 }, { "epoch": 0.31, "learning_rate": 0.0016067166001400657, "loss": 2.8533, "step": 11674 }, { "epoch": 0.31, "learning_rate": 0.0016066474088016359, "loss": 2.3051, "step": 11675 }, { "epoch": 0.31, "learning_rate": 0.0016065782128673533, "loss": 2.8958, "step": 11676 }, { "epoch": 0.31, "learning_rate": 0.0016065090123377433, "loss": 2.1552, "step": 11677 }, { "epoch": 0.31, "learning_rate": 0.001606439807213329, "loss": 2.7372, "step": 11678 }, { "epoch": 0.31, "learning_rate": 0.0016063705974946356, "loss": 2.4079, "step": 11679 }, { "epoch": 0.31, "learning_rate": 0.0016063013831821866, "loss": 2.4686, "step": 11680 }, { "epoch": 0.31, "learning_rate": 0.0016062321642765066, "loss": 2.5955, "step": 11681 }, { "epoch": 0.31, "learning_rate": 0.0016061629407781207, "loss": 2.9609, "step": 11682 }, { "epoch": 0.31, "learning_rate": 0.001606093712687552, "loss": 2.2265, "step": 11683 }, { "epoch": 0.31, "learning_rate": 0.0016060244800053262, "loss": 2.7294, "step": 11684 }, { "epoch": 0.31, "learning_rate": 0.0016059552427319672, "loss": 2.6083, "step": 11685 }, { "epoch": 0.31, "learning_rate": 0.0016058860008679994, "loss": 2.7833, "step": 11686 }, { "epoch": 0.31, "learning_rate": 0.0016058167544139477, "loss": 2.4562, "step": 11687 }, { "epoch": 0.31, "learning_rate": 0.0016057475033703365, "loss": 2.1447, "step": 11688 }, { "epoch": 0.31, "learning_rate": 0.0016056782477376907, "loss": 2.7765, "step": 11689 }, { "epoch": 0.31, "learning_rate": 0.001605608987516535, "loss": 2.2574, "step": 11690 }, { "epoch": 0.31, "learning_rate": 0.0016055397227073933, "loss": 2.2497, "step": 11691 }, { "epoch": 0.31, "learning_rate": 0.0016054704533107911, "loss": 3.0325, "step": 11692 }, { "epoch": 0.31, "learning_rate": 0.0016054011793272531, "loss": 2.4743, "step": 11693 }, { "epoch": 0.31, "learning_rate": 0.001605331900757304, "loss": 2.8686, "step": 11694 }, { "epoch": 0.31, "learning_rate": 0.0016052626176014685, "loss": 2.9849, "step": 11695 }, { "epoch": 0.31, "learning_rate": 0.001605193329860272, "loss": 2.4671, "step": 11696 }, { "epoch": 0.31, "learning_rate": 0.0016051240375342388, "loss": 2.6683, "step": 11697 }, { "epoch": 0.31, "learning_rate": 0.0016050547406238943, "loss": 2.37, "step": 11698 }, { "epoch": 0.31, "learning_rate": 0.0016049854391297627, "loss": 2.8779, "step": 11699 }, { "epoch": 0.31, "learning_rate": 0.0016049161330523698, "loss": 2.5825, "step": 11700 }, { "epoch": 0.31, "learning_rate": 0.0016048468223922407, "loss": 2.8092, "step": 11701 }, { "epoch": 0.31, "learning_rate": 0.0016047775071499001, "loss": 2.5214, "step": 11702 }, { "epoch": 0.31, "learning_rate": 0.0016047081873258732, "loss": 2.4483, "step": 11703 }, { "epoch": 0.31, "learning_rate": 0.0016046388629206852, "loss": 2.7039, "step": 11704 }, { "epoch": 0.31, "learning_rate": 0.0016045695339348609, "loss": 2.2606, "step": 11705 }, { "epoch": 0.31, "learning_rate": 0.0016045002003689263, "loss": 2.4048, "step": 11706 }, { "epoch": 0.31, "learning_rate": 0.0016044308622234062, "loss": 2.5016, "step": 11707 }, { "epoch": 0.31, "learning_rate": 0.001604361519498826, "loss": 2.2282, "step": 11708 }, { "epoch": 0.31, "learning_rate": 0.0016042921721957108, "loss": 2.6411, "step": 11709 }, { "epoch": 0.31, "learning_rate": 0.0016042228203145864, "loss": 2.6417, "step": 11710 }, { "epoch": 0.31, "learning_rate": 0.0016041534638559776, "loss": 2.8456, "step": 11711 }, { "epoch": 0.31, "learning_rate": 0.0016040841028204104, "loss": 2.5766, "step": 11712 }, { "epoch": 0.31, "learning_rate": 0.0016040147372084102, "loss": 2.6256, "step": 11713 }, { "epoch": 0.31, "learning_rate": 0.001603945367020502, "loss": 2.7491, "step": 11714 }, { "epoch": 0.31, "learning_rate": 0.0016038759922572118, "loss": 2.6791, "step": 11715 }, { "epoch": 0.31, "learning_rate": 0.0016038066129190648, "loss": 2.648, "step": 11716 }, { "epoch": 0.31, "learning_rate": 0.0016037372290065872, "loss": 2.8242, "step": 11717 }, { "epoch": 0.31, "learning_rate": 0.0016036678405203042, "loss": 2.726, "step": 11718 }, { "epoch": 0.31, "learning_rate": 0.0016035984474607418, "loss": 2.8594, "step": 11719 }, { "epoch": 0.31, "learning_rate": 0.001603529049828425, "loss": 2.9469, "step": 11720 }, { "epoch": 0.31, "learning_rate": 0.0016034596476238803, "loss": 2.6388, "step": 11721 }, { "epoch": 0.32, "learning_rate": 0.0016033902408476332, "loss": 2.15, "step": 11722 }, { "epoch": 0.32, "learning_rate": 0.0016033208295002095, "loss": 2.5449, "step": 11723 }, { "epoch": 0.32, "learning_rate": 0.001603251413582135, "loss": 2.5085, "step": 11724 }, { "epoch": 0.32, "learning_rate": 0.0016031819930939358, "loss": 2.2677, "step": 11725 }, { "epoch": 0.32, "learning_rate": 0.001603112568036137, "loss": 2.5948, "step": 11726 }, { "epoch": 0.32, "learning_rate": 0.001603043138409266, "loss": 2.2353, "step": 11727 }, { "epoch": 0.32, "learning_rate": 0.0016029737042138478, "loss": 2.2798, "step": 11728 }, { "epoch": 0.32, "learning_rate": 0.0016029042654504084, "loss": 2.4611, "step": 11729 }, { "epoch": 0.32, "learning_rate": 0.0016028348221194743, "loss": 2.3871, "step": 11730 }, { "epoch": 0.32, "learning_rate": 0.0016027653742215714, "loss": 2.5754, "step": 11731 }, { "epoch": 0.32, "learning_rate": 0.0016026959217572256, "loss": 2.7272, "step": 11732 }, { "epoch": 0.32, "learning_rate": 0.0016026264647269635, "loss": 2.5987, "step": 11733 }, { "epoch": 0.32, "learning_rate": 0.0016025570031313109, "loss": 2.5201, "step": 11734 }, { "epoch": 0.32, "learning_rate": 0.001602487536970794, "loss": 2.464, "step": 11735 }, { "epoch": 0.32, "learning_rate": 0.0016024180662459393, "loss": 2.8056, "step": 11736 }, { "epoch": 0.32, "learning_rate": 0.001602348590957273, "loss": 2.8151, "step": 11737 }, { "epoch": 0.32, "learning_rate": 0.0016022791111053216, "loss": 2.7731, "step": 11738 }, { "epoch": 0.32, "learning_rate": 0.0016022096266906111, "loss": 2.686, "step": 11739 }, { "epoch": 0.32, "learning_rate": 0.0016021401377136685, "loss": 2.9324, "step": 11740 }, { "epoch": 0.32, "learning_rate": 0.00160207064417502, "loss": 2.403, "step": 11741 }, { "epoch": 0.32, "learning_rate": 0.0016020011460751915, "loss": 3.0632, "step": 11742 }, { "epoch": 0.32, "learning_rate": 0.00160193164341471, "loss": 2.7517, "step": 11743 }, { "epoch": 0.32, "learning_rate": 0.0016018621361941021, "loss": 2.6529, "step": 11744 }, { "epoch": 0.32, "learning_rate": 0.0016017926244138946, "loss": 2.2153, "step": 11745 }, { "epoch": 0.32, "learning_rate": 0.001601723108074613, "loss": 2.6139, "step": 11746 }, { "epoch": 0.32, "learning_rate": 0.0016016535871767852, "loss": 2.5724, "step": 11747 }, { "epoch": 0.32, "learning_rate": 0.0016015840617209373, "loss": 2.9866, "step": 11748 }, { "epoch": 0.32, "learning_rate": 0.001601514531707596, "loss": 2.6218, "step": 11749 }, { "epoch": 0.32, "learning_rate": 0.0016014449971372881, "loss": 2.4867, "step": 11750 }, { "epoch": 0.32, "learning_rate": 0.0016013754580105407, "loss": 2.6513, "step": 11751 }, { "epoch": 0.32, "learning_rate": 0.0016013059143278803, "loss": 2.4719, "step": 11752 }, { "epoch": 0.32, "learning_rate": 0.0016012363660898336, "loss": 2.8471, "step": 11753 }, { "epoch": 0.32, "learning_rate": 0.0016011668132969276, "loss": 2.6821, "step": 11754 }, { "epoch": 0.32, "learning_rate": 0.00160109725594969, "loss": 2.5228, "step": 11755 }, { "epoch": 0.32, "learning_rate": 0.0016010276940486463, "loss": 2.7737, "step": 11756 }, { "epoch": 0.32, "learning_rate": 0.0016009581275943248, "loss": 2.5081, "step": 11757 }, { "epoch": 0.32, "learning_rate": 0.0016008885565872513, "loss": 2.6831, "step": 11758 }, { "epoch": 0.32, "learning_rate": 0.0016008189810279541, "loss": 2.2967, "step": 11759 }, { "epoch": 0.32, "learning_rate": 0.0016007494009169596, "loss": 2.0592, "step": 11760 }, { "epoch": 0.32, "learning_rate": 0.001600679816254795, "loss": 2.9507, "step": 11761 }, { "epoch": 0.32, "learning_rate": 0.0016006102270419873, "loss": 2.8386, "step": 11762 }, { "epoch": 0.32, "learning_rate": 0.0016005406332790639, "loss": 2.453, "step": 11763 }, { "epoch": 0.32, "learning_rate": 0.0016004710349665522, "loss": 2.622, "step": 11764 }, { "epoch": 0.32, "learning_rate": 0.0016004014321049794, "loss": 2.4229, "step": 11765 }, { "epoch": 0.32, "learning_rate": 0.0016003318246948727, "loss": 1.8687, "step": 11766 }, { "epoch": 0.32, "learning_rate": 0.0016002622127367593, "loss": 2.9054, "step": 11767 }, { "epoch": 0.32, "learning_rate": 0.0016001925962311665, "loss": 2.6732, "step": 11768 }, { "epoch": 0.32, "learning_rate": 0.0016001229751786221, "loss": 2.733, "step": 11769 }, { "epoch": 0.32, "learning_rate": 0.0016000533495796531, "loss": 2.5614, "step": 11770 }, { "epoch": 0.32, "learning_rate": 0.0015999837194347877, "loss": 2.7737, "step": 11771 }, { "epoch": 0.32, "learning_rate": 0.0015999140847445525, "loss": 2.3315, "step": 11772 }, { "epoch": 0.32, "learning_rate": 0.0015998444455094757, "loss": 2.6687, "step": 11773 }, { "epoch": 0.32, "learning_rate": 0.0015997748017300847, "loss": 2.7324, "step": 11774 }, { "epoch": 0.32, "learning_rate": 0.0015997051534069064, "loss": 2.5213, "step": 11775 }, { "epoch": 0.32, "learning_rate": 0.0015996355005404696, "loss": 2.6002, "step": 11776 }, { "epoch": 0.32, "learning_rate": 0.0015995658431313014, "loss": 2.256, "step": 11777 }, { "epoch": 0.32, "learning_rate": 0.0015994961811799295, "loss": 2.5112, "step": 11778 }, { "epoch": 0.32, "learning_rate": 0.0015994265146868818, "loss": 2.5939, "step": 11779 }, { "epoch": 0.32, "learning_rate": 0.001599356843652686, "loss": 2.3351, "step": 11780 }, { "epoch": 0.32, "learning_rate": 0.0015992871680778698, "loss": 2.7926, "step": 11781 }, { "epoch": 0.32, "learning_rate": 0.001599217487962961, "loss": 2.7293, "step": 11782 }, { "epoch": 0.32, "learning_rate": 0.001599147803308488, "loss": 2.463, "step": 11783 }, { "epoch": 0.32, "learning_rate": 0.0015990781141149784, "loss": 2.5045, "step": 11784 }, { "epoch": 0.32, "learning_rate": 0.0015990084203829596, "loss": 2.6976, "step": 11785 }, { "epoch": 0.32, "learning_rate": 0.0015989387221129606, "loss": 2.6662, "step": 11786 }, { "epoch": 0.32, "learning_rate": 0.0015988690193055087, "loss": 2.5516, "step": 11787 }, { "epoch": 0.32, "learning_rate": 0.0015987993119611322, "loss": 2.7321, "step": 11788 }, { "epoch": 0.32, "learning_rate": 0.001598729600080359, "loss": 2.9947, "step": 11789 }, { "epoch": 0.32, "learning_rate": 0.0015986598836637176, "loss": 2.3288, "step": 11790 }, { "epoch": 0.32, "learning_rate": 0.001598590162711736, "loss": 2.4962, "step": 11791 }, { "epoch": 0.32, "learning_rate": 0.0015985204372249422, "loss": 2.5382, "step": 11792 }, { "epoch": 0.32, "learning_rate": 0.0015984507072038644, "loss": 2.4633, "step": 11793 }, { "epoch": 0.32, "learning_rate": 0.0015983809726490318, "loss": 2.6681, "step": 11794 }, { "epoch": 0.32, "learning_rate": 0.0015983112335609714, "loss": 2.8783, "step": 11795 }, { "epoch": 0.32, "learning_rate": 0.0015982414899402117, "loss": 2.5835, "step": 11796 }, { "epoch": 0.32, "learning_rate": 0.0015981717417872818, "loss": 2.25, "step": 11797 }, { "epoch": 0.32, "learning_rate": 0.0015981019891027097, "loss": 2.5461, "step": 11798 }, { "epoch": 0.32, "learning_rate": 0.0015980322318870242, "loss": 2.1874, "step": 11799 }, { "epoch": 0.32, "learning_rate": 0.001597962470140753, "loss": 2.6903, "step": 11800 }, { "epoch": 0.32, "learning_rate": 0.0015978927038644251, "loss": 2.2632, "step": 11801 }, { "epoch": 0.32, "learning_rate": 0.001597822933058569, "loss": 2.3953, "step": 11802 }, { "epoch": 0.32, "learning_rate": 0.0015977531577237131, "loss": 2.2998, "step": 11803 }, { "epoch": 0.32, "learning_rate": 0.0015976833778603863, "loss": 2.4443, "step": 11804 }, { "epoch": 0.32, "learning_rate": 0.001597613593469117, "loss": 2.5368, "step": 11805 }, { "epoch": 0.32, "learning_rate": 0.0015975438045504342, "loss": 2.7202, "step": 11806 }, { "epoch": 0.32, "learning_rate": 0.0015974740111048661, "loss": 2.9892, "step": 11807 }, { "epoch": 0.32, "learning_rate": 0.001597404213132942, "loss": 2.8834, "step": 11808 }, { "epoch": 0.32, "learning_rate": 0.00159733441063519, "loss": 2.474, "step": 11809 }, { "epoch": 0.32, "learning_rate": 0.0015972646036121396, "loss": 2.7992, "step": 11810 }, { "epoch": 0.32, "learning_rate": 0.0015971947920643194, "loss": 2.338, "step": 11811 }, { "epoch": 0.32, "learning_rate": 0.0015971249759922578, "loss": 2.8889, "step": 11812 }, { "epoch": 0.32, "learning_rate": 0.0015970551553964847, "loss": 2.6628, "step": 11813 }, { "epoch": 0.32, "learning_rate": 0.0015969853302775282, "loss": 2.4319, "step": 11814 }, { "epoch": 0.32, "learning_rate": 0.0015969155006359175, "loss": 2.5387, "step": 11815 }, { "epoch": 0.32, "learning_rate": 0.0015968456664721816, "loss": 2.6177, "step": 11816 }, { "epoch": 0.32, "learning_rate": 0.0015967758277868498, "loss": 2.2217, "step": 11817 }, { "epoch": 0.32, "learning_rate": 0.001596705984580451, "loss": 2.7702, "step": 11818 }, { "epoch": 0.32, "learning_rate": 0.0015966361368535144, "loss": 2.4698, "step": 11819 }, { "epoch": 0.32, "learning_rate": 0.001596566284606569, "loss": 2.5556, "step": 11820 }, { "epoch": 0.32, "learning_rate": 0.0015964964278401444, "loss": 2.3418, "step": 11821 }, { "epoch": 0.32, "learning_rate": 0.001596426566554769, "loss": 2.4414, "step": 11822 }, { "epoch": 0.32, "learning_rate": 0.001596356700750973, "loss": 2.8746, "step": 11823 }, { "epoch": 0.32, "learning_rate": 0.0015962868304292847, "loss": 2.6925, "step": 11824 }, { "epoch": 0.32, "learning_rate": 0.0015962169555902347, "loss": 2.7903, "step": 11825 }, { "epoch": 0.32, "learning_rate": 0.001596147076234351, "loss": 2.9735, "step": 11826 }, { "epoch": 0.32, "learning_rate": 0.0015960771923621642, "loss": 2.7269, "step": 11827 }, { "epoch": 0.32, "learning_rate": 0.0015960073039742028, "loss": 2.0997, "step": 11828 }, { "epoch": 0.32, "learning_rate": 0.0015959374110709966, "loss": 2.2557, "step": 11829 }, { "epoch": 0.32, "learning_rate": 0.001595867513653075, "loss": 2.8573, "step": 11830 }, { "epoch": 0.32, "learning_rate": 0.001595797611720968, "loss": 3.0838, "step": 11831 }, { "epoch": 0.32, "learning_rate": 0.0015957277052752047, "loss": 2.5515, "step": 11832 }, { "epoch": 0.32, "learning_rate": 0.0015956577943163147, "loss": 2.5275, "step": 11833 }, { "epoch": 0.32, "learning_rate": 0.001595587878844828, "loss": 2.1963, "step": 11834 }, { "epoch": 0.32, "learning_rate": 0.0015955179588612737, "loss": 2.9257, "step": 11835 }, { "epoch": 0.32, "learning_rate": 0.001595448034366182, "loss": 2.7686, "step": 11836 }, { "epoch": 0.32, "learning_rate": 0.0015953781053600821, "loss": 2.3054, "step": 11837 }, { "epoch": 0.32, "learning_rate": 0.0015953081718435044, "loss": 2.5869, "step": 11838 }, { "epoch": 0.32, "learning_rate": 0.0015952382338169785, "loss": 2.5972, "step": 11839 }, { "epoch": 0.32, "learning_rate": 0.0015951682912810341, "loss": 2.7408, "step": 11840 }, { "epoch": 0.32, "learning_rate": 0.0015950983442362013, "loss": 2.5544, "step": 11841 }, { "epoch": 0.32, "learning_rate": 0.0015950283926830097, "loss": 2.772, "step": 11842 }, { "epoch": 0.32, "learning_rate": 0.001594958436621989, "loss": 2.2128, "step": 11843 }, { "epoch": 0.32, "learning_rate": 0.0015948884760536698, "loss": 2.4175, "step": 11844 }, { "epoch": 0.32, "learning_rate": 0.0015948185109785822, "loss": 2.6173, "step": 11845 }, { "epoch": 0.32, "learning_rate": 0.0015947485413972556, "loss": 2.4511, "step": 11846 }, { "epoch": 0.32, "learning_rate": 0.0015946785673102205, "loss": 2.4631, "step": 11847 }, { "epoch": 0.32, "learning_rate": 0.0015946085887180068, "loss": 3.228, "step": 11848 }, { "epoch": 0.32, "learning_rate": 0.0015945386056211448, "loss": 2.6479, "step": 11849 }, { "epoch": 0.32, "learning_rate": 0.0015944686180201647, "loss": 2.4019, "step": 11850 }, { "epoch": 0.32, "learning_rate": 0.0015943986259155962, "loss": 2.6217, "step": 11851 }, { "epoch": 0.32, "learning_rate": 0.0015943286293079704, "loss": 2.3256, "step": 11852 }, { "epoch": 0.32, "learning_rate": 0.001594258628197817, "loss": 3.0706, "step": 11853 }, { "epoch": 0.32, "learning_rate": 0.0015941886225856665, "loss": 2.3794, "step": 11854 }, { "epoch": 0.32, "learning_rate": 0.0015941186124720493, "loss": 2.2536, "step": 11855 }, { "epoch": 0.32, "learning_rate": 0.0015940485978574958, "loss": 2.2708, "step": 11856 }, { "epoch": 0.32, "learning_rate": 0.0015939785787425361, "loss": 2.7495, "step": 11857 }, { "epoch": 0.32, "learning_rate": 0.001593908555127701, "loss": 2.1374, "step": 11858 }, { "epoch": 0.32, "learning_rate": 0.0015938385270135207, "loss": 2.275, "step": 11859 }, { "epoch": 0.32, "learning_rate": 0.0015937684944005261, "loss": 2.4446, "step": 11860 }, { "epoch": 0.32, "learning_rate": 0.0015936984572892474, "loss": 2.2581, "step": 11861 }, { "epoch": 0.32, "learning_rate": 0.0015936284156802154, "loss": 2.5837, "step": 11862 }, { "epoch": 0.32, "learning_rate": 0.0015935583695739605, "loss": 2.3193, "step": 11863 }, { "epoch": 0.32, "learning_rate": 0.0015934883189710138, "loss": 2.5247, "step": 11864 }, { "epoch": 0.32, "learning_rate": 0.0015934182638719058, "loss": 2.408, "step": 11865 }, { "epoch": 0.32, "learning_rate": 0.0015933482042771667, "loss": 2.6832, "step": 11866 }, { "epoch": 0.32, "learning_rate": 0.0015932781401873277, "loss": 2.7003, "step": 11867 }, { "epoch": 0.32, "learning_rate": 0.0015932080716029198, "loss": 2.5285, "step": 11868 }, { "epoch": 0.32, "learning_rate": 0.001593137998524474, "loss": 2.504, "step": 11869 }, { "epoch": 0.32, "learning_rate": 0.00159306792095252, "loss": 2.3361, "step": 11870 }, { "epoch": 0.32, "learning_rate": 0.0015929978388875897, "loss": 3.107, "step": 11871 }, { "epoch": 0.32, "learning_rate": 0.0015929277523302142, "loss": 3.1656, "step": 11872 }, { "epoch": 0.32, "learning_rate": 0.0015928576612809235, "loss": 2.7209, "step": 11873 }, { "epoch": 0.32, "learning_rate": 0.0015927875657402494, "loss": 2.3748, "step": 11874 }, { "epoch": 0.32, "learning_rate": 0.0015927174657087227, "loss": 2.6502, "step": 11875 }, { "epoch": 0.32, "learning_rate": 0.0015926473611868744, "loss": 2.4593, "step": 11876 }, { "epoch": 0.32, "learning_rate": 0.0015925772521752357, "loss": 2.4167, "step": 11877 }, { "epoch": 0.32, "learning_rate": 0.0015925071386743376, "loss": 2.7013, "step": 11878 }, { "epoch": 0.32, "learning_rate": 0.0015924370206847115, "loss": 2.4756, "step": 11879 }, { "epoch": 0.32, "learning_rate": 0.0015923668982068882, "loss": 2.7688, "step": 11880 }, { "epoch": 0.32, "learning_rate": 0.0015922967712413993, "loss": 2.9924, "step": 11881 }, { "epoch": 0.32, "learning_rate": 0.001592226639788776, "loss": 2.8884, "step": 11882 }, { "epoch": 0.32, "learning_rate": 0.0015921565038495493, "loss": 2.6433, "step": 11883 }, { "epoch": 0.32, "learning_rate": 0.0015920863634242513, "loss": 2.5819, "step": 11884 }, { "epoch": 0.32, "learning_rate": 0.0015920162185134126, "loss": 2.5547, "step": 11885 }, { "epoch": 0.32, "learning_rate": 0.0015919460691175647, "loss": 3.1274, "step": 11886 }, { "epoch": 0.32, "learning_rate": 0.0015918759152372395, "loss": 3.0078, "step": 11887 }, { "epoch": 0.32, "learning_rate": 0.0015918057568729681, "loss": 2.9131, "step": 11888 }, { "epoch": 0.32, "learning_rate": 0.001591735594025282, "loss": 2.7098, "step": 11889 }, { "epoch": 0.32, "learning_rate": 0.001591665426694713, "loss": 2.2714, "step": 11890 }, { "epoch": 0.32, "learning_rate": 0.0015915952548817922, "loss": 2.5203, "step": 11891 }, { "epoch": 0.32, "learning_rate": 0.001591525078587052, "loss": 3.0532, "step": 11892 }, { "epoch": 0.32, "learning_rate": 0.001591454897811023, "loss": 2.5112, "step": 11893 }, { "epoch": 0.32, "learning_rate": 0.0015913847125542376, "loss": 2.2758, "step": 11894 }, { "epoch": 0.32, "learning_rate": 0.0015913145228172274, "loss": 2.8645, "step": 11895 }, { "epoch": 0.32, "learning_rate": 0.0015912443286005243, "loss": 2.8391, "step": 11896 }, { "epoch": 0.32, "learning_rate": 0.0015911741299046596, "loss": 2.8494, "step": 11897 }, { "epoch": 0.32, "learning_rate": 0.0015911039267301654, "loss": 2.2074, "step": 11898 }, { "epoch": 0.32, "learning_rate": 0.001591033719077574, "loss": 2.6847, "step": 11899 }, { "epoch": 0.32, "learning_rate": 0.0015909635069474165, "loss": 2.6438, "step": 11900 }, { "epoch": 0.32, "learning_rate": 0.0015908932903402249, "loss": 2.6929, "step": 11901 }, { "epoch": 0.32, "learning_rate": 0.0015908230692565316, "loss": 2.7826, "step": 11902 }, { "epoch": 0.32, "learning_rate": 0.0015907528436968682, "loss": 2.7025, "step": 11903 }, { "epoch": 0.32, "learning_rate": 0.001590682613661767, "loss": 2.661, "step": 11904 }, { "epoch": 0.32, "learning_rate": 0.0015906123791517598, "loss": 2.705, "step": 11905 }, { "epoch": 0.32, "learning_rate": 0.0015905421401673787, "loss": 2.5855, "step": 11906 }, { "epoch": 0.32, "learning_rate": 0.0015904718967091563, "loss": 2.4911, "step": 11907 }, { "epoch": 0.32, "learning_rate": 0.0015904016487776243, "loss": 2.9905, "step": 11908 }, { "epoch": 0.32, "learning_rate": 0.0015903313963733145, "loss": 2.4072, "step": 11909 }, { "epoch": 0.32, "learning_rate": 0.0015902611394967604, "loss": 2.6092, "step": 11910 }, { "epoch": 0.32, "learning_rate": 0.0015901908781484927, "loss": 2.6587, "step": 11911 }, { "epoch": 0.32, "learning_rate": 0.0015901206123290449, "loss": 2.4232, "step": 11912 }, { "epoch": 0.32, "learning_rate": 0.0015900503420389486, "loss": 2.4885, "step": 11913 }, { "epoch": 0.32, "learning_rate": 0.0015899800672787364, "loss": 2.6647, "step": 11914 }, { "epoch": 0.32, "learning_rate": 0.0015899097880489408, "loss": 2.3406, "step": 11915 }, { "epoch": 0.32, "learning_rate": 0.0015898395043500942, "loss": 2.4623, "step": 11916 }, { "epoch": 0.32, "learning_rate": 0.0015897692161827286, "loss": 2.1971, "step": 11917 }, { "epoch": 0.32, "learning_rate": 0.001589698923547377, "loss": 2.7765, "step": 11918 }, { "epoch": 0.32, "learning_rate": 0.001589628626444572, "loss": 2.4982, "step": 11919 }, { "epoch": 0.32, "learning_rate": 0.0015895583248748458, "loss": 2.6833, "step": 11920 }, { "epoch": 0.32, "learning_rate": 0.001589488018838731, "loss": 2.8099, "step": 11921 }, { "epoch": 0.32, "learning_rate": 0.0015894177083367604, "loss": 2.3877, "step": 11922 }, { "epoch": 0.32, "learning_rate": 0.0015893473933694668, "loss": 2.7135, "step": 11923 }, { "epoch": 0.32, "learning_rate": 0.0015892770739373827, "loss": 2.2173, "step": 11924 }, { "epoch": 0.32, "learning_rate": 0.0015892067500410407, "loss": 2.7294, "step": 11925 }, { "epoch": 0.32, "learning_rate": 0.0015891364216809739, "loss": 2.6377, "step": 11926 }, { "epoch": 0.32, "learning_rate": 0.0015890660888577147, "loss": 2.5828, "step": 11927 }, { "epoch": 0.32, "learning_rate": 0.001588995751571796, "loss": 2.7388, "step": 11928 }, { "epoch": 0.32, "learning_rate": 0.001588925409823751, "loss": 2.3003, "step": 11929 }, { "epoch": 0.32, "learning_rate": 0.0015888550636141126, "loss": 2.6969, "step": 11930 }, { "epoch": 0.32, "learning_rate": 0.0015887847129434133, "loss": 2.6805, "step": 11931 }, { "epoch": 0.32, "learning_rate": 0.001588714357812186, "loss": 2.738, "step": 11932 }, { "epoch": 0.32, "learning_rate": 0.0015886439982209645, "loss": 2.9177, "step": 11933 }, { "epoch": 0.32, "learning_rate": 0.001588573634170281, "loss": 2.1723, "step": 11934 }, { "epoch": 0.32, "learning_rate": 0.0015885032656606688, "loss": 2.8698, "step": 11935 }, { "epoch": 0.32, "learning_rate": 0.0015884328926926612, "loss": 2.8278, "step": 11936 }, { "epoch": 0.32, "learning_rate": 0.001588362515266791, "loss": 3.0835, "step": 11937 }, { "epoch": 0.32, "learning_rate": 0.001588292133383592, "loss": 3.0244, "step": 11938 }, { "epoch": 0.32, "learning_rate": 0.0015882217470435966, "loss": 2.7062, "step": 11939 }, { "epoch": 0.32, "learning_rate": 0.0015881513562473386, "loss": 2.5438, "step": 11940 }, { "epoch": 0.32, "learning_rate": 0.001588080960995351, "loss": 2.2976, "step": 11941 }, { "epoch": 0.32, "learning_rate": 0.0015880105612881671, "loss": 2.3305, "step": 11942 }, { "epoch": 0.32, "learning_rate": 0.0015879401571263208, "loss": 2.3403, "step": 11943 }, { "epoch": 0.32, "learning_rate": 0.0015878697485103446, "loss": 2.6539, "step": 11944 }, { "epoch": 0.32, "learning_rate": 0.0015877993354407724, "loss": 3.0024, "step": 11945 }, { "epoch": 0.32, "learning_rate": 0.0015877289179181374, "loss": 2.643, "step": 11946 }, { "epoch": 0.32, "learning_rate": 0.0015876584959429731, "loss": 2.8434, "step": 11947 }, { "epoch": 0.32, "learning_rate": 0.001587588069515813, "loss": 2.7767, "step": 11948 }, { "epoch": 0.32, "learning_rate": 0.0015875176386371912, "loss": 2.7235, "step": 11949 }, { "epoch": 0.32, "learning_rate": 0.0015874472033076405, "loss": 2.268, "step": 11950 }, { "epoch": 0.32, "learning_rate": 0.0015873767635276948, "loss": 2.4488, "step": 11951 }, { "epoch": 0.32, "learning_rate": 0.0015873063192978877, "loss": 2.5697, "step": 11952 }, { "epoch": 0.32, "learning_rate": 0.0015872358706187533, "loss": 2.9245, "step": 11953 }, { "epoch": 0.32, "learning_rate": 0.0015871654174908249, "loss": 2.7477, "step": 11954 }, { "epoch": 0.32, "learning_rate": 0.0015870949599146359, "loss": 2.5681, "step": 11955 }, { "epoch": 0.32, "learning_rate": 0.0015870244978907204, "loss": 2.2966, "step": 11956 }, { "epoch": 0.32, "learning_rate": 0.0015869540314196126, "loss": 2.4322, "step": 11957 }, { "epoch": 0.32, "learning_rate": 0.0015868835605018458, "loss": 2.7064, "step": 11958 }, { "epoch": 0.32, "learning_rate": 0.0015868130851379543, "loss": 2.3645, "step": 11959 }, { "epoch": 0.32, "learning_rate": 0.0015867426053284715, "loss": 2.5537, "step": 11960 }, { "epoch": 0.32, "learning_rate": 0.0015866721210739316, "loss": 2.3972, "step": 11961 }, { "epoch": 0.32, "learning_rate": 0.0015866016323748688, "loss": 2.4764, "step": 11962 }, { "epoch": 0.32, "learning_rate": 0.0015865311392318168, "loss": 2.3781, "step": 11963 }, { "epoch": 0.32, "learning_rate": 0.0015864606416453096, "loss": 2.6466, "step": 11964 }, { "epoch": 0.32, "learning_rate": 0.0015863901396158818, "loss": 2.3388, "step": 11965 }, { "epoch": 0.32, "learning_rate": 0.001586319633144067, "loss": 2.6483, "step": 11966 }, { "epoch": 0.32, "learning_rate": 0.0015862491222303995, "loss": 2.6972, "step": 11967 }, { "epoch": 0.32, "learning_rate": 0.0015861786068754134, "loss": 2.305, "step": 11968 }, { "epoch": 0.32, "learning_rate": 0.001586108087079643, "loss": 3.0938, "step": 11969 }, { "epoch": 0.32, "learning_rate": 0.0015860375628436224, "loss": 2.8705, "step": 11970 }, { "epoch": 0.32, "learning_rate": 0.001585967034167886, "loss": 3.2138, "step": 11971 }, { "epoch": 0.32, "learning_rate": 0.001585896501052968, "loss": 2.8337, "step": 11972 }, { "epoch": 0.32, "learning_rate": 0.0015858259634994032, "loss": 2.7012, "step": 11973 }, { "epoch": 0.32, "learning_rate": 0.0015857554215077255, "loss": 2.6707, "step": 11974 }, { "epoch": 0.32, "learning_rate": 0.0015856848750784693, "loss": 2.2667, "step": 11975 }, { "epoch": 0.32, "learning_rate": 0.0015856143242121694, "loss": 2.3697, "step": 11976 }, { "epoch": 0.32, "learning_rate": 0.00158554376890936, "loss": 2.2156, "step": 11977 }, { "epoch": 0.32, "learning_rate": 0.0015854732091705758, "loss": 2.2805, "step": 11978 }, { "epoch": 0.32, "learning_rate": 0.0015854026449963513, "loss": 2.5645, "step": 11979 }, { "epoch": 0.32, "learning_rate": 0.0015853320763872206, "loss": 2.3323, "step": 11980 }, { "epoch": 0.32, "learning_rate": 0.0015852615033437193, "loss": 2.8768, "step": 11981 }, { "epoch": 0.32, "learning_rate": 0.001585190925866381, "loss": 2.0348, "step": 11982 }, { "epoch": 0.32, "learning_rate": 0.001585120343955741, "loss": 2.1075, "step": 11983 }, { "epoch": 0.32, "learning_rate": 0.001585049757612334, "loss": 2.7277, "step": 11984 }, { "epoch": 0.32, "learning_rate": 0.0015849791668366944, "loss": 2.5528, "step": 11985 }, { "epoch": 0.32, "learning_rate": 0.0015849085716293577, "loss": 2.571, "step": 11986 }, { "epoch": 0.32, "learning_rate": 0.0015848379719908576, "loss": 2.1873, "step": 11987 }, { "epoch": 0.32, "learning_rate": 0.0015847673679217301, "loss": 2.8532, "step": 11988 }, { "epoch": 0.32, "learning_rate": 0.0015846967594225095, "loss": 2.8259, "step": 11989 }, { "epoch": 0.32, "learning_rate": 0.0015846261464937306, "loss": 2.5415, "step": 11990 }, { "epoch": 0.32, "learning_rate": 0.0015845555291359283, "loss": 2.7679, "step": 11991 }, { "epoch": 0.32, "learning_rate": 0.0015844849073496383, "loss": 2.4277, "step": 11992 }, { "epoch": 0.32, "learning_rate": 0.0015844142811353948, "loss": 2.8568, "step": 11993 }, { "epoch": 0.32, "learning_rate": 0.0015843436504937337, "loss": 2.8366, "step": 11994 }, { "epoch": 0.32, "learning_rate": 0.0015842730154251887, "loss": 2.8668, "step": 11995 }, { "epoch": 0.32, "learning_rate": 0.0015842023759302965, "loss": 2.5141, "step": 11996 }, { "epoch": 0.32, "learning_rate": 0.0015841317320095913, "loss": 2.5021, "step": 11997 }, { "epoch": 0.32, "learning_rate": 0.0015840610836636087, "loss": 2.374, "step": 11998 }, { "epoch": 0.32, "learning_rate": 0.0015839904308928836, "loss": 2.6471, "step": 11999 }, { "epoch": 0.32, "learning_rate": 0.0015839197736979514, "loss": 2.9218, "step": 12000 }, { "epoch": 0.32, "learning_rate": 0.0015838491120793476, "loss": 2.5153, "step": 12001 }, { "epoch": 0.32, "learning_rate": 0.0015837784460376071, "loss": 2.4186, "step": 12002 }, { "epoch": 0.32, "learning_rate": 0.0015837077755732655, "loss": 3.0265, "step": 12003 }, { "epoch": 0.32, "learning_rate": 0.0015836371006868579, "loss": 2.777, "step": 12004 }, { "epoch": 0.32, "learning_rate": 0.0015835664213789205, "loss": 3.0768, "step": 12005 }, { "epoch": 0.32, "learning_rate": 0.0015834957376499878, "loss": 2.605, "step": 12006 }, { "epoch": 0.32, "learning_rate": 0.0015834250495005957, "loss": 2.9666, "step": 12007 }, { "epoch": 0.32, "learning_rate": 0.00158335435693128, "loss": 2.0627, "step": 12008 }, { "epoch": 0.32, "learning_rate": 0.0015832836599425758, "loss": 2.5561, "step": 12009 }, { "epoch": 0.32, "learning_rate": 0.001583212958535019, "loss": 2.7867, "step": 12010 }, { "epoch": 0.32, "learning_rate": 0.0015831422527091453, "loss": 2.3393, "step": 12011 }, { "epoch": 0.32, "learning_rate": 0.0015830715424654898, "loss": 2.5748, "step": 12012 }, { "epoch": 0.32, "learning_rate": 0.0015830008278045888, "loss": 2.3383, "step": 12013 }, { "epoch": 0.32, "learning_rate": 0.0015829301087269775, "loss": 2.5213, "step": 12014 }, { "epoch": 0.32, "learning_rate": 0.0015828593852331915, "loss": 2.2188, "step": 12015 }, { "epoch": 0.32, "learning_rate": 0.0015827886573237678, "loss": 2.3921, "step": 12016 }, { "epoch": 0.32, "learning_rate": 0.0015827179249992412, "loss": 2.5896, "step": 12017 }, { "epoch": 0.32, "learning_rate": 0.0015826471882601477, "loss": 2.8075, "step": 12018 }, { "epoch": 0.32, "learning_rate": 0.001582576447107023, "loss": 2.7765, "step": 12019 }, { "epoch": 0.32, "learning_rate": 0.0015825057015404038, "loss": 2.7501, "step": 12020 }, { "epoch": 0.32, "learning_rate": 0.0015824349515608253, "loss": 2.9719, "step": 12021 }, { "epoch": 0.32, "learning_rate": 0.0015823641971688235, "loss": 2.3602, "step": 12022 }, { "epoch": 0.32, "learning_rate": 0.001582293438364935, "loss": 2.483, "step": 12023 }, { "epoch": 0.32, "learning_rate": 0.0015822226751496956, "loss": 2.5617, "step": 12024 }, { "epoch": 0.32, "learning_rate": 0.0015821519075236413, "loss": 2.5489, "step": 12025 }, { "epoch": 0.32, "learning_rate": 0.001582081135487308, "loss": 2.521, "step": 12026 }, { "epoch": 0.32, "learning_rate": 0.001582010359041232, "loss": 2.3953, "step": 12027 }, { "epoch": 0.32, "learning_rate": 0.0015819395781859497, "loss": 2.6271, "step": 12028 }, { "epoch": 0.32, "learning_rate": 0.0015818687929219973, "loss": 2.4262, "step": 12029 }, { "epoch": 0.32, "learning_rate": 0.0015817980032499107, "loss": 2.3222, "step": 12030 }, { "epoch": 0.32, "learning_rate": 0.001581727209170227, "loss": 2.5892, "step": 12031 }, { "epoch": 0.32, "learning_rate": 0.0015816564106834812, "loss": 2.6253, "step": 12032 }, { "epoch": 0.32, "learning_rate": 0.001581585607790211, "loss": 2.4379, "step": 12033 }, { "epoch": 0.32, "learning_rate": 0.001581514800490952, "loss": 2.5392, "step": 12034 }, { "epoch": 0.32, "learning_rate": 0.0015814439887862407, "loss": 2.3842, "step": 12035 }, { "epoch": 0.32, "learning_rate": 0.0015813731726766142, "loss": 2.5491, "step": 12036 }, { "epoch": 0.32, "learning_rate": 0.001581302352162608, "loss": 2.2397, "step": 12037 }, { "epoch": 0.32, "learning_rate": 0.0015812315272447591, "loss": 2.2941, "step": 12038 }, { "epoch": 0.32, "learning_rate": 0.0015811606979236042, "loss": 2.6681, "step": 12039 }, { "epoch": 0.32, "learning_rate": 0.0015810898641996798, "loss": 2.8574, "step": 12040 }, { "epoch": 0.32, "learning_rate": 0.0015810190260735224, "loss": 2.1522, "step": 12041 }, { "epoch": 0.32, "learning_rate": 0.0015809481835456687, "loss": 2.6561, "step": 12042 }, { "epoch": 0.32, "learning_rate": 0.0015808773366166556, "loss": 2.5059, "step": 12043 }, { "epoch": 0.32, "learning_rate": 0.0015808064852870195, "loss": 2.7556, "step": 12044 }, { "epoch": 0.32, "learning_rate": 0.0015807356295572973, "loss": 2.8479, "step": 12045 }, { "epoch": 0.32, "learning_rate": 0.001580664769428026, "loss": 2.7466, "step": 12046 }, { "epoch": 0.32, "learning_rate": 0.0015805939048997419, "loss": 2.6575, "step": 12047 }, { "epoch": 0.32, "learning_rate": 0.0015805230359729823, "loss": 2.3631, "step": 12048 }, { "epoch": 0.32, "learning_rate": 0.001580452162648284, "loss": 3.0545, "step": 12049 }, { "epoch": 0.32, "learning_rate": 0.001580381284926184, "loss": 2.7854, "step": 12050 }, { "epoch": 0.32, "learning_rate": 0.0015803104028072191, "loss": 2.4078, "step": 12051 }, { "epoch": 0.32, "learning_rate": 0.0015802395162919263, "loss": 3.2397, "step": 12052 }, { "epoch": 0.32, "learning_rate": 0.0015801686253808427, "loss": 2.8181, "step": 12053 }, { "epoch": 0.32, "learning_rate": 0.0015800977300745051, "loss": 2.432, "step": 12054 }, { "epoch": 0.32, "learning_rate": 0.001580026830373451, "loss": 2.3947, "step": 12055 }, { "epoch": 0.32, "learning_rate": 0.0015799559262782172, "loss": 2.2492, "step": 12056 }, { "epoch": 0.32, "learning_rate": 0.001579885017789341, "loss": 2.592, "step": 12057 }, { "epoch": 0.32, "learning_rate": 0.0015798141049073598, "loss": 2.6123, "step": 12058 }, { "epoch": 0.32, "learning_rate": 0.0015797431876328103, "loss": 2.835, "step": 12059 }, { "epoch": 0.32, "learning_rate": 0.0015796722659662304, "loss": 2.8589, "step": 12060 }, { "epoch": 0.32, "learning_rate": 0.0015796013399081569, "loss": 2.6282, "step": 12061 }, { "epoch": 0.32, "learning_rate": 0.0015795304094591272, "loss": 2.7629, "step": 12062 }, { "epoch": 0.32, "learning_rate": 0.001579459474619679, "loss": 2.632, "step": 12063 }, { "epoch": 0.32, "learning_rate": 0.0015793885353903492, "loss": 2.3843, "step": 12064 }, { "epoch": 0.32, "learning_rate": 0.0015793175917716753, "loss": 2.3562, "step": 12065 }, { "epoch": 0.32, "learning_rate": 0.0015792466437641948, "loss": 2.5704, "step": 12066 }, { "epoch": 0.32, "learning_rate": 0.001579175691368446, "loss": 2.518, "step": 12067 }, { "epoch": 0.32, "learning_rate": 0.001579104734584965, "loss": 2.5931, "step": 12068 }, { "epoch": 0.32, "learning_rate": 0.0015790337734142904, "loss": 2.4916, "step": 12069 }, { "epoch": 0.32, "learning_rate": 0.0015789628078569594, "loss": 2.3008, "step": 12070 }, { "epoch": 0.32, "learning_rate": 0.0015788918379135094, "loss": 2.4786, "step": 12071 }, { "epoch": 0.32, "learning_rate": 0.0015788208635844785, "loss": 2.8566, "step": 12072 }, { "epoch": 0.32, "learning_rate": 0.0015787498848704043, "loss": 2.4814, "step": 12073 }, { "epoch": 0.32, "learning_rate": 0.0015786789017718243, "loss": 2.8232, "step": 12074 }, { "epoch": 0.32, "learning_rate": 0.0015786079142892765, "loss": 2.6598, "step": 12075 }, { "epoch": 0.32, "learning_rate": 0.0015785369224232987, "loss": 2.5583, "step": 12076 }, { "epoch": 0.32, "learning_rate": 0.0015784659261744288, "loss": 2.3909, "step": 12077 }, { "epoch": 0.32, "learning_rate": 0.0015783949255432043, "loss": 2.6195, "step": 12078 }, { "epoch": 0.32, "learning_rate": 0.001578323920530163, "loss": 2.2511, "step": 12079 }, { "epoch": 0.32, "learning_rate": 0.0015782529111358432, "loss": 2.976, "step": 12080 }, { "epoch": 0.32, "learning_rate": 0.0015781818973607824, "loss": 1.9241, "step": 12081 }, { "epoch": 0.32, "learning_rate": 0.0015781108792055193, "loss": 2.5736, "step": 12082 }, { "epoch": 0.32, "learning_rate": 0.0015780398566705917, "loss": 2.7706, "step": 12083 }, { "epoch": 0.32, "learning_rate": 0.001577968829756537, "loss": 2.8723, "step": 12084 }, { "epoch": 0.32, "learning_rate": 0.0015778977984638942, "loss": 2.6706, "step": 12085 }, { "epoch": 0.32, "learning_rate": 0.001577826762793201, "loss": 3.2462, "step": 12086 }, { "epoch": 0.32, "learning_rate": 0.0015777557227449953, "loss": 2.694, "step": 12087 }, { "epoch": 0.32, "learning_rate": 0.0015776846783198157, "loss": 2.7623, "step": 12088 }, { "epoch": 0.32, "learning_rate": 0.0015776136295182002, "loss": 2.7165, "step": 12089 }, { "epoch": 0.32, "learning_rate": 0.001577542576340687, "loss": 2.4582, "step": 12090 }, { "epoch": 0.32, "learning_rate": 0.0015774715187878146, "loss": 2.6407, "step": 12091 }, { "epoch": 0.32, "learning_rate": 0.0015774004568601212, "loss": 2.82, "step": 12092 }, { "epoch": 0.32, "learning_rate": 0.0015773293905581452, "loss": 2.5709, "step": 12093 }, { "epoch": 0.33, "learning_rate": 0.001577258319882425, "loss": 2.2527, "step": 12094 }, { "epoch": 0.33, "learning_rate": 0.001577187244833499, "loss": 2.7565, "step": 12095 }, { "epoch": 0.33, "learning_rate": 0.0015771161654119052, "loss": 2.3926, "step": 12096 }, { "epoch": 0.33, "learning_rate": 0.001577045081618183, "loss": 2.8694, "step": 12097 }, { "epoch": 0.33, "learning_rate": 0.0015769739934528705, "loss": 2.7102, "step": 12098 }, { "epoch": 0.33, "learning_rate": 0.001576902900916506, "loss": 2.7438, "step": 12099 }, { "epoch": 0.33, "learning_rate": 0.0015768318040096279, "loss": 2.733, "step": 12100 }, { "epoch": 0.33, "learning_rate": 0.0015767607027327756, "loss": 1.9848, "step": 12101 }, { "epoch": 0.33, "learning_rate": 0.0015766895970864873, "loss": 2.8839, "step": 12102 }, { "epoch": 0.33, "learning_rate": 0.0015766184870713016, "loss": 2.4089, "step": 12103 }, { "epoch": 0.33, "learning_rate": 0.0015765473726877574, "loss": 2.1269, "step": 12104 }, { "epoch": 0.33, "learning_rate": 0.0015764762539363932, "loss": 2.5528, "step": 12105 }, { "epoch": 0.33, "learning_rate": 0.001576405130817748, "loss": 2.6628, "step": 12106 }, { "epoch": 0.33, "learning_rate": 0.0015763340033323608, "loss": 2.4994, "step": 12107 }, { "epoch": 0.33, "learning_rate": 0.00157626287148077, "loss": 2.4029, "step": 12108 }, { "epoch": 0.33, "learning_rate": 0.001576191735263515, "loss": 2.7773, "step": 12109 }, { "epoch": 0.33, "learning_rate": 0.0015761205946811343, "loss": 2.7188, "step": 12110 }, { "epoch": 0.33, "learning_rate": 0.0015760494497341672, "loss": 2.1555, "step": 12111 }, { "epoch": 0.33, "learning_rate": 0.0015759783004231519, "loss": 2.6908, "step": 12112 }, { "epoch": 0.33, "learning_rate": 0.0015759071467486283, "loss": 2.2483, "step": 12113 }, { "epoch": 0.33, "learning_rate": 0.0015758359887111351, "loss": 2.4799, "step": 12114 }, { "epoch": 0.33, "learning_rate": 0.0015757648263112114, "loss": 2.7093, "step": 12115 }, { "epoch": 0.33, "learning_rate": 0.0015756936595493962, "loss": 2.8323, "step": 12116 }, { "epoch": 0.33, "learning_rate": 0.001575622488426229, "loss": 2.5331, "step": 12117 }, { "epoch": 0.33, "learning_rate": 0.0015755513129422484, "loss": 2.3552, "step": 12118 }, { "epoch": 0.33, "learning_rate": 0.0015754801330979944, "loss": 3.2553, "step": 12119 }, { "epoch": 0.33, "learning_rate": 0.0015754089488940056, "loss": 2.5212, "step": 12120 }, { "epoch": 0.33, "learning_rate": 0.0015753377603308213, "loss": 2.4422, "step": 12121 }, { "epoch": 0.33, "learning_rate": 0.0015752665674089812, "loss": 2.5684, "step": 12122 }, { "epoch": 0.33, "learning_rate": 0.0015751953701290242, "loss": 2.6679, "step": 12123 }, { "epoch": 0.33, "learning_rate": 0.00157512416849149, "loss": 2.4437, "step": 12124 }, { "epoch": 0.33, "learning_rate": 0.001575052962496918, "loss": 2.6933, "step": 12125 }, { "epoch": 0.33, "learning_rate": 0.0015749817521458476, "loss": 2.3835, "step": 12126 }, { "epoch": 0.33, "learning_rate": 0.0015749105374388184, "loss": 2.4845, "step": 12127 }, { "epoch": 0.33, "learning_rate": 0.0015748393183763695, "loss": 2.6174, "step": 12128 }, { "epoch": 0.33, "learning_rate": 0.0015747680949590407, "loss": 2.3146, "step": 12129 }, { "epoch": 0.33, "learning_rate": 0.0015746968671873716, "loss": 2.8204, "step": 12130 }, { "epoch": 0.33, "learning_rate": 0.001574625635061902, "loss": 2.7108, "step": 12131 }, { "epoch": 0.33, "learning_rate": 0.001574554398583171, "loss": 2.6546, "step": 12132 }, { "epoch": 0.33, "learning_rate": 0.0015744831577517186, "loss": 2.8287, "step": 12133 }, { "epoch": 0.33, "learning_rate": 0.0015744119125680846, "loss": 2.5768, "step": 12134 }, { "epoch": 0.33, "learning_rate": 0.0015743406630328086, "loss": 2.7265, "step": 12135 }, { "epoch": 0.33, "learning_rate": 0.0015742694091464304, "loss": 2.8174, "step": 12136 }, { "epoch": 0.33, "learning_rate": 0.00157419815090949, "loss": 2.772, "step": 12137 }, { "epoch": 0.33, "learning_rate": 0.001574126888322527, "loss": 2.836, "step": 12138 }, { "epoch": 0.33, "learning_rate": 0.0015740556213860812, "loss": 2.8059, "step": 12139 }, { "epoch": 0.33, "learning_rate": 0.0015739843501006926, "loss": 2.728, "step": 12140 }, { "epoch": 0.33, "learning_rate": 0.0015739130744669017, "loss": 2.9623, "step": 12141 }, { "epoch": 0.33, "learning_rate": 0.0015738417944852476, "loss": 2.8766, "step": 12142 }, { "epoch": 0.33, "learning_rate": 0.0015737705101562705, "loss": 2.5341, "step": 12143 }, { "epoch": 0.33, "learning_rate": 0.0015736992214805108, "loss": 2.5804, "step": 12144 }, { "epoch": 0.33, "learning_rate": 0.0015736279284585084, "loss": 2.4737, "step": 12145 }, { "epoch": 0.33, "learning_rate": 0.0015735566310908031, "loss": 2.4605, "step": 12146 }, { "epoch": 0.33, "learning_rate": 0.0015734853293779354, "loss": 2.7379, "step": 12147 }, { "epoch": 0.33, "learning_rate": 0.0015734140233204456, "loss": 2.6735, "step": 12148 }, { "epoch": 0.33, "learning_rate": 0.0015733427129188736, "loss": 2.8148, "step": 12149 }, { "epoch": 0.33, "learning_rate": 0.0015732713981737596, "loss": 2.4846, "step": 12150 }, { "epoch": 0.33, "learning_rate": 0.001573200079085644, "loss": 2.8182, "step": 12151 }, { "epoch": 0.33, "learning_rate": 0.001573128755655067, "loss": 2.332, "step": 12152 }, { "epoch": 0.33, "learning_rate": 0.0015730574278825693, "loss": 2.5669, "step": 12153 }, { "epoch": 0.33, "learning_rate": 0.0015729860957686911, "loss": 2.1157, "step": 12154 }, { "epoch": 0.33, "learning_rate": 0.001572914759313972, "loss": 2.3764, "step": 12155 }, { "epoch": 0.33, "learning_rate": 0.0015728434185189534, "loss": 2.6984, "step": 12156 }, { "epoch": 0.33, "learning_rate": 0.0015727720733841757, "loss": 3.0122, "step": 12157 }, { "epoch": 0.33, "learning_rate": 0.0015727007239101792, "loss": 2.59, "step": 12158 }, { "epoch": 0.33, "learning_rate": 0.0015726293700975042, "loss": 2.465, "step": 12159 }, { "epoch": 0.33, "learning_rate": 0.0015725580119466914, "loss": 2.3313, "step": 12160 }, { "epoch": 0.33, "learning_rate": 0.0015724866494582818, "loss": 2.7893, "step": 12161 }, { "epoch": 0.33, "learning_rate": 0.0015724152826328153, "loss": 2.4678, "step": 12162 }, { "epoch": 0.33, "learning_rate": 0.0015723439114708332, "loss": 2.6528, "step": 12163 }, { "epoch": 0.33, "learning_rate": 0.0015722725359728759, "loss": 2.5606, "step": 12164 }, { "epoch": 0.33, "learning_rate": 0.001572201156139484, "loss": 2.6428, "step": 12165 }, { "epoch": 0.33, "learning_rate": 0.0015721297719711986, "loss": 2.5263, "step": 12166 }, { "epoch": 0.33, "learning_rate": 0.0015720583834685602, "loss": 2.6672, "step": 12167 }, { "epoch": 0.33, "learning_rate": 0.00157198699063211, "loss": 3.2208, "step": 12168 }, { "epoch": 0.33, "learning_rate": 0.0015719155934623887, "loss": 2.3372, "step": 12169 }, { "epoch": 0.33, "learning_rate": 0.0015718441919599366, "loss": 2.4885, "step": 12170 }, { "epoch": 0.33, "learning_rate": 0.0015717727861252956, "loss": 2.4623, "step": 12171 }, { "epoch": 0.33, "learning_rate": 0.0015717013759590061, "loss": 2.4493, "step": 12172 }, { "epoch": 0.33, "learning_rate": 0.0015716299614616093, "loss": 2.6442, "step": 12173 }, { "epoch": 0.33, "learning_rate": 0.0015715585426336455, "loss": 3.3018, "step": 12174 }, { "epoch": 0.33, "learning_rate": 0.0015714871194756573, "loss": 2.8477, "step": 12175 }, { "epoch": 0.33, "learning_rate": 0.001571415691988184, "loss": 2.4618, "step": 12176 }, { "epoch": 0.33, "learning_rate": 0.0015713442601717682, "loss": 2.8473, "step": 12177 }, { "epoch": 0.33, "learning_rate": 0.0015712728240269503, "loss": 2.672, "step": 12178 }, { "epoch": 0.33, "learning_rate": 0.0015712013835542714, "loss": 2.1115, "step": 12179 }, { "epoch": 0.33, "learning_rate": 0.001571129938754273, "loss": 2.5467, "step": 12180 }, { "epoch": 0.33, "learning_rate": 0.0015710584896274965, "loss": 2.7661, "step": 12181 }, { "epoch": 0.33, "learning_rate": 0.0015709870361744827, "loss": 2.8624, "step": 12182 }, { "epoch": 0.33, "learning_rate": 0.0015709155783957733, "loss": 2.4312, "step": 12183 }, { "epoch": 0.33, "learning_rate": 0.0015708441162919095, "loss": 2.648, "step": 12184 }, { "epoch": 0.33, "learning_rate": 0.001570772649863433, "loss": 2.2069, "step": 12185 }, { "epoch": 0.33, "learning_rate": 0.0015707011791108844, "loss": 2.5628, "step": 12186 }, { "epoch": 0.33, "learning_rate": 0.0015706297040348064, "loss": 2.4284, "step": 12187 }, { "epoch": 0.33, "learning_rate": 0.0015705582246357394, "loss": 2.8055, "step": 12188 }, { "epoch": 0.33, "learning_rate": 0.0015704867409142254, "loss": 2.6291, "step": 12189 }, { "epoch": 0.33, "learning_rate": 0.0015704152528708056, "loss": 2.3281, "step": 12190 }, { "epoch": 0.33, "learning_rate": 0.001570343760506022, "loss": 2.7676, "step": 12191 }, { "epoch": 0.33, "learning_rate": 0.0015702722638204162, "loss": 2.5921, "step": 12192 }, { "epoch": 0.33, "learning_rate": 0.0015702007628145293, "loss": 2.8778, "step": 12193 }, { "epoch": 0.33, "learning_rate": 0.0015701292574889036, "loss": 2.2808, "step": 12194 }, { "epoch": 0.33, "learning_rate": 0.0015700577478440804, "loss": 2.3792, "step": 12195 }, { "epoch": 0.33, "learning_rate": 0.001569986233880602, "loss": 2.3446, "step": 12196 }, { "epoch": 0.33, "learning_rate": 0.0015699147155990097, "loss": 3.0138, "step": 12197 }, { "epoch": 0.33, "learning_rate": 0.001569843192999845, "loss": 2.8138, "step": 12198 }, { "epoch": 0.33, "learning_rate": 0.0015697716660836504, "loss": 2.5086, "step": 12199 }, { "epoch": 0.33, "learning_rate": 0.001569700134850968, "loss": 2.565, "step": 12200 }, { "epoch": 0.33, "learning_rate": 0.0015696285993023384, "loss": 2.8235, "step": 12201 }, { "epoch": 0.33, "learning_rate": 0.0015695570594383046, "loss": 2.5409, "step": 12202 }, { "epoch": 0.33, "learning_rate": 0.0015694855152594087, "loss": 2.5838, "step": 12203 }, { "epoch": 0.33, "learning_rate": 0.001569413966766192, "loss": 2.455, "step": 12204 }, { "epoch": 0.33, "learning_rate": 0.0015693424139591975, "loss": 2.1425, "step": 12205 }, { "epoch": 0.33, "learning_rate": 0.0015692708568389657, "loss": 2.4697, "step": 12206 }, { "epoch": 0.33, "learning_rate": 0.0015691992954060404, "loss": 2.5317, "step": 12207 }, { "epoch": 0.33, "learning_rate": 0.0015691277296609627, "loss": 2.4767, "step": 12208 }, { "epoch": 0.33, "learning_rate": 0.001569056159604275, "loss": 2.7422, "step": 12209 }, { "epoch": 0.33, "learning_rate": 0.0015689845852365197, "loss": 2.4078, "step": 12210 }, { "epoch": 0.33, "learning_rate": 0.001568913006558239, "loss": 2.6749, "step": 12211 }, { "epoch": 0.33, "learning_rate": 0.001568841423569975, "loss": 2.3449, "step": 12212 }, { "epoch": 0.33, "learning_rate": 0.00156876983627227, "loss": 2.739, "step": 12213 }, { "epoch": 0.33, "learning_rate": 0.0015686982446656665, "loss": 2.4989, "step": 12214 }, { "epoch": 0.33, "learning_rate": 0.0015686266487507068, "loss": 2.2224, "step": 12215 }, { "epoch": 0.33, "learning_rate": 0.001568555048527933, "loss": 2.7093, "step": 12216 }, { "epoch": 0.33, "learning_rate": 0.001568483443997888, "loss": 3.0738, "step": 12217 }, { "epoch": 0.33, "learning_rate": 0.0015684118351611143, "loss": 2.45, "step": 12218 }, { "epoch": 0.33, "learning_rate": 0.0015683402220181537, "loss": 2.6302, "step": 12219 }, { "epoch": 0.33, "learning_rate": 0.0015682686045695499, "loss": 2.2797, "step": 12220 }, { "epoch": 0.33, "learning_rate": 0.0015681969828158437, "loss": 2.7863, "step": 12221 }, { "epoch": 0.33, "learning_rate": 0.0015681253567575797, "loss": 2.4128, "step": 12222 }, { "epoch": 0.33, "learning_rate": 0.001568053726395299, "loss": 2.7436, "step": 12223 }, { "epoch": 0.33, "learning_rate": 0.001567982091729545, "loss": 2.5484, "step": 12224 }, { "epoch": 0.33, "learning_rate": 0.0015679104527608603, "loss": 2.8679, "step": 12225 }, { "epoch": 0.33, "learning_rate": 0.0015678388094897873, "loss": 2.5995, "step": 12226 }, { "epoch": 0.33, "learning_rate": 0.0015677671619168693, "loss": 2.3333, "step": 12227 }, { "epoch": 0.33, "learning_rate": 0.0015676955100426486, "loss": 1.8624, "step": 12228 }, { "epoch": 0.33, "learning_rate": 0.0015676238538676684, "loss": 2.5353, "step": 12229 }, { "epoch": 0.33, "learning_rate": 0.0015675521933924711, "loss": 2.9089, "step": 12230 }, { "epoch": 0.33, "learning_rate": 0.0015674805286176002, "loss": 2.2868, "step": 12231 }, { "epoch": 0.33, "learning_rate": 0.001567408859543598, "loss": 2.8272, "step": 12232 }, { "epoch": 0.33, "learning_rate": 0.0015673371861710077, "loss": 2.7564, "step": 12233 }, { "epoch": 0.33, "learning_rate": 0.0015672655085003724, "loss": 2.3749, "step": 12234 }, { "epoch": 0.33, "learning_rate": 0.0015671938265322352, "loss": 2.834, "step": 12235 }, { "epoch": 0.33, "learning_rate": 0.0015671221402671388, "loss": 2.7055, "step": 12236 }, { "epoch": 0.33, "learning_rate": 0.0015670504497056262, "loss": 2.4361, "step": 12237 }, { "epoch": 0.33, "learning_rate": 0.0015669787548482411, "loss": 2.7824, "step": 12238 }, { "epoch": 0.33, "learning_rate": 0.001566907055695526, "loss": 2.8313, "step": 12239 }, { "epoch": 0.33, "learning_rate": 0.001566835352248025, "loss": 2.3498, "step": 12240 }, { "epoch": 0.33, "learning_rate": 0.00156676364450628, "loss": 2.5122, "step": 12241 }, { "epoch": 0.33, "learning_rate": 0.0015666919324708356, "loss": 2.5086, "step": 12242 }, { "epoch": 0.33, "learning_rate": 0.001566620216142234, "loss": 2.3605, "step": 12243 }, { "epoch": 0.33, "learning_rate": 0.001566548495521019, "loss": 2.4254, "step": 12244 }, { "epoch": 0.33, "learning_rate": 0.0015664767706077341, "loss": 2.6996, "step": 12245 }, { "epoch": 0.33, "learning_rate": 0.0015664050414029222, "loss": 2.1762, "step": 12246 }, { "epoch": 0.33, "learning_rate": 0.0015663333079071271, "loss": 2.3686, "step": 12247 }, { "epoch": 0.33, "learning_rate": 0.0015662615701208921, "loss": 2.9598, "step": 12248 }, { "epoch": 0.33, "learning_rate": 0.0015661898280447607, "loss": 2.4193, "step": 12249 }, { "epoch": 0.33, "learning_rate": 0.0015661180816792766, "loss": 2.3303, "step": 12250 }, { "epoch": 0.33, "learning_rate": 0.0015660463310249828, "loss": 2.6734, "step": 12251 }, { "epoch": 0.33, "learning_rate": 0.0015659745760824232, "loss": 2.8539, "step": 12252 }, { "epoch": 0.33, "learning_rate": 0.0015659028168521416, "loss": 2.9617, "step": 12253 }, { "epoch": 0.33, "learning_rate": 0.0015658310533346812, "loss": 2.5368, "step": 12254 }, { "epoch": 0.33, "learning_rate": 0.0015657592855305863, "loss": 2.5425, "step": 12255 }, { "epoch": 0.33, "learning_rate": 0.0015656875134403996, "loss": 2.27, "step": 12256 }, { "epoch": 0.33, "learning_rate": 0.001565615737064666, "loss": 2.5373, "step": 12257 }, { "epoch": 0.33, "learning_rate": 0.0015655439564039285, "loss": 2.6743, "step": 12258 }, { "epoch": 0.33, "learning_rate": 0.001565472171458731, "loss": 2.7327, "step": 12259 }, { "epoch": 0.33, "learning_rate": 0.0015654003822296175, "loss": 2.3754, "step": 12260 }, { "epoch": 0.33, "learning_rate": 0.0015653285887171318, "loss": 2.6289, "step": 12261 }, { "epoch": 0.33, "learning_rate": 0.0015652567909218175, "loss": 2.457, "step": 12262 }, { "epoch": 0.33, "learning_rate": 0.0015651849888442192, "loss": 2.9487, "step": 12263 }, { "epoch": 0.33, "learning_rate": 0.0015651131824848804, "loss": 2.3807, "step": 12264 }, { "epoch": 0.33, "learning_rate": 0.0015650413718443453, "loss": 2.2428, "step": 12265 }, { "epoch": 0.33, "learning_rate": 0.0015649695569231574, "loss": 2.7233, "step": 12266 }, { "epoch": 0.33, "learning_rate": 0.0015648977377218617, "loss": 2.4044, "step": 12267 }, { "epoch": 0.33, "learning_rate": 0.001564825914241001, "loss": 2.9435, "step": 12268 }, { "epoch": 0.33, "learning_rate": 0.0015647540864811207, "loss": 2.2809, "step": 12269 }, { "epoch": 0.33, "learning_rate": 0.0015646822544427641, "loss": 2.5957, "step": 12270 }, { "epoch": 0.33, "learning_rate": 0.001564610418126476, "loss": 2.4865, "step": 12271 }, { "epoch": 0.33, "learning_rate": 0.0015645385775328, "loss": 2.5632, "step": 12272 }, { "epoch": 0.33, "learning_rate": 0.001564466732662281, "loss": 2.5807, "step": 12273 }, { "epoch": 0.33, "learning_rate": 0.0015643948835154626, "loss": 2.4637, "step": 12274 }, { "epoch": 0.33, "learning_rate": 0.0015643230300928896, "loss": 2.6561, "step": 12275 }, { "epoch": 0.33, "learning_rate": 0.0015642511723951062, "loss": 2.5515, "step": 12276 }, { "epoch": 0.33, "learning_rate": 0.001564179310422657, "loss": 2.4099, "step": 12277 }, { "epoch": 0.33, "learning_rate": 0.001564107444176086, "loss": 3.0725, "step": 12278 }, { "epoch": 0.33, "learning_rate": 0.001564035573655938, "loss": 2.6045, "step": 12279 }, { "epoch": 0.33, "learning_rate": 0.0015639636988627572, "loss": 2.6076, "step": 12280 }, { "epoch": 0.33, "learning_rate": 0.0015638918197970885, "loss": 2.5358, "step": 12281 }, { "epoch": 0.33, "learning_rate": 0.0015638199364594759, "loss": 2.7035, "step": 12282 }, { "epoch": 0.33, "learning_rate": 0.001563748048850464, "loss": 2.4057, "step": 12283 }, { "epoch": 0.33, "learning_rate": 0.0015636761569705981, "loss": 2.7606, "step": 12284 }, { "epoch": 0.33, "learning_rate": 0.0015636042608204225, "loss": 2.6539, "step": 12285 }, { "epoch": 0.33, "learning_rate": 0.0015635323604004814, "loss": 2.5494, "step": 12286 }, { "epoch": 0.33, "learning_rate": 0.00156346045571132, "loss": 2.4271, "step": 12287 }, { "epoch": 0.33, "learning_rate": 0.0015633885467534832, "loss": 3.033, "step": 12288 }, { "epoch": 0.33, "learning_rate": 0.0015633166335275153, "loss": 2.3204, "step": 12289 }, { "epoch": 0.33, "learning_rate": 0.0015632447160339614, "loss": 2.4734, "step": 12290 }, { "epoch": 0.33, "learning_rate": 0.001563172794273366, "loss": 2.2039, "step": 12291 }, { "epoch": 0.33, "learning_rate": 0.0015631008682462743, "loss": 2.6354, "step": 12292 }, { "epoch": 0.33, "learning_rate": 0.0015630289379532313, "loss": 2.4624, "step": 12293 }, { "epoch": 0.33, "learning_rate": 0.0015629570033947814, "loss": 2.3864, "step": 12294 }, { "epoch": 0.33, "learning_rate": 0.00156288506457147, "loss": 2.559, "step": 12295 }, { "epoch": 0.33, "learning_rate": 0.0015628131214838422, "loss": 2.4725, "step": 12296 }, { "epoch": 0.33, "learning_rate": 0.0015627411741324427, "loss": 2.3355, "step": 12297 }, { "epoch": 0.33, "learning_rate": 0.0015626692225178165, "loss": 2.6224, "step": 12298 }, { "epoch": 0.33, "learning_rate": 0.0015625972666405091, "loss": 2.6027, "step": 12299 }, { "epoch": 0.33, "learning_rate": 0.001562525306501065, "loss": 2.1614, "step": 12300 }, { "epoch": 0.33, "learning_rate": 0.0015624533421000303, "loss": 2.4695, "step": 12301 }, { "epoch": 0.33, "learning_rate": 0.0015623813734379492, "loss": 2.434, "step": 12302 }, { "epoch": 0.33, "learning_rate": 0.0015623094005153676, "loss": 2.5381, "step": 12303 }, { "epoch": 0.33, "learning_rate": 0.0015622374233328303, "loss": 2.9054, "step": 12304 }, { "epoch": 0.33, "learning_rate": 0.001562165441890883, "loss": 2.6685, "step": 12305 }, { "epoch": 0.33, "learning_rate": 0.0015620934561900708, "loss": 2.562, "step": 12306 }, { "epoch": 0.33, "learning_rate": 0.0015620214662309389, "loss": 2.4804, "step": 12307 }, { "epoch": 0.33, "learning_rate": 0.001561949472014033, "loss": 2.4116, "step": 12308 }, { "epoch": 0.33, "learning_rate": 0.0015618774735398984, "loss": 2.3347, "step": 12309 }, { "epoch": 0.33, "learning_rate": 0.0015618054708090806, "loss": 2.4182, "step": 12310 }, { "epoch": 0.33, "learning_rate": 0.0015617334638221246, "loss": 2.6126, "step": 12311 }, { "epoch": 0.33, "learning_rate": 0.0015616614525795765, "loss": 2.81, "step": 12312 }, { "epoch": 0.33, "learning_rate": 0.0015615894370819819, "loss": 2.4025, "step": 12313 }, { "epoch": 0.33, "learning_rate": 0.001561517417329886, "loss": 2.7509, "step": 12314 }, { "epoch": 0.33, "learning_rate": 0.0015614453933238345, "loss": 2.0762, "step": 12315 }, { "epoch": 0.33, "learning_rate": 0.0015613733650643728, "loss": 3.0729, "step": 12316 }, { "epoch": 0.33, "learning_rate": 0.001561301332552047, "loss": 2.8221, "step": 12317 }, { "epoch": 0.33, "learning_rate": 0.001561229295787403, "loss": 2.5276, "step": 12318 }, { "epoch": 0.33, "learning_rate": 0.0015611572547709859, "loss": 2.6508, "step": 12319 }, { "epoch": 0.33, "learning_rate": 0.0015610852095033416, "loss": 2.6637, "step": 12320 }, { "epoch": 0.33, "learning_rate": 0.0015610131599850163, "loss": 2.503, "step": 12321 }, { "epoch": 0.33, "learning_rate": 0.0015609411062165557, "loss": 2.4516, "step": 12322 }, { "epoch": 0.33, "learning_rate": 0.0015608690481985054, "loss": 2.7489, "step": 12323 }, { "epoch": 0.33, "learning_rate": 0.0015607969859314115, "loss": 2.323, "step": 12324 }, { "epoch": 0.33, "learning_rate": 0.00156072491941582, "loss": 2.3811, "step": 12325 }, { "epoch": 0.33, "learning_rate": 0.0015606528486522765, "loss": 2.3994, "step": 12326 }, { "epoch": 0.33, "learning_rate": 0.0015605807736413274, "loss": 2.3215, "step": 12327 }, { "epoch": 0.33, "learning_rate": 0.0015605086943835187, "loss": 2.6107, "step": 12328 }, { "epoch": 0.33, "learning_rate": 0.0015604366108793962, "loss": 2.5757, "step": 12329 }, { "epoch": 0.33, "learning_rate": 0.0015603645231295061, "loss": 2.8798, "step": 12330 }, { "epoch": 0.33, "learning_rate": 0.0015602924311343947, "loss": 2.8559, "step": 12331 }, { "epoch": 0.33, "learning_rate": 0.001560220334894608, "loss": 2.2781, "step": 12332 }, { "epoch": 0.33, "learning_rate": 0.0015601482344106922, "loss": 2.8753, "step": 12333 }, { "epoch": 0.33, "learning_rate": 0.0015600761296831933, "loss": 2.2473, "step": 12334 }, { "epoch": 0.33, "learning_rate": 0.001560004020712658, "loss": 2.5524, "step": 12335 }, { "epoch": 0.33, "learning_rate": 0.0015599319074996324, "loss": 2.2533, "step": 12336 }, { "epoch": 0.33, "learning_rate": 0.0015598597900446625, "loss": 2.3033, "step": 12337 }, { "epoch": 0.33, "learning_rate": 0.001559787668348295, "loss": 2.5791, "step": 12338 }, { "epoch": 0.33, "learning_rate": 0.0015597155424110763, "loss": 2.4935, "step": 12339 }, { "epoch": 0.33, "learning_rate": 0.001559643412233553, "loss": 2.5576, "step": 12340 }, { "epoch": 0.33, "learning_rate": 0.001559571277816271, "loss": 3.0472, "step": 12341 }, { "epoch": 0.33, "learning_rate": 0.0015594991391597768, "loss": 2.4342, "step": 12342 }, { "epoch": 0.33, "learning_rate": 0.0015594269962646173, "loss": 2.5646, "step": 12343 }, { "epoch": 0.33, "learning_rate": 0.001559354849131339, "loss": 2.6934, "step": 12344 }, { "epoch": 0.33, "learning_rate": 0.0015592826977604887, "loss": 2.6361, "step": 12345 }, { "epoch": 0.33, "learning_rate": 0.001559210542152612, "loss": 2.1667, "step": 12346 }, { "epoch": 0.33, "learning_rate": 0.0015591383823082565, "loss": 1.9914, "step": 12347 }, { "epoch": 0.33, "learning_rate": 0.0015590662182279687, "loss": 2.6528, "step": 12348 }, { "epoch": 0.33, "learning_rate": 0.001558994049912295, "loss": 2.2824, "step": 12349 }, { "epoch": 0.33, "learning_rate": 0.0015589218773617822, "loss": 2.1863, "step": 12350 }, { "epoch": 0.33, "learning_rate": 0.0015588497005769775, "loss": 2.2972, "step": 12351 }, { "epoch": 0.33, "learning_rate": 0.0015587775195584272, "loss": 2.4732, "step": 12352 }, { "epoch": 0.33, "learning_rate": 0.0015587053343066786, "loss": 2.4281, "step": 12353 }, { "epoch": 0.33, "learning_rate": 0.0015586331448222777, "loss": 2.6763, "step": 12354 }, { "epoch": 0.33, "learning_rate": 0.0015585609511057723, "loss": 2.2329, "step": 12355 }, { "epoch": 0.33, "learning_rate": 0.0015584887531577092, "loss": 2.4186, "step": 12356 }, { "epoch": 0.33, "learning_rate": 0.001558416550978635, "loss": 2.6094, "step": 12357 }, { "epoch": 0.33, "learning_rate": 0.0015583443445690967, "loss": 2.5807, "step": 12358 }, { "epoch": 0.33, "learning_rate": 0.0015582721339296418, "loss": 2.4982, "step": 12359 }, { "epoch": 0.33, "learning_rate": 0.0015581999190608165, "loss": 2.3186, "step": 12360 }, { "epoch": 0.33, "learning_rate": 0.0015581276999631687, "loss": 2.8037, "step": 12361 }, { "epoch": 0.33, "learning_rate": 0.0015580554766372453, "loss": 2.4618, "step": 12362 }, { "epoch": 0.33, "learning_rate": 0.0015579832490835934, "loss": 2.5256, "step": 12363 }, { "epoch": 0.33, "learning_rate": 0.00155791101730276, "loss": 2.3099, "step": 12364 }, { "epoch": 0.33, "learning_rate": 0.0015578387812952925, "loss": 2.6865, "step": 12365 }, { "epoch": 0.33, "learning_rate": 0.001557766541061738, "loss": 2.1721, "step": 12366 }, { "epoch": 0.33, "learning_rate": 0.0015576942966026444, "loss": 2.6877, "step": 12367 }, { "epoch": 0.33, "learning_rate": 0.0015576220479185583, "loss": 2.2638, "step": 12368 }, { "epoch": 0.33, "learning_rate": 0.001557549795010027, "loss": 2.6704, "step": 12369 }, { "epoch": 0.33, "learning_rate": 0.0015574775378775982, "loss": 2.5155, "step": 12370 }, { "epoch": 0.33, "learning_rate": 0.0015574052765218193, "loss": 2.8373, "step": 12371 }, { "epoch": 0.33, "learning_rate": 0.001557333010943238, "loss": 2.4101, "step": 12372 }, { "epoch": 0.33, "learning_rate": 0.001557260741142401, "loss": 2.2794, "step": 12373 }, { "epoch": 0.33, "learning_rate": 0.0015571884671198564, "loss": 2.7479, "step": 12374 }, { "epoch": 0.33, "learning_rate": 0.0015571161888761518, "loss": 2.3914, "step": 12375 }, { "epoch": 0.33, "learning_rate": 0.0015570439064118342, "loss": 2.5613, "step": 12376 }, { "epoch": 0.33, "learning_rate": 0.0015569716197274517, "loss": 2.797, "step": 12377 }, { "epoch": 0.33, "learning_rate": 0.0015568993288235518, "loss": 2.3119, "step": 12378 }, { "epoch": 0.33, "learning_rate": 0.001556827033700682, "loss": 2.522, "step": 12379 }, { "epoch": 0.33, "learning_rate": 0.0015567547343593904, "loss": 2.1196, "step": 12380 }, { "epoch": 0.33, "learning_rate": 0.0015566824308002243, "loss": 2.8154, "step": 12381 }, { "epoch": 0.33, "learning_rate": 0.0015566101230237318, "loss": 2.1267, "step": 12382 }, { "epoch": 0.33, "learning_rate": 0.0015565378110304604, "loss": 2.6763, "step": 12383 }, { "epoch": 0.33, "learning_rate": 0.0015564654948209582, "loss": 2.56, "step": 12384 }, { "epoch": 0.33, "learning_rate": 0.0015563931743957727, "loss": 2.8565, "step": 12385 }, { "epoch": 0.33, "learning_rate": 0.001556320849755452, "loss": 2.4722, "step": 12386 }, { "epoch": 0.33, "learning_rate": 0.0015562485209005441, "loss": 2.4731, "step": 12387 }, { "epoch": 0.33, "learning_rate": 0.0015561761878315967, "loss": 2.7062, "step": 12388 }, { "epoch": 0.33, "learning_rate": 0.001556103850549158, "loss": 2.7413, "step": 12389 }, { "epoch": 0.33, "learning_rate": 0.001556031509053776, "loss": 3.2262, "step": 12390 }, { "epoch": 0.33, "learning_rate": 0.0015559591633459986, "loss": 2.5591, "step": 12391 }, { "epoch": 0.33, "learning_rate": 0.0015558868134263742, "loss": 2.4014, "step": 12392 }, { "epoch": 0.33, "learning_rate": 0.0015558144592954504, "loss": 2.7844, "step": 12393 }, { "epoch": 0.33, "learning_rate": 0.001555742100953776, "loss": 2.2656, "step": 12394 }, { "epoch": 0.33, "learning_rate": 0.0015556697384018984, "loss": 2.4741, "step": 12395 }, { "epoch": 0.33, "learning_rate": 0.0015555973716403664, "loss": 2.2429, "step": 12396 }, { "epoch": 0.33, "learning_rate": 0.001555525000669728, "loss": 2.4646, "step": 12397 }, { "epoch": 0.33, "learning_rate": 0.0015554526254905317, "loss": 2.3539, "step": 12398 }, { "epoch": 0.33, "learning_rate": 0.0015553802461033253, "loss": 2.7833, "step": 12399 }, { "epoch": 0.33, "learning_rate": 0.0015553078625086577, "loss": 2.3141, "step": 12400 }, { "epoch": 0.33, "learning_rate": 0.001555235474707077, "loss": 2.3229, "step": 12401 }, { "epoch": 0.33, "learning_rate": 0.0015551630826991314, "loss": 3.0452, "step": 12402 }, { "epoch": 0.33, "learning_rate": 0.0015550906864853697, "loss": 2.3142, "step": 12403 }, { "epoch": 0.33, "learning_rate": 0.00155501828606634, "loss": 2.6931, "step": 12404 }, { "epoch": 0.33, "learning_rate": 0.0015549458814425915, "loss": 2.6873, "step": 12405 }, { "epoch": 0.33, "learning_rate": 0.0015548734726146716, "loss": 3.1543, "step": 12406 }, { "epoch": 0.33, "learning_rate": 0.0015548010595831298, "loss": 2.8398, "step": 12407 }, { "epoch": 0.33, "learning_rate": 0.0015547286423485142, "loss": 2.8955, "step": 12408 }, { "epoch": 0.33, "learning_rate": 0.0015546562209113738, "loss": 2.8836, "step": 12409 }, { "epoch": 0.33, "learning_rate": 0.0015545837952722571, "loss": 2.5617, "step": 12410 }, { "epoch": 0.33, "learning_rate": 0.0015545113654317124, "loss": 2.0008, "step": 12411 }, { "epoch": 0.33, "learning_rate": 0.0015544389313902887, "loss": 2.7144, "step": 12412 }, { "epoch": 0.33, "learning_rate": 0.001554366493148535, "loss": 2.6688, "step": 12413 }, { "epoch": 0.33, "learning_rate": 0.0015542940507070001, "loss": 2.4338, "step": 12414 }, { "epoch": 0.33, "learning_rate": 0.0015542216040662323, "loss": 2.4333, "step": 12415 }, { "epoch": 0.33, "learning_rate": 0.0015541491532267803, "loss": 2.4143, "step": 12416 }, { "epoch": 0.33, "learning_rate": 0.001554076698189194, "loss": 2.7915, "step": 12417 }, { "epoch": 0.33, "learning_rate": 0.0015540042389540214, "loss": 2.3867, "step": 12418 }, { "epoch": 0.33, "learning_rate": 0.0015539317755218118, "loss": 2.4096, "step": 12419 }, { "epoch": 0.33, "learning_rate": 0.0015538593078931143, "loss": 2.9599, "step": 12420 }, { "epoch": 0.33, "learning_rate": 0.0015537868360684772, "loss": 2.2798, "step": 12421 }, { "epoch": 0.33, "learning_rate": 0.0015537143600484506, "loss": 2.622, "step": 12422 }, { "epoch": 0.33, "learning_rate": 0.0015536418798335826, "loss": 2.5524, "step": 12423 }, { "epoch": 0.33, "learning_rate": 0.0015535693954244227, "loss": 2.8627, "step": 12424 }, { "epoch": 0.33, "learning_rate": 0.0015534969068215206, "loss": 2.6933, "step": 12425 }, { "epoch": 0.33, "learning_rate": 0.0015534244140254243, "loss": 2.67, "step": 12426 }, { "epoch": 0.33, "learning_rate": 0.0015533519170366837, "loss": 2.7621, "step": 12427 }, { "epoch": 0.33, "learning_rate": 0.0015532794158558479, "loss": 2.6349, "step": 12428 }, { "epoch": 0.33, "learning_rate": 0.0015532069104834663, "loss": 2.7681, "step": 12429 }, { "epoch": 0.33, "learning_rate": 0.001553134400920088, "loss": 2.6641, "step": 12430 }, { "epoch": 0.33, "learning_rate": 0.0015530618871662622, "loss": 2.3073, "step": 12431 }, { "epoch": 0.33, "learning_rate": 0.0015529893692225387, "loss": 2.6361, "step": 12432 }, { "epoch": 0.33, "learning_rate": 0.0015529168470894664, "loss": 2.558, "step": 12433 }, { "epoch": 0.33, "learning_rate": 0.001552844320767595, "loss": 2.7639, "step": 12434 }, { "epoch": 0.33, "learning_rate": 0.001552771790257474, "loss": 2.5655, "step": 12435 }, { "epoch": 0.33, "learning_rate": 0.0015526992555596527, "loss": 2.5683, "step": 12436 }, { "epoch": 0.33, "learning_rate": 0.0015526267166746804, "loss": 2.4193, "step": 12437 }, { "epoch": 0.33, "learning_rate": 0.0015525541736031072, "loss": 2.5594, "step": 12438 }, { "epoch": 0.33, "learning_rate": 0.0015524816263454819, "loss": 2.3509, "step": 12439 }, { "epoch": 0.33, "learning_rate": 0.001552409074902355, "loss": 2.4042, "step": 12440 }, { "epoch": 0.33, "learning_rate": 0.0015523365192742756, "loss": 2.7211, "step": 12441 }, { "epoch": 0.33, "learning_rate": 0.0015522639594617936, "loss": 2.7052, "step": 12442 }, { "epoch": 0.33, "learning_rate": 0.0015521913954654582, "loss": 2.8261, "step": 12443 }, { "epoch": 0.33, "learning_rate": 0.00155211882728582, "loss": 2.6478, "step": 12444 }, { "epoch": 0.33, "learning_rate": 0.001552046254923428, "loss": 2.6203, "step": 12445 }, { "epoch": 0.33, "learning_rate": 0.0015519736783788324, "loss": 2.7621, "step": 12446 }, { "epoch": 0.33, "learning_rate": 0.0015519010976525825, "loss": 2.4328, "step": 12447 }, { "epoch": 0.33, "learning_rate": 0.001551828512745229, "loss": 2.6305, "step": 12448 }, { "epoch": 0.33, "learning_rate": 0.0015517559236573213, "loss": 2.4364, "step": 12449 }, { "epoch": 0.33, "learning_rate": 0.0015516833303894093, "loss": 2.3773, "step": 12450 }, { "epoch": 0.33, "learning_rate": 0.0015516107329420427, "loss": 2.6359, "step": 12451 }, { "epoch": 0.33, "learning_rate": 0.0015515381313157724, "loss": 2.3358, "step": 12452 }, { "epoch": 0.33, "learning_rate": 0.0015514655255111473, "loss": 2.2922, "step": 12453 }, { "epoch": 0.33, "learning_rate": 0.0015513929155287186, "loss": 2.6059, "step": 12454 }, { "epoch": 0.33, "learning_rate": 0.0015513203013690351, "loss": 2.7934, "step": 12455 }, { "epoch": 0.33, "learning_rate": 0.0015512476830326478, "loss": 3.2901, "step": 12456 }, { "epoch": 0.33, "learning_rate": 0.0015511750605201064, "loss": 2.3975, "step": 12457 }, { "epoch": 0.33, "learning_rate": 0.0015511024338319616, "loss": 2.4907, "step": 12458 }, { "epoch": 0.33, "learning_rate": 0.0015510298029687633, "loss": 3.1751, "step": 12459 }, { "epoch": 0.33, "learning_rate": 0.0015509571679310614, "loss": 2.6052, "step": 12460 }, { "epoch": 0.33, "learning_rate": 0.0015508845287194068, "loss": 2.8112, "step": 12461 }, { "epoch": 0.33, "learning_rate": 0.0015508118853343495, "loss": 2.5056, "step": 12462 }, { "epoch": 0.33, "learning_rate": 0.0015507392377764398, "loss": 2.8811, "step": 12463 }, { "epoch": 0.33, "learning_rate": 0.001550666586046228, "loss": 2.2448, "step": 12464 }, { "epoch": 0.33, "learning_rate": 0.0015505939301442646, "loss": 2.7009, "step": 12465 }, { "epoch": 0.34, "learning_rate": 0.0015505212700711003, "loss": 2.4108, "step": 12466 }, { "epoch": 0.34, "learning_rate": 0.0015504486058272847, "loss": 2.6062, "step": 12467 }, { "epoch": 0.34, "learning_rate": 0.0015503759374133695, "loss": 2.9655, "step": 12468 }, { "epoch": 0.34, "learning_rate": 0.0015503032648299042, "loss": 2.4611, "step": 12469 }, { "epoch": 0.34, "learning_rate": 0.0015502305880774397, "loss": 2.7269, "step": 12470 }, { "epoch": 0.34, "learning_rate": 0.001550157907156527, "loss": 2.8176, "step": 12471 }, { "epoch": 0.34, "learning_rate": 0.0015500852220677159, "loss": 2.3036, "step": 12472 }, { "epoch": 0.34, "learning_rate": 0.001550012532811558, "loss": 2.3445, "step": 12473 }, { "epoch": 0.34, "learning_rate": 0.001549939839388603, "loss": 2.5446, "step": 12474 }, { "epoch": 0.34, "learning_rate": 0.0015498671417994024, "loss": 2.6015, "step": 12475 }, { "epoch": 0.34, "learning_rate": 0.0015497944400445069, "loss": 2.2842, "step": 12476 }, { "epoch": 0.34, "learning_rate": 0.0015497217341244665, "loss": 2.5659, "step": 12477 }, { "epoch": 0.34, "learning_rate": 0.0015496490240398326, "loss": 2.3778, "step": 12478 }, { "epoch": 0.34, "learning_rate": 0.0015495763097911563, "loss": 2.7993, "step": 12479 }, { "epoch": 0.34, "learning_rate": 0.0015495035913789877, "loss": 2.4349, "step": 12480 }, { "epoch": 0.34, "learning_rate": 0.0015494308688038785, "loss": 2.6833, "step": 12481 }, { "epoch": 0.34, "learning_rate": 0.0015493581420663789, "loss": 2.3599, "step": 12482 }, { "epoch": 0.34, "learning_rate": 0.0015492854111670406, "loss": 2.7025, "step": 12483 }, { "epoch": 0.34, "learning_rate": 0.0015492126761064142, "loss": 2.9021, "step": 12484 }, { "epoch": 0.34, "learning_rate": 0.0015491399368850506, "loss": 2.6981, "step": 12485 }, { "epoch": 0.34, "learning_rate": 0.0015490671935035009, "loss": 2.1729, "step": 12486 }, { "epoch": 0.34, "learning_rate": 0.0015489944459623165, "loss": 2.7092, "step": 12487 }, { "epoch": 0.34, "learning_rate": 0.0015489216942620482, "loss": 2.5395, "step": 12488 }, { "epoch": 0.34, "learning_rate": 0.0015488489384032475, "loss": 2.6712, "step": 12489 }, { "epoch": 0.34, "learning_rate": 0.0015487761783864649, "loss": 2.6454, "step": 12490 }, { "epoch": 0.34, "learning_rate": 0.0015487034142122526, "loss": 2.9291, "step": 12491 }, { "epoch": 0.34, "learning_rate": 0.0015486306458811611, "loss": 2.7577, "step": 12492 }, { "epoch": 0.34, "learning_rate": 0.001548557873393742, "loss": 2.7181, "step": 12493 }, { "epoch": 0.34, "learning_rate": 0.0015484850967505466, "loss": 2.6455, "step": 12494 }, { "epoch": 0.34, "learning_rate": 0.0015484123159521259, "loss": 2.5276, "step": 12495 }, { "epoch": 0.34, "learning_rate": 0.0015483395309990318, "loss": 2.7638, "step": 12496 }, { "epoch": 0.34, "learning_rate": 0.0015482667418918155, "loss": 2.5593, "step": 12497 }, { "epoch": 0.34, "learning_rate": 0.001548193948631028, "loss": 2.5758, "step": 12498 }, { "epoch": 0.34, "learning_rate": 0.0015481211512172214, "loss": 2.3646, "step": 12499 }, { "epoch": 0.34, "learning_rate": 0.001548048349650947, "loss": 2.3711, "step": 12500 }, { "epoch": 0.34, "learning_rate": 0.0015479755439327563, "loss": 2.5828, "step": 12501 }, { "epoch": 0.34, "learning_rate": 0.0015479027340632005, "loss": 2.2231, "step": 12502 }, { "epoch": 0.34, "learning_rate": 0.0015478299200428318, "loss": 2.5858, "step": 12503 }, { "epoch": 0.34, "learning_rate": 0.0015477571018722017, "loss": 2.6552, "step": 12504 }, { "epoch": 0.34, "learning_rate": 0.0015476842795518616, "loss": 2.6655, "step": 12505 }, { "epoch": 0.34, "learning_rate": 0.0015476114530823632, "loss": 2.4535, "step": 12506 }, { "epoch": 0.34, "learning_rate": 0.0015475386224642587, "loss": 2.8522, "step": 12507 }, { "epoch": 0.34, "learning_rate": 0.001547465787698099, "loss": 2.951, "step": 12508 }, { "epoch": 0.34, "learning_rate": 0.0015473929487844367, "loss": 2.8528, "step": 12509 }, { "epoch": 0.34, "learning_rate": 0.0015473201057238232, "loss": 2.8093, "step": 12510 }, { "epoch": 0.34, "learning_rate": 0.0015472472585168105, "loss": 2.5718, "step": 12511 }, { "epoch": 0.34, "learning_rate": 0.0015471744071639502, "loss": 2.3413, "step": 12512 }, { "epoch": 0.34, "learning_rate": 0.0015471015516657944, "loss": 2.6251, "step": 12513 }, { "epoch": 0.34, "learning_rate": 0.0015470286920228954, "loss": 2.4917, "step": 12514 }, { "epoch": 0.34, "learning_rate": 0.0015469558282358044, "loss": 2.8357, "step": 12515 }, { "epoch": 0.34, "learning_rate": 0.0015468829603050743, "loss": 2.5338, "step": 12516 }, { "epoch": 0.34, "learning_rate": 0.0015468100882312563, "loss": 2.617, "step": 12517 }, { "epoch": 0.34, "learning_rate": 0.001546737212014903, "loss": 2.3997, "step": 12518 }, { "epoch": 0.34, "learning_rate": 0.0015466643316565665, "loss": 2.5481, "step": 12519 }, { "epoch": 0.34, "learning_rate": 0.0015465914471567985, "loss": 2.785, "step": 12520 }, { "epoch": 0.34, "learning_rate": 0.0015465185585161515, "loss": 2.9042, "step": 12521 }, { "epoch": 0.34, "learning_rate": 0.0015464456657351775, "loss": 2.4112, "step": 12522 }, { "epoch": 0.34, "learning_rate": 0.0015463727688144289, "loss": 2.139, "step": 12523 }, { "epoch": 0.34, "learning_rate": 0.001546299867754458, "loss": 2.4009, "step": 12524 }, { "epoch": 0.34, "learning_rate": 0.0015462269625558167, "loss": 2.8122, "step": 12525 }, { "epoch": 0.34, "learning_rate": 0.0015461540532190577, "loss": 2.7077, "step": 12526 }, { "epoch": 0.34, "learning_rate": 0.0015460811397447335, "loss": 2.6809, "step": 12527 }, { "epoch": 0.34, "learning_rate": 0.0015460082221333959, "loss": 2.4574, "step": 12528 }, { "epoch": 0.34, "learning_rate": 0.0015459353003855977, "loss": 2.1959, "step": 12529 }, { "epoch": 0.34, "learning_rate": 0.0015458623745018914, "loss": 2.5774, "step": 12530 }, { "epoch": 0.34, "learning_rate": 0.0015457894444828291, "loss": 2.5542, "step": 12531 }, { "epoch": 0.34, "learning_rate": 0.0015457165103289637, "loss": 2.4189, "step": 12532 }, { "epoch": 0.34, "learning_rate": 0.0015456435720408474, "loss": 2.4352, "step": 12533 }, { "epoch": 0.34, "learning_rate": 0.0015455706296190334, "loss": 2.462, "step": 12534 }, { "epoch": 0.34, "learning_rate": 0.0015454976830640735, "loss": 2.5188, "step": 12535 }, { "epoch": 0.34, "learning_rate": 0.0015454247323765206, "loss": 2.5106, "step": 12536 }, { "epoch": 0.34, "learning_rate": 0.0015453517775569276, "loss": 2.1264, "step": 12537 }, { "epoch": 0.34, "learning_rate": 0.0015452788186058471, "loss": 2.792, "step": 12538 }, { "epoch": 0.34, "learning_rate": 0.0015452058555238315, "loss": 2.3606, "step": 12539 }, { "epoch": 0.34, "learning_rate": 0.0015451328883114345, "loss": 2.7549, "step": 12540 }, { "epoch": 0.34, "learning_rate": 0.0015450599169692075, "loss": 2.7023, "step": 12541 }, { "epoch": 0.34, "learning_rate": 0.001544986941497704, "loss": 2.3633, "step": 12542 }, { "epoch": 0.34, "learning_rate": 0.001544913961897477, "loss": 2.3602, "step": 12543 }, { "epoch": 0.34, "learning_rate": 0.0015448409781690794, "loss": 2.3911, "step": 12544 }, { "epoch": 0.34, "learning_rate": 0.0015447679903130638, "loss": 2.3486, "step": 12545 }, { "epoch": 0.34, "learning_rate": 0.0015446949983299835, "loss": 2.2871, "step": 12546 }, { "epoch": 0.34, "learning_rate": 0.0015446220022203915, "loss": 2.8267, "step": 12547 }, { "epoch": 0.34, "learning_rate": 0.00154454900198484, "loss": 2.4507, "step": 12548 }, { "epoch": 0.34, "learning_rate": 0.0015444759976238828, "loss": 2.5731, "step": 12549 }, { "epoch": 0.34, "learning_rate": 0.0015444029891380727, "loss": 2.2791, "step": 12550 }, { "epoch": 0.34, "learning_rate": 0.0015443299765279632, "loss": 2.7898, "step": 12551 }, { "epoch": 0.34, "learning_rate": 0.0015442569597941067, "loss": 2.682, "step": 12552 }, { "epoch": 0.34, "learning_rate": 0.0015441839389370572, "loss": 2.7703, "step": 12553 }, { "epoch": 0.34, "learning_rate": 0.001544110913957367, "loss": 2.6338, "step": 12554 }, { "epoch": 0.34, "learning_rate": 0.0015440378848555905, "loss": 2.6832, "step": 12555 }, { "epoch": 0.34, "learning_rate": 0.0015439648516322796, "loss": 2.4427, "step": 12556 }, { "epoch": 0.34, "learning_rate": 0.0015438918142879885, "loss": 2.5112, "step": 12557 }, { "epoch": 0.34, "learning_rate": 0.0015438187728232702, "loss": 2.4696, "step": 12558 }, { "epoch": 0.34, "learning_rate": 0.0015437457272386781, "loss": 2.5587, "step": 12559 }, { "epoch": 0.34, "learning_rate": 0.0015436726775347655, "loss": 2.221, "step": 12560 }, { "epoch": 0.34, "learning_rate": 0.001543599623712086, "loss": 2.7855, "step": 12561 }, { "epoch": 0.34, "learning_rate": 0.001543526565771193, "loss": 2.547, "step": 12562 }, { "epoch": 0.34, "learning_rate": 0.0015434535037126401, "loss": 2.73, "step": 12563 }, { "epoch": 0.34, "learning_rate": 0.00154338043753698, "loss": 2.47, "step": 12564 }, { "epoch": 0.34, "learning_rate": 0.0015433073672447672, "loss": 2.5052, "step": 12565 }, { "epoch": 0.34, "learning_rate": 0.001543234292836555, "loss": 2.668, "step": 12566 }, { "epoch": 0.34, "learning_rate": 0.0015431612143128968, "loss": 2.7328, "step": 12567 }, { "epoch": 0.34, "learning_rate": 0.0015430881316743465, "loss": 2.6725, "step": 12568 }, { "epoch": 0.34, "learning_rate": 0.0015430150449214572, "loss": 2.5496, "step": 12569 }, { "epoch": 0.34, "learning_rate": 0.0015429419540547835, "loss": 2.6651, "step": 12570 }, { "epoch": 0.34, "learning_rate": 0.0015428688590748787, "loss": 2.8692, "step": 12571 }, { "epoch": 0.34, "learning_rate": 0.001542795759982296, "loss": 2.2722, "step": 12572 }, { "epoch": 0.34, "learning_rate": 0.00154272265677759, "loss": 2.5452, "step": 12573 }, { "epoch": 0.34, "learning_rate": 0.001542649549461314, "loss": 2.645, "step": 12574 }, { "epoch": 0.34, "learning_rate": 0.0015425764380340222, "loss": 2.6278, "step": 12575 }, { "epoch": 0.34, "learning_rate": 0.001542503322496268, "loss": 2.5807, "step": 12576 }, { "epoch": 0.34, "learning_rate": 0.001542430202848606, "loss": 2.8849, "step": 12577 }, { "epoch": 0.34, "learning_rate": 0.0015423570790915895, "loss": 2.305, "step": 12578 }, { "epoch": 0.34, "learning_rate": 0.0015422839512257726, "loss": 2.4133, "step": 12579 }, { "epoch": 0.34, "learning_rate": 0.00154221081925171, "loss": 2.6637, "step": 12580 }, { "epoch": 0.34, "learning_rate": 0.0015421376831699547, "loss": 2.485, "step": 12581 }, { "epoch": 0.34, "learning_rate": 0.0015420645429810613, "loss": 2.4408, "step": 12582 }, { "epoch": 0.34, "learning_rate": 0.0015419913986855838, "loss": 2.6467, "step": 12583 }, { "epoch": 0.34, "learning_rate": 0.0015419182502840764, "loss": 2.8003, "step": 12584 }, { "epoch": 0.34, "learning_rate": 0.0015418450977770935, "loss": 2.4322, "step": 12585 }, { "epoch": 0.34, "learning_rate": 0.0015417719411651887, "loss": 2.6902, "step": 12586 }, { "epoch": 0.34, "learning_rate": 0.0015416987804489164, "loss": 2.7949, "step": 12587 }, { "epoch": 0.34, "learning_rate": 0.0015416256156288314, "loss": 2.5973, "step": 12588 }, { "epoch": 0.34, "learning_rate": 0.0015415524467054876, "loss": 2.2405, "step": 12589 }, { "epoch": 0.34, "learning_rate": 0.001541479273679439, "loss": 3.0078, "step": 12590 }, { "epoch": 0.34, "learning_rate": 0.0015414060965512402, "loss": 2.5043, "step": 12591 }, { "epoch": 0.34, "learning_rate": 0.0015413329153214457, "loss": 2.5396, "step": 12592 }, { "epoch": 0.34, "learning_rate": 0.00154125972999061, "loss": 2.6818, "step": 12593 }, { "epoch": 0.34, "learning_rate": 0.001541186540559287, "loss": 2.8225, "step": 12594 }, { "epoch": 0.34, "learning_rate": 0.0015411133470280317, "loss": 2.5724, "step": 12595 }, { "epoch": 0.34, "learning_rate": 0.0015410401493973981, "loss": 2.3844, "step": 12596 }, { "epoch": 0.34, "learning_rate": 0.0015409669476679415, "loss": 2.4948, "step": 12597 }, { "epoch": 0.34, "learning_rate": 0.001540893741840216, "loss": 2.9219, "step": 12598 }, { "epoch": 0.34, "learning_rate": 0.001540820531914776, "loss": 2.3192, "step": 12599 }, { "epoch": 0.34, "learning_rate": 0.0015407473178921766, "loss": 2.7948, "step": 12600 }, { "epoch": 0.34, "learning_rate": 0.001540674099772972, "loss": 2.3152, "step": 12601 }, { "epoch": 0.34, "learning_rate": 0.001540600877557717, "loss": 2.6612, "step": 12602 }, { "epoch": 0.34, "learning_rate": 0.0015405276512469666, "loss": 2.6067, "step": 12603 }, { "epoch": 0.34, "learning_rate": 0.0015404544208412752, "loss": 2.7681, "step": 12604 }, { "epoch": 0.34, "learning_rate": 0.001540381186341198, "loss": 3.0183, "step": 12605 }, { "epoch": 0.34, "learning_rate": 0.0015403079477472894, "loss": 2.6729, "step": 12606 }, { "epoch": 0.34, "learning_rate": 0.0015402347050601042, "loss": 2.801, "step": 12607 }, { "epoch": 0.34, "learning_rate": 0.0015401614582801976, "loss": 2.6677, "step": 12608 }, { "epoch": 0.34, "learning_rate": 0.0015400882074081243, "loss": 2.687, "step": 12609 }, { "epoch": 0.34, "learning_rate": 0.0015400149524444396, "loss": 2.2368, "step": 12610 }, { "epoch": 0.34, "learning_rate": 0.0015399416933896978, "loss": 2.9923, "step": 12611 }, { "epoch": 0.34, "learning_rate": 0.0015398684302444544, "loss": 2.7032, "step": 12612 }, { "epoch": 0.34, "learning_rate": 0.0015397951630092643, "loss": 3.2359, "step": 12613 }, { "epoch": 0.34, "learning_rate": 0.0015397218916846824, "loss": 2.8232, "step": 12614 }, { "epoch": 0.34, "learning_rate": 0.0015396486162712639, "loss": 2.6577, "step": 12615 }, { "epoch": 0.34, "learning_rate": 0.0015395753367695643, "loss": 2.3721, "step": 12616 }, { "epoch": 0.34, "learning_rate": 0.0015395020531801386, "loss": 2.6982, "step": 12617 }, { "epoch": 0.34, "learning_rate": 0.001539428765503541, "loss": 2.5076, "step": 12618 }, { "epoch": 0.34, "learning_rate": 0.001539355473740328, "loss": 2.3957, "step": 12619 }, { "epoch": 0.34, "learning_rate": 0.0015392821778910546, "loss": 2.3921, "step": 12620 }, { "epoch": 0.34, "learning_rate": 0.0015392088779562756, "loss": 2.542, "step": 12621 }, { "epoch": 0.34, "learning_rate": 0.0015391355739365461, "loss": 2.4672, "step": 12622 }, { "epoch": 0.34, "learning_rate": 0.0015390622658324228, "loss": 3.2529, "step": 12623 }, { "epoch": 0.34, "learning_rate": 0.0015389889536444597, "loss": 2.4389, "step": 12624 }, { "epoch": 0.34, "learning_rate": 0.0015389156373732122, "loss": 2.4684, "step": 12625 }, { "epoch": 0.34, "learning_rate": 0.0015388423170192365, "loss": 2.8032, "step": 12626 }, { "epoch": 0.34, "learning_rate": 0.0015387689925830878, "loss": 2.4004, "step": 12627 }, { "epoch": 0.34, "learning_rate": 0.0015386956640653215, "loss": 3.018, "step": 12628 }, { "epoch": 0.34, "learning_rate": 0.0015386223314664935, "loss": 2.8513, "step": 12629 }, { "epoch": 0.34, "learning_rate": 0.0015385489947871585, "loss": 2.3498, "step": 12630 }, { "epoch": 0.34, "learning_rate": 0.0015384756540278727, "loss": 3.1444, "step": 12631 }, { "epoch": 0.34, "learning_rate": 0.0015384023091891922, "loss": 2.5497, "step": 12632 }, { "epoch": 0.34, "learning_rate": 0.0015383289602716715, "loss": 2.6095, "step": 12633 }, { "epoch": 0.34, "learning_rate": 0.0015382556072758668, "loss": 3.0348, "step": 12634 }, { "epoch": 0.34, "learning_rate": 0.001538182250202334, "loss": 2.281, "step": 12635 }, { "epoch": 0.34, "learning_rate": 0.0015381088890516286, "loss": 2.3857, "step": 12636 }, { "epoch": 0.34, "learning_rate": 0.001538035523824307, "loss": 3.0187, "step": 12637 }, { "epoch": 0.34, "learning_rate": 0.0015379621545209235, "loss": 2.5521, "step": 12638 }, { "epoch": 0.34, "learning_rate": 0.0015378887811420354, "loss": 2.9685, "step": 12639 }, { "epoch": 0.34, "learning_rate": 0.0015378154036881982, "loss": 2.6639, "step": 12640 }, { "epoch": 0.34, "learning_rate": 0.0015377420221599674, "loss": 2.5342, "step": 12641 }, { "epoch": 0.34, "learning_rate": 0.0015376686365578993, "loss": 2.3734, "step": 12642 }, { "epoch": 0.34, "learning_rate": 0.0015375952468825499, "loss": 2.6332, "step": 12643 }, { "epoch": 0.34, "learning_rate": 0.0015375218531344746, "loss": 2.4795, "step": 12644 }, { "epoch": 0.34, "learning_rate": 0.0015374484553142302, "loss": 2.3569, "step": 12645 }, { "epoch": 0.34, "learning_rate": 0.0015373750534223723, "loss": 2.4735, "step": 12646 }, { "epoch": 0.34, "learning_rate": 0.001537301647459457, "loss": 2.356, "step": 12647 }, { "epoch": 0.34, "learning_rate": 0.0015372282374260405, "loss": 2.804, "step": 12648 }, { "epoch": 0.34, "learning_rate": 0.0015371548233226791, "loss": 2.6601, "step": 12649 }, { "epoch": 0.34, "learning_rate": 0.0015370814051499284, "loss": 2.4342, "step": 12650 }, { "epoch": 0.34, "learning_rate": 0.0015370079829083454, "loss": 2.426, "step": 12651 }, { "epoch": 0.34, "learning_rate": 0.0015369345565984858, "loss": 2.805, "step": 12652 }, { "epoch": 0.34, "learning_rate": 0.0015368611262209057, "loss": 2.1313, "step": 12653 }, { "epoch": 0.34, "learning_rate": 0.0015367876917761621, "loss": 2.6002, "step": 12654 }, { "epoch": 0.34, "learning_rate": 0.0015367142532648108, "loss": 2.5524, "step": 12655 }, { "epoch": 0.34, "learning_rate": 0.0015366408106874084, "loss": 2.7221, "step": 12656 }, { "epoch": 0.34, "learning_rate": 0.0015365673640445109, "loss": 2.6646, "step": 12657 }, { "epoch": 0.34, "learning_rate": 0.0015364939133366748, "loss": 2.8025, "step": 12658 }, { "epoch": 0.34, "learning_rate": 0.0015364204585644572, "loss": 2.6645, "step": 12659 }, { "epoch": 0.34, "learning_rate": 0.001536346999728414, "loss": 2.3799, "step": 12660 }, { "epoch": 0.34, "learning_rate": 0.0015362735368291017, "loss": 2.626, "step": 12661 }, { "epoch": 0.34, "learning_rate": 0.0015362000698670771, "loss": 2.8275, "step": 12662 }, { "epoch": 0.34, "learning_rate": 0.0015361265988428966, "loss": 2.5615, "step": 12663 }, { "epoch": 0.34, "learning_rate": 0.0015360531237571164, "loss": 2.8903, "step": 12664 }, { "epoch": 0.34, "learning_rate": 0.0015359796446102938, "loss": 2.7204, "step": 12665 }, { "epoch": 0.34, "learning_rate": 0.0015359061614029857, "loss": 3.0698, "step": 12666 }, { "epoch": 0.34, "learning_rate": 0.0015358326741357479, "loss": 2.573, "step": 12667 }, { "epoch": 0.34, "learning_rate": 0.0015357591828091377, "loss": 2.7057, "step": 12668 }, { "epoch": 0.34, "learning_rate": 0.0015356856874237117, "loss": 2.3153, "step": 12669 }, { "epoch": 0.34, "learning_rate": 0.0015356121879800267, "loss": 2.5646, "step": 12670 }, { "epoch": 0.34, "learning_rate": 0.0015355386844786395, "loss": 2.6137, "step": 12671 }, { "epoch": 0.34, "learning_rate": 0.001535465176920107, "loss": 2.5621, "step": 12672 }, { "epoch": 0.34, "learning_rate": 0.001535391665304986, "loss": 2.4048, "step": 12673 }, { "epoch": 0.34, "learning_rate": 0.0015353181496338335, "loss": 2.3691, "step": 12674 }, { "epoch": 0.34, "learning_rate": 0.0015352446299072065, "loss": 2.5287, "step": 12675 }, { "epoch": 0.34, "learning_rate": 0.0015351711061256617, "loss": 2.6396, "step": 12676 }, { "epoch": 0.34, "learning_rate": 0.0015350975782897564, "loss": 2.4736, "step": 12677 }, { "epoch": 0.34, "learning_rate": 0.0015350240464000473, "loss": 2.6703, "step": 12678 }, { "epoch": 0.34, "learning_rate": 0.001534950510457092, "loss": 2.5297, "step": 12679 }, { "epoch": 0.34, "learning_rate": 0.001534876970461447, "loss": 2.5334, "step": 12680 }, { "epoch": 0.34, "learning_rate": 0.00153480342641367, "loss": 2.6551, "step": 12681 }, { "epoch": 0.34, "learning_rate": 0.0015347298783143176, "loss": 2.4583, "step": 12682 }, { "epoch": 0.34, "learning_rate": 0.0015346563261639475, "loss": 2.2985, "step": 12683 }, { "epoch": 0.34, "learning_rate": 0.0015345827699631163, "loss": 2.1581, "step": 12684 }, { "epoch": 0.34, "learning_rate": 0.0015345092097123817, "loss": 2.5444, "step": 12685 }, { "epoch": 0.34, "learning_rate": 0.001534435645412301, "loss": 2.5688, "step": 12686 }, { "epoch": 0.34, "learning_rate": 0.0015343620770634314, "loss": 2.8637, "step": 12687 }, { "epoch": 0.34, "learning_rate": 0.0015342885046663302, "loss": 2.6423, "step": 12688 }, { "epoch": 0.34, "learning_rate": 0.0015342149282215546, "loss": 2.6666, "step": 12689 }, { "epoch": 0.34, "learning_rate": 0.001534141347729663, "loss": 2.3421, "step": 12690 }, { "epoch": 0.34, "learning_rate": 0.001534067763191211, "loss": 2.3496, "step": 12691 }, { "epoch": 0.34, "learning_rate": 0.0015339941746067576, "loss": 2.9088, "step": 12692 }, { "epoch": 0.34, "learning_rate": 0.0015339205819768597, "loss": 2.8259, "step": 12693 }, { "epoch": 0.34, "learning_rate": 0.0015338469853020751, "loss": 2.72, "step": 12694 }, { "epoch": 0.34, "learning_rate": 0.0015337733845829612, "loss": 2.8351, "step": 12695 }, { "epoch": 0.34, "learning_rate": 0.0015336997798200756, "loss": 2.2508, "step": 12696 }, { "epoch": 0.34, "learning_rate": 0.0015336261710139753, "loss": 2.3732, "step": 12697 }, { "epoch": 0.34, "learning_rate": 0.0015335525581652192, "loss": 2.5375, "step": 12698 }, { "epoch": 0.34, "learning_rate": 0.0015334789412743645, "loss": 2.3024, "step": 12699 }, { "epoch": 0.34, "learning_rate": 0.001533405320341968, "loss": 2.7206, "step": 12700 }, { "epoch": 0.34, "learning_rate": 0.0015333316953685884, "loss": 2.4239, "step": 12701 }, { "epoch": 0.34, "learning_rate": 0.0015332580663547834, "loss": 2.404, "step": 12702 }, { "epoch": 0.34, "learning_rate": 0.0015331844333011106, "loss": 2.5334, "step": 12703 }, { "epoch": 0.34, "learning_rate": 0.0015331107962081277, "loss": 2.7711, "step": 12704 }, { "epoch": 0.34, "learning_rate": 0.0015330371550763928, "loss": 2.5875, "step": 12705 }, { "epoch": 0.34, "learning_rate": 0.0015329635099064639, "loss": 2.9704, "step": 12706 }, { "epoch": 0.34, "learning_rate": 0.0015328898606988984, "loss": 2.9569, "step": 12707 }, { "epoch": 0.34, "learning_rate": 0.0015328162074542547, "loss": 2.584, "step": 12708 }, { "epoch": 0.34, "learning_rate": 0.0015327425501730908, "loss": 2.7779, "step": 12709 }, { "epoch": 0.34, "learning_rate": 0.0015326688888559644, "loss": 3.0454, "step": 12710 }, { "epoch": 0.34, "learning_rate": 0.0015325952235034337, "loss": 2.3881, "step": 12711 }, { "epoch": 0.34, "learning_rate": 0.001532521554116057, "loss": 2.4881, "step": 12712 }, { "epoch": 0.34, "learning_rate": 0.0015324478806943921, "loss": 2.4327, "step": 12713 }, { "epoch": 0.34, "learning_rate": 0.0015323742032389974, "loss": 2.6444, "step": 12714 }, { "epoch": 0.34, "learning_rate": 0.0015323005217504307, "loss": 2.5768, "step": 12715 }, { "epoch": 0.34, "learning_rate": 0.0015322268362292504, "loss": 2.7606, "step": 12716 }, { "epoch": 0.34, "learning_rate": 0.001532153146676015, "loss": 2.6413, "step": 12717 }, { "epoch": 0.34, "learning_rate": 0.0015320794530912824, "loss": 2.6509, "step": 12718 }, { "epoch": 0.34, "learning_rate": 0.001532005755475611, "loss": 2.3769, "step": 12719 }, { "epoch": 0.34, "learning_rate": 0.0015319320538295588, "loss": 2.6356, "step": 12720 }, { "epoch": 0.34, "learning_rate": 0.0015318583481536848, "loss": 2.5012, "step": 12721 }, { "epoch": 0.34, "learning_rate": 0.001531784638448547, "loss": 2.2888, "step": 12722 }, { "epoch": 0.34, "learning_rate": 0.0015317109247147038, "loss": 2.552, "step": 12723 }, { "epoch": 0.34, "learning_rate": 0.0015316372069527136, "loss": 2.9231, "step": 12724 }, { "epoch": 0.34, "learning_rate": 0.0015315634851631353, "loss": 2.655, "step": 12725 }, { "epoch": 0.34, "learning_rate": 0.0015314897593465269, "loss": 2.5945, "step": 12726 }, { "epoch": 0.34, "learning_rate": 0.0015314160295034466, "loss": 3.0655, "step": 12727 }, { "epoch": 0.34, "learning_rate": 0.0015313422956344542, "loss": 2.6287, "step": 12728 }, { "epoch": 0.34, "learning_rate": 0.0015312685577401073, "loss": 2.2508, "step": 12729 }, { "epoch": 0.34, "learning_rate": 0.0015311948158209649, "loss": 2.2765, "step": 12730 }, { "epoch": 0.34, "learning_rate": 0.0015311210698775854, "loss": 2.5372, "step": 12731 }, { "epoch": 0.34, "learning_rate": 0.0015310473199105275, "loss": 2.6855, "step": 12732 }, { "epoch": 0.34, "learning_rate": 0.00153097356592035, "loss": 2.2469, "step": 12733 }, { "epoch": 0.34, "learning_rate": 0.0015308998079076122, "loss": 2.5937, "step": 12734 }, { "epoch": 0.34, "learning_rate": 0.001530826045872872, "loss": 2.6132, "step": 12735 }, { "epoch": 0.34, "learning_rate": 0.0015307522798166887, "loss": 2.6769, "step": 12736 }, { "epoch": 0.34, "learning_rate": 0.0015306785097396207, "loss": 2.7803, "step": 12737 }, { "epoch": 0.34, "learning_rate": 0.0015306047356422278, "loss": 2.3561, "step": 12738 }, { "epoch": 0.34, "learning_rate": 0.001530530957525068, "loss": 2.8686, "step": 12739 }, { "epoch": 0.34, "learning_rate": 0.0015304571753887001, "loss": 2.2018, "step": 12740 }, { "epoch": 0.34, "learning_rate": 0.001530383389233684, "loss": 2.527, "step": 12741 }, { "epoch": 0.34, "learning_rate": 0.001530309599060578, "loss": 2.358, "step": 12742 }, { "epoch": 0.34, "learning_rate": 0.0015302358048699411, "loss": 2.9171, "step": 12743 }, { "epoch": 0.34, "learning_rate": 0.0015301620066623326, "loss": 2.3753, "step": 12744 }, { "epoch": 0.34, "learning_rate": 0.0015300882044383117, "loss": 2.1898, "step": 12745 }, { "epoch": 0.34, "learning_rate": 0.0015300143981984374, "loss": 2.4604, "step": 12746 }, { "epoch": 0.34, "learning_rate": 0.0015299405879432685, "loss": 2.6872, "step": 12747 }, { "epoch": 0.34, "learning_rate": 0.0015298667736733647, "loss": 2.5633, "step": 12748 }, { "epoch": 0.34, "learning_rate": 0.0015297929553892851, "loss": 2.6726, "step": 12749 }, { "epoch": 0.34, "learning_rate": 0.0015297191330915884, "loss": 2.5233, "step": 12750 }, { "epoch": 0.34, "learning_rate": 0.0015296453067808343, "loss": 2.6258, "step": 12751 }, { "epoch": 0.34, "learning_rate": 0.0015295714764575821, "loss": 2.5939, "step": 12752 }, { "epoch": 0.34, "learning_rate": 0.0015294976421223912, "loss": 2.4835, "step": 12753 }, { "epoch": 0.34, "learning_rate": 0.0015294238037758209, "loss": 2.2858, "step": 12754 }, { "epoch": 0.34, "learning_rate": 0.00152934996141843, "loss": 2.4632, "step": 12755 }, { "epoch": 0.34, "learning_rate": 0.001529276115050779, "loss": 2.92, "step": 12756 }, { "epoch": 0.34, "learning_rate": 0.0015292022646734265, "loss": 2.9423, "step": 12757 }, { "epoch": 0.34, "learning_rate": 0.0015291284102869325, "loss": 3.3089, "step": 12758 }, { "epoch": 0.34, "learning_rate": 0.001529054551891856, "loss": 2.4231, "step": 12759 }, { "epoch": 0.34, "learning_rate": 0.0015289806894887568, "loss": 2.2895, "step": 12760 }, { "epoch": 0.34, "learning_rate": 0.0015289068230781946, "loss": 2.6986, "step": 12761 }, { "epoch": 0.34, "learning_rate": 0.0015288329526607289, "loss": 2.829, "step": 12762 }, { "epoch": 0.34, "learning_rate": 0.0015287590782369189, "loss": 2.6505, "step": 12763 }, { "epoch": 0.34, "learning_rate": 0.0015286851998073253, "loss": 2.4589, "step": 12764 }, { "epoch": 0.34, "learning_rate": 0.0015286113173725068, "loss": 2.587, "step": 12765 }, { "epoch": 0.34, "learning_rate": 0.0015285374309330236, "loss": 2.4851, "step": 12766 }, { "epoch": 0.34, "learning_rate": 0.001528463540489435, "loss": 2.7658, "step": 12767 }, { "epoch": 0.34, "learning_rate": 0.0015283896460423013, "loss": 2.6528, "step": 12768 }, { "epoch": 0.34, "learning_rate": 0.0015283157475921823, "loss": 2.229, "step": 12769 }, { "epoch": 0.34, "learning_rate": 0.0015282418451396372, "loss": 2.5512, "step": 12770 }, { "epoch": 0.34, "learning_rate": 0.0015281679386852268, "loss": 2.4144, "step": 12771 }, { "epoch": 0.34, "learning_rate": 0.0015280940282295101, "loss": 2.4639, "step": 12772 }, { "epoch": 0.34, "learning_rate": 0.0015280201137730476, "loss": 2.3973, "step": 12773 }, { "epoch": 0.34, "learning_rate": 0.0015279461953163992, "loss": 2.7526, "step": 12774 }, { "epoch": 0.34, "learning_rate": 0.001527872272860125, "loss": 2.4239, "step": 12775 }, { "epoch": 0.34, "learning_rate": 0.0015277983464047843, "loss": 2.764, "step": 12776 }, { "epoch": 0.34, "learning_rate": 0.0015277244159509382, "loss": 2.5602, "step": 12777 }, { "epoch": 0.34, "learning_rate": 0.001527650481499146, "loss": 2.8335, "step": 12778 }, { "epoch": 0.34, "learning_rate": 0.0015275765430499684, "loss": 2.7596, "step": 12779 }, { "epoch": 0.34, "learning_rate": 0.001527502600603965, "loss": 2.7273, "step": 12780 }, { "epoch": 0.34, "learning_rate": 0.0015274286541616961, "loss": 2.5434, "step": 12781 }, { "epoch": 0.34, "learning_rate": 0.0015273547037237224, "loss": 2.8698, "step": 12782 }, { "epoch": 0.34, "learning_rate": 0.001527280749290603, "loss": 2.7241, "step": 12783 }, { "epoch": 0.34, "learning_rate": 0.0015272067908628996, "loss": 2.2371, "step": 12784 }, { "epoch": 0.34, "learning_rate": 0.0015271328284411716, "loss": 2.6968, "step": 12785 }, { "epoch": 0.34, "learning_rate": 0.0015270588620259799, "loss": 2.8954, "step": 12786 }, { "epoch": 0.34, "learning_rate": 0.0015269848916178836, "loss": 2.5219, "step": 12787 }, { "epoch": 0.34, "learning_rate": 0.0015269109172174446, "loss": 2.6407, "step": 12788 }, { "epoch": 0.34, "learning_rate": 0.0015268369388252228, "loss": 2.7295, "step": 12789 }, { "epoch": 0.34, "learning_rate": 0.001526762956441778, "loss": 2.3644, "step": 12790 }, { "epoch": 0.34, "learning_rate": 0.0015266889700676718, "loss": 2.5304, "step": 12791 }, { "epoch": 0.34, "learning_rate": 0.0015266149797034641, "loss": 2.7412, "step": 12792 }, { "epoch": 0.34, "learning_rate": 0.001526540985349715, "loss": 2.7133, "step": 12793 }, { "epoch": 0.34, "learning_rate": 0.0015264669870069857, "loss": 2.6655, "step": 12794 }, { "epoch": 0.34, "learning_rate": 0.0015263929846758369, "loss": 2.6535, "step": 12795 }, { "epoch": 0.34, "learning_rate": 0.0015263189783568287, "loss": 2.6806, "step": 12796 }, { "epoch": 0.34, "learning_rate": 0.001526244968050522, "loss": 2.4201, "step": 12797 }, { "epoch": 0.34, "learning_rate": 0.0015261709537574776, "loss": 2.7614, "step": 12798 }, { "epoch": 0.34, "learning_rate": 0.001526096935478256, "loss": 2.8249, "step": 12799 }, { "epoch": 0.34, "learning_rate": 0.0015260229132134184, "loss": 2.7605, "step": 12800 }, { "epoch": 0.34, "learning_rate": 0.001525948886963525, "loss": 2.0437, "step": 12801 }, { "epoch": 0.34, "learning_rate": 0.001525874856729137, "loss": 2.6081, "step": 12802 }, { "epoch": 0.34, "learning_rate": 0.0015258008225108148, "loss": 2.3821, "step": 12803 }, { "epoch": 0.34, "learning_rate": 0.00152572678430912, "loss": 2.5089, "step": 12804 }, { "epoch": 0.34, "learning_rate": 0.0015256527421246126, "loss": 2.6495, "step": 12805 }, { "epoch": 0.34, "learning_rate": 0.0015255786959578544, "loss": 2.2284, "step": 12806 }, { "epoch": 0.34, "learning_rate": 0.0015255046458094057, "loss": 2.7063, "step": 12807 }, { "epoch": 0.34, "learning_rate": 0.0015254305916798279, "loss": 2.8659, "step": 12808 }, { "epoch": 0.34, "learning_rate": 0.0015253565335696818, "loss": 2.4179, "step": 12809 }, { "epoch": 0.34, "learning_rate": 0.0015252824714795286, "loss": 2.5925, "step": 12810 }, { "epoch": 0.34, "learning_rate": 0.0015252084054099293, "loss": 2.4016, "step": 12811 }, { "epoch": 0.34, "learning_rate": 0.0015251343353614452, "loss": 2.6323, "step": 12812 }, { "epoch": 0.34, "learning_rate": 0.0015250602613346366, "loss": 2.3248, "step": 12813 }, { "epoch": 0.34, "learning_rate": 0.001524986183330066, "loss": 2.466, "step": 12814 }, { "epoch": 0.34, "learning_rate": 0.001524912101348294, "loss": 2.3122, "step": 12815 }, { "epoch": 0.34, "learning_rate": 0.0015248380153898814, "loss": 2.2461, "step": 12816 }, { "epoch": 0.34, "learning_rate": 0.0015247639254553898, "loss": 2.4967, "step": 12817 }, { "epoch": 0.34, "learning_rate": 0.0015246898315453806, "loss": 2.6739, "step": 12818 }, { "epoch": 0.34, "learning_rate": 0.001524615733660415, "loss": 2.5485, "step": 12819 }, { "epoch": 0.34, "learning_rate": 0.0015245416318010547, "loss": 2.7162, "step": 12820 }, { "epoch": 0.34, "learning_rate": 0.0015244675259678605, "loss": 2.9229, "step": 12821 }, { "epoch": 0.34, "learning_rate": 0.0015243934161613942, "loss": 2.8114, "step": 12822 }, { "epoch": 0.34, "learning_rate": 0.0015243193023822168, "loss": 2.3942, "step": 12823 }, { "epoch": 0.34, "learning_rate": 0.0015242451846308907, "loss": 2.74, "step": 12824 }, { "epoch": 0.34, "learning_rate": 0.0015241710629079763, "loss": 2.3158, "step": 12825 }, { "epoch": 0.34, "learning_rate": 0.001524096937214036, "loss": 2.6195, "step": 12826 }, { "epoch": 0.34, "learning_rate": 0.0015240228075496308, "loss": 2.6343, "step": 12827 }, { "epoch": 0.34, "learning_rate": 0.0015239486739153226, "loss": 2.6992, "step": 12828 }, { "epoch": 0.34, "learning_rate": 0.0015238745363116725, "loss": 2.2463, "step": 12829 }, { "epoch": 0.34, "learning_rate": 0.001523800394739243, "loss": 2.6714, "step": 12830 }, { "epoch": 0.34, "learning_rate": 0.0015237262491985956, "loss": 2.5119, "step": 12831 }, { "epoch": 0.34, "learning_rate": 0.0015236520996902913, "loss": 2.3761, "step": 12832 }, { "epoch": 0.34, "learning_rate": 0.0015235779462148922, "loss": 3.0361, "step": 12833 }, { "epoch": 0.34, "learning_rate": 0.0015235037887729606, "loss": 3.1931, "step": 12834 }, { "epoch": 0.34, "learning_rate": 0.0015234296273650579, "loss": 2.3974, "step": 12835 }, { "epoch": 0.34, "learning_rate": 0.0015233554619917457, "loss": 2.7226, "step": 12836 }, { "epoch": 0.34, "learning_rate": 0.001523281292653586, "loss": 2.6665, "step": 12837 }, { "epoch": 0.35, "learning_rate": 0.0015232071193511411, "loss": 2.8241, "step": 12838 }, { "epoch": 0.35, "learning_rate": 0.0015231329420849723, "loss": 2.4498, "step": 12839 }, { "epoch": 0.35, "learning_rate": 0.0015230587608556418, "loss": 2.2765, "step": 12840 }, { "epoch": 0.35, "learning_rate": 0.001522984575663712, "loss": 2.855, "step": 12841 }, { "epoch": 0.35, "learning_rate": 0.0015229103865097443, "loss": 2.9475, "step": 12842 }, { "epoch": 0.35, "learning_rate": 0.0015228361933943013, "loss": 2.664, "step": 12843 }, { "epoch": 0.35, "learning_rate": 0.0015227619963179445, "loss": 2.4882, "step": 12844 }, { "epoch": 0.35, "learning_rate": 0.0015226877952812363, "loss": 2.5078, "step": 12845 }, { "epoch": 0.35, "learning_rate": 0.001522613590284739, "loss": 2.6874, "step": 12846 }, { "epoch": 0.35, "learning_rate": 0.0015225393813290142, "loss": 2.5297, "step": 12847 }, { "epoch": 0.35, "learning_rate": 0.0015224651684146249, "loss": 2.4147, "step": 12848 }, { "epoch": 0.35, "learning_rate": 0.0015223909515421324, "loss": 2.8178, "step": 12849 }, { "epoch": 0.35, "learning_rate": 0.0015223167307120999, "loss": 2.7242, "step": 12850 }, { "epoch": 0.35, "learning_rate": 0.0015222425059250892, "loss": 2.536, "step": 12851 }, { "epoch": 0.35, "learning_rate": 0.0015221682771816623, "loss": 2.5159, "step": 12852 }, { "epoch": 0.35, "learning_rate": 0.001522094044482382, "loss": 2.612, "step": 12853 }, { "epoch": 0.35, "learning_rate": 0.0015220198078278108, "loss": 2.4023, "step": 12854 }, { "epoch": 0.35, "learning_rate": 0.0015219455672185107, "loss": 2.8182, "step": 12855 }, { "epoch": 0.35, "learning_rate": 0.0015218713226550443, "loss": 2.8045, "step": 12856 }, { "epoch": 0.35, "learning_rate": 0.001521797074137974, "loss": 2.8053, "step": 12857 }, { "epoch": 0.35, "learning_rate": 0.0015217228216678627, "loss": 2.6892, "step": 12858 }, { "epoch": 0.35, "learning_rate": 0.0015216485652452723, "loss": 2.6671, "step": 12859 }, { "epoch": 0.35, "learning_rate": 0.0015215743048707653, "loss": 2.9904, "step": 12860 }, { "epoch": 0.35, "learning_rate": 0.0015215000405449054, "loss": 2.7051, "step": 12861 }, { "epoch": 0.35, "learning_rate": 0.0015214257722682535, "loss": 2.8945, "step": 12862 }, { "epoch": 0.35, "learning_rate": 0.0015213515000413738, "loss": 2.3609, "step": 12863 }, { "epoch": 0.35, "learning_rate": 0.0015212772238648283, "loss": 2.7311, "step": 12864 }, { "epoch": 0.35, "learning_rate": 0.0015212029437391796, "loss": 2.5663, "step": 12865 }, { "epoch": 0.35, "learning_rate": 0.0015211286596649907, "loss": 2.4304, "step": 12866 }, { "epoch": 0.35, "learning_rate": 0.0015210543716428241, "loss": 2.4696, "step": 12867 }, { "epoch": 0.35, "learning_rate": 0.001520980079673243, "loss": 2.2609, "step": 12868 }, { "epoch": 0.35, "learning_rate": 0.0015209057837568096, "loss": 2.8352, "step": 12869 }, { "epoch": 0.35, "learning_rate": 0.0015208314838940874, "loss": 2.2322, "step": 12870 }, { "epoch": 0.35, "learning_rate": 0.001520757180085639, "loss": 2.755, "step": 12871 }, { "epoch": 0.35, "learning_rate": 0.0015206828723320267, "loss": 2.7192, "step": 12872 }, { "epoch": 0.35, "learning_rate": 0.0015206085606338147, "loss": 2.657, "step": 12873 }, { "epoch": 0.35, "learning_rate": 0.0015205342449915653, "loss": 2.9799, "step": 12874 }, { "epoch": 0.35, "learning_rate": 0.0015204599254058412, "loss": 2.5452, "step": 12875 }, { "epoch": 0.35, "learning_rate": 0.001520385601877206, "loss": 2.5901, "step": 12876 }, { "epoch": 0.35, "learning_rate": 0.0015203112744062225, "loss": 2.7017, "step": 12877 }, { "epoch": 0.35, "learning_rate": 0.0015202369429934536, "loss": 2.6532, "step": 12878 }, { "epoch": 0.35, "learning_rate": 0.0015201626076394629, "loss": 2.6679, "step": 12879 }, { "epoch": 0.35, "learning_rate": 0.001520088268344813, "loss": 2.6557, "step": 12880 }, { "epoch": 0.35, "learning_rate": 0.0015200139251100677, "loss": 2.8799, "step": 12881 }, { "epoch": 0.35, "learning_rate": 0.0015199395779357896, "loss": 2.7385, "step": 12882 }, { "epoch": 0.35, "learning_rate": 0.0015198652268225423, "loss": 2.4657, "step": 12883 }, { "epoch": 0.35, "learning_rate": 0.001519790871770889, "loss": 2.7439, "step": 12884 }, { "epoch": 0.35, "learning_rate": 0.0015197165127813928, "loss": 2.6685, "step": 12885 }, { "epoch": 0.35, "learning_rate": 0.0015196421498546175, "loss": 2.3741, "step": 12886 }, { "epoch": 0.35, "learning_rate": 0.001519567782991126, "loss": 2.4181, "step": 12887 }, { "epoch": 0.35, "learning_rate": 0.0015194934121914821, "loss": 2.7329, "step": 12888 }, { "epoch": 0.35, "learning_rate": 0.001519419037456249, "loss": 2.3511, "step": 12889 }, { "epoch": 0.35, "learning_rate": 0.00151934465878599, "loss": 2.7787, "step": 12890 }, { "epoch": 0.35, "learning_rate": 0.0015192702761812685, "loss": 2.5091, "step": 12891 }, { "epoch": 0.35, "learning_rate": 0.0015191958896426483, "loss": 2.5116, "step": 12892 }, { "epoch": 0.35, "learning_rate": 0.001519121499170693, "loss": 2.8197, "step": 12893 }, { "epoch": 0.35, "learning_rate": 0.0015190471047659662, "loss": 2.6228, "step": 12894 }, { "epoch": 0.35, "learning_rate": 0.001518972706429031, "loss": 2.7443, "step": 12895 }, { "epoch": 0.35, "learning_rate": 0.0015188983041604515, "loss": 2.4981, "step": 12896 }, { "epoch": 0.35, "learning_rate": 0.001518823897960791, "loss": 2.2278, "step": 12897 }, { "epoch": 0.35, "learning_rate": 0.0015187494878306136, "loss": 2.3719, "step": 12898 }, { "epoch": 0.35, "learning_rate": 0.001518675073770483, "loss": 2.4267, "step": 12899 }, { "epoch": 0.35, "learning_rate": 0.0015186006557809627, "loss": 2.884, "step": 12900 }, { "epoch": 0.35, "learning_rate": 0.0015185262338626164, "loss": 2.5155, "step": 12901 }, { "epoch": 0.35, "learning_rate": 0.0015184518080160081, "loss": 2.4179, "step": 12902 }, { "epoch": 0.35, "learning_rate": 0.0015183773782417014, "loss": 2.2097, "step": 12903 }, { "epoch": 0.35, "learning_rate": 0.0015183029445402605, "loss": 2.7346, "step": 12904 }, { "epoch": 0.35, "learning_rate": 0.0015182285069122493, "loss": 2.6963, "step": 12905 }, { "epoch": 0.35, "learning_rate": 0.0015181540653582317, "loss": 3.0009, "step": 12906 }, { "epoch": 0.35, "learning_rate": 0.0015180796198787712, "loss": 2.4667, "step": 12907 }, { "epoch": 0.35, "learning_rate": 0.0015180051704744319, "loss": 2.7623, "step": 12908 }, { "epoch": 0.35, "learning_rate": 0.0015179307171457788, "loss": 2.7842, "step": 12909 }, { "epoch": 0.35, "learning_rate": 0.001517856259893375, "loss": 2.595, "step": 12910 }, { "epoch": 0.35, "learning_rate": 0.0015177817987177841, "loss": 2.4962, "step": 12911 }, { "epoch": 0.35, "learning_rate": 0.0015177073336195715, "loss": 2.6875, "step": 12912 }, { "epoch": 0.35, "learning_rate": 0.0015176328645993005, "loss": 2.8384, "step": 12913 }, { "epoch": 0.35, "learning_rate": 0.0015175583916575354, "loss": 2.8767, "step": 12914 }, { "epoch": 0.35, "learning_rate": 0.0015174839147948406, "loss": 2.8994, "step": 12915 }, { "epoch": 0.35, "learning_rate": 0.00151740943401178, "loss": 2.781, "step": 12916 }, { "epoch": 0.35, "learning_rate": 0.0015173349493089183, "loss": 2.8371, "step": 12917 }, { "epoch": 0.35, "learning_rate": 0.0015172604606868193, "loss": 2.628, "step": 12918 }, { "epoch": 0.35, "learning_rate": 0.0015171859681460474, "loss": 2.0932, "step": 12919 }, { "epoch": 0.35, "learning_rate": 0.0015171114716871674, "loss": 2.5142, "step": 12920 }, { "epoch": 0.35, "learning_rate": 0.001517036971310743, "loss": 2.7371, "step": 12921 }, { "epoch": 0.35, "learning_rate": 0.0015169624670173393, "loss": 2.746, "step": 12922 }, { "epoch": 0.35, "learning_rate": 0.00151688795880752, "loss": 2.4979, "step": 12923 }, { "epoch": 0.35, "learning_rate": 0.0015168134466818505, "loss": 2.8423, "step": 12924 }, { "epoch": 0.35, "learning_rate": 0.0015167389306408943, "loss": 2.4893, "step": 12925 }, { "epoch": 0.35, "learning_rate": 0.0015166644106852161, "loss": 2.5632, "step": 12926 }, { "epoch": 0.35, "learning_rate": 0.0015165898868153814, "loss": 2.4352, "step": 12927 }, { "epoch": 0.35, "learning_rate": 0.0015165153590319537, "loss": 2.7508, "step": 12928 }, { "epoch": 0.35, "learning_rate": 0.0015164408273354976, "loss": 2.5678, "step": 12929 }, { "epoch": 0.35, "learning_rate": 0.0015163662917265786, "loss": 2.5461, "step": 12930 }, { "epoch": 0.35, "learning_rate": 0.001516291752205761, "loss": 2.874, "step": 12931 }, { "epoch": 0.35, "learning_rate": 0.0015162172087736091, "loss": 2.8178, "step": 12932 }, { "epoch": 0.35, "learning_rate": 0.0015161426614306878, "loss": 2.9281, "step": 12933 }, { "epoch": 0.35, "learning_rate": 0.0015160681101775621, "loss": 2.7394, "step": 12934 }, { "epoch": 0.35, "learning_rate": 0.0015159935550147967, "loss": 2.96, "step": 12935 }, { "epoch": 0.35, "learning_rate": 0.0015159189959429566, "loss": 2.9406, "step": 12936 }, { "epoch": 0.35, "learning_rate": 0.0015158444329626062, "loss": 2.2365, "step": 12937 }, { "epoch": 0.35, "learning_rate": 0.0015157698660743105, "loss": 2.5414, "step": 12938 }, { "epoch": 0.35, "learning_rate": 0.0015156952952786347, "loss": 2.5962, "step": 12939 }, { "epoch": 0.35, "learning_rate": 0.0015156207205761433, "loss": 2.8858, "step": 12940 }, { "epoch": 0.35, "learning_rate": 0.001515546141967402, "loss": 2.6438, "step": 12941 }, { "epoch": 0.35, "learning_rate": 0.0015154715594529748, "loss": 2.6645, "step": 12942 }, { "epoch": 0.35, "learning_rate": 0.0015153969730334275, "loss": 2.6798, "step": 12943 }, { "epoch": 0.35, "learning_rate": 0.0015153223827093249, "loss": 2.4508, "step": 12944 }, { "epoch": 0.35, "learning_rate": 0.0015152477884812319, "loss": 2.3435, "step": 12945 }, { "epoch": 0.35, "learning_rate": 0.0015151731903497137, "loss": 2.2705, "step": 12946 }, { "epoch": 0.35, "learning_rate": 0.0015150985883153356, "loss": 2.5035, "step": 12947 }, { "epoch": 0.35, "learning_rate": 0.0015150239823786627, "loss": 2.3257, "step": 12948 }, { "epoch": 0.35, "learning_rate": 0.0015149493725402604, "loss": 2.2578, "step": 12949 }, { "epoch": 0.35, "learning_rate": 0.0015148747588006933, "loss": 2.6387, "step": 12950 }, { "epoch": 0.35, "learning_rate": 0.0015148001411605272, "loss": 2.6343, "step": 12951 }, { "epoch": 0.35, "learning_rate": 0.0015147255196203276, "loss": 2.6806, "step": 12952 }, { "epoch": 0.35, "learning_rate": 0.001514650894180659, "loss": 2.4976, "step": 12953 }, { "epoch": 0.35, "learning_rate": 0.0015145762648420878, "loss": 2.3726, "step": 12954 }, { "epoch": 0.35, "learning_rate": 0.0015145016316051782, "loss": 2.6029, "step": 12955 }, { "epoch": 0.35, "learning_rate": 0.0015144269944704968, "loss": 2.5085, "step": 12956 }, { "epoch": 0.35, "learning_rate": 0.0015143523534386079, "loss": 2.2266, "step": 12957 }, { "epoch": 0.35, "learning_rate": 0.001514277708510078, "loss": 2.5611, "step": 12958 }, { "epoch": 0.35, "learning_rate": 0.0015142030596854718, "loss": 2.5701, "step": 12959 }, { "epoch": 0.35, "learning_rate": 0.0015141284069653555, "loss": 2.7004, "step": 12960 }, { "epoch": 0.35, "learning_rate": 0.001514053750350294, "loss": 2.5633, "step": 12961 }, { "epoch": 0.35, "learning_rate": 0.0015139790898408532, "loss": 2.6511, "step": 12962 }, { "epoch": 0.35, "learning_rate": 0.001513904425437599, "loss": 2.5256, "step": 12963 }, { "epoch": 0.35, "learning_rate": 0.0015138297571410963, "loss": 2.6416, "step": 12964 }, { "epoch": 0.35, "learning_rate": 0.0015137550849519115, "loss": 2.6525, "step": 12965 }, { "epoch": 0.35, "learning_rate": 0.00151368040887061, "loss": 2.2589, "step": 12966 }, { "epoch": 0.35, "learning_rate": 0.0015136057288977576, "loss": 2.6823, "step": 12967 }, { "epoch": 0.35, "learning_rate": 0.00151353104503392, "loss": 2.4286, "step": 12968 }, { "epoch": 0.35, "learning_rate": 0.001513456357279663, "loss": 2.6118, "step": 12969 }, { "epoch": 0.35, "learning_rate": 0.0015133816656355524, "loss": 2.9088, "step": 12970 }, { "epoch": 0.35, "learning_rate": 0.001513306970102154, "loss": 2.3942, "step": 12971 }, { "epoch": 0.35, "learning_rate": 0.001513232270680034, "loss": 2.2688, "step": 12972 }, { "epoch": 0.35, "learning_rate": 0.001513157567369758, "loss": 2.3477, "step": 12973 }, { "epoch": 0.35, "learning_rate": 0.0015130828601718918, "loss": 2.6341, "step": 12974 }, { "epoch": 0.35, "learning_rate": 0.0015130081490870018, "loss": 2.5811, "step": 12975 }, { "epoch": 0.35, "learning_rate": 0.0015129334341156537, "loss": 2.6711, "step": 12976 }, { "epoch": 0.35, "learning_rate": 0.0015128587152584136, "loss": 2.4703, "step": 12977 }, { "epoch": 0.35, "learning_rate": 0.0015127839925158475, "loss": 2.4249, "step": 12978 }, { "epoch": 0.35, "learning_rate": 0.0015127092658885218, "loss": 2.9051, "step": 12979 }, { "epoch": 0.35, "learning_rate": 0.0015126345353770024, "loss": 2.8236, "step": 12980 }, { "epoch": 0.35, "learning_rate": 0.0015125598009818548, "loss": 2.7565, "step": 12981 }, { "epoch": 0.35, "learning_rate": 0.0015124850627036464, "loss": 2.3941, "step": 12982 }, { "epoch": 0.35, "learning_rate": 0.0015124103205429427, "loss": 2.6114, "step": 12983 }, { "epoch": 0.35, "learning_rate": 0.0015123355745003098, "loss": 2.548, "step": 12984 }, { "epoch": 0.35, "learning_rate": 0.0015122608245763142, "loss": 2.777, "step": 12985 }, { "epoch": 0.35, "learning_rate": 0.0015121860707715223, "loss": 2.7234, "step": 12986 }, { "epoch": 0.35, "learning_rate": 0.0015121113130865003, "loss": 2.6595, "step": 12987 }, { "epoch": 0.35, "learning_rate": 0.0015120365515218144, "loss": 2.5934, "step": 12988 }, { "epoch": 0.35, "learning_rate": 0.0015119617860780315, "loss": 2.2568, "step": 12989 }, { "epoch": 0.35, "learning_rate": 0.0015118870167557174, "loss": 2.5261, "step": 12990 }, { "epoch": 0.35, "learning_rate": 0.0015118122435554386, "loss": 2.192, "step": 12991 }, { "epoch": 0.35, "learning_rate": 0.001511737466477762, "loss": 2.9238, "step": 12992 }, { "epoch": 0.35, "learning_rate": 0.0015116626855232536, "loss": 2.2985, "step": 12993 }, { "epoch": 0.35, "learning_rate": 0.0015115879006924805, "loss": 2.5776, "step": 12994 }, { "epoch": 0.35, "learning_rate": 0.001511513111986009, "loss": 2.3815, "step": 12995 }, { "epoch": 0.35, "learning_rate": 0.001511438319404405, "loss": 2.7279, "step": 12996 }, { "epoch": 0.35, "learning_rate": 0.001511363522948236, "loss": 2.9515, "step": 12997 }, { "epoch": 0.35, "learning_rate": 0.0015112887226180684, "loss": 2.12, "step": 12998 }, { "epoch": 0.35, "learning_rate": 0.0015112139184144692, "loss": 2.3103, "step": 12999 }, { "epoch": 0.35, "learning_rate": 0.0015111391103380045, "loss": 2.5874, "step": 13000 }, { "epoch": 0.35, "learning_rate": 0.0015110642983892412, "loss": 2.6695, "step": 13001 }, { "epoch": 0.35, "learning_rate": 0.0015109894825687462, "loss": 2.4638, "step": 13002 }, { "epoch": 0.35, "learning_rate": 0.0015109146628770863, "loss": 2.9489, "step": 13003 }, { "epoch": 0.35, "learning_rate": 0.001510839839314828, "loss": 2.5872, "step": 13004 }, { "epoch": 0.35, "learning_rate": 0.0015107650118825386, "loss": 2.7447, "step": 13005 }, { "epoch": 0.35, "learning_rate": 0.001510690180580785, "loss": 2.7356, "step": 13006 }, { "epoch": 0.35, "learning_rate": 0.0015106153454101335, "loss": 2.8097, "step": 13007 }, { "epoch": 0.35, "learning_rate": 0.0015105405063711515, "loss": 2.6168, "step": 13008 }, { "epoch": 0.35, "learning_rate": 0.0015104656634644064, "loss": 2.6092, "step": 13009 }, { "epoch": 0.35, "learning_rate": 0.0015103908166904643, "loss": 2.6287, "step": 13010 }, { "epoch": 0.35, "learning_rate": 0.0015103159660498923, "loss": 2.4825, "step": 13011 }, { "epoch": 0.35, "learning_rate": 0.0015102411115432584, "loss": 2.6651, "step": 13012 }, { "epoch": 0.35, "learning_rate": 0.0015101662531711289, "loss": 2.7816, "step": 13013 }, { "epoch": 0.35, "learning_rate": 0.0015100913909340706, "loss": 2.8819, "step": 13014 }, { "epoch": 0.35, "learning_rate": 0.0015100165248326516, "loss": 2.4068, "step": 13015 }, { "epoch": 0.35, "learning_rate": 0.0015099416548674386, "loss": 2.4999, "step": 13016 }, { "epoch": 0.35, "learning_rate": 0.0015098667810389983, "loss": 2.5572, "step": 13017 }, { "epoch": 0.35, "learning_rate": 0.001509791903347899, "loss": 2.1623, "step": 13018 }, { "epoch": 0.35, "learning_rate": 0.0015097170217947071, "loss": 2.4202, "step": 13019 }, { "epoch": 0.35, "learning_rate": 0.0015096421363799905, "loss": 2.8115, "step": 13020 }, { "epoch": 0.35, "learning_rate": 0.0015095672471043156, "loss": 2.512, "step": 13021 }, { "epoch": 0.35, "learning_rate": 0.0015094923539682506, "loss": 3.0596, "step": 13022 }, { "epoch": 0.35, "learning_rate": 0.0015094174569723628, "loss": 2.5858, "step": 13023 }, { "epoch": 0.35, "learning_rate": 0.0015093425561172192, "loss": 2.432, "step": 13024 }, { "epoch": 0.35, "learning_rate": 0.0015092676514033877, "loss": 2.6277, "step": 13025 }, { "epoch": 0.35, "learning_rate": 0.0015091927428314354, "loss": 2.7266, "step": 13026 }, { "epoch": 0.35, "learning_rate": 0.0015091178304019297, "loss": 2.6469, "step": 13027 }, { "epoch": 0.35, "learning_rate": 0.0015090429141154384, "loss": 3.0388, "step": 13028 }, { "epoch": 0.35, "learning_rate": 0.0015089679939725294, "loss": 2.7777, "step": 13029 }, { "epoch": 0.35, "learning_rate": 0.0015088930699737695, "loss": 2.713, "step": 13030 }, { "epoch": 0.35, "learning_rate": 0.0015088181421197265, "loss": 2.7249, "step": 13031 }, { "epoch": 0.35, "learning_rate": 0.0015087432104109687, "loss": 2.3263, "step": 13032 }, { "epoch": 0.35, "learning_rate": 0.001508668274848063, "loss": 2.2203, "step": 13033 }, { "epoch": 0.35, "learning_rate": 0.0015085933354315776, "loss": 2.6426, "step": 13034 }, { "epoch": 0.35, "learning_rate": 0.0015085183921620799, "loss": 2.8198, "step": 13035 }, { "epoch": 0.35, "learning_rate": 0.001508443445040138, "loss": 2.4016, "step": 13036 }, { "epoch": 0.35, "learning_rate": 0.0015083684940663188, "loss": 2.1449, "step": 13037 }, { "epoch": 0.35, "learning_rate": 0.0015082935392411914, "loss": 2.5181, "step": 13038 }, { "epoch": 0.35, "learning_rate": 0.0015082185805653228, "loss": 2.3633, "step": 13039 }, { "epoch": 0.35, "learning_rate": 0.0015081436180392812, "loss": 2.6709, "step": 13040 }, { "epoch": 0.35, "learning_rate": 0.001508068651663634, "loss": 3.0334, "step": 13041 }, { "epoch": 0.35, "learning_rate": 0.0015079936814389502, "loss": 2.9363, "step": 13042 }, { "epoch": 0.35, "learning_rate": 0.0015079187073657968, "loss": 2.5219, "step": 13043 }, { "epoch": 0.35, "learning_rate": 0.0015078437294447418, "loss": 2.5046, "step": 13044 }, { "epoch": 0.35, "learning_rate": 0.0015077687476763538, "loss": 2.5264, "step": 13045 }, { "epoch": 0.35, "learning_rate": 0.0015076937620612007, "loss": 2.486, "step": 13046 }, { "epoch": 0.35, "learning_rate": 0.0015076187725998498, "loss": 1.9793, "step": 13047 }, { "epoch": 0.35, "learning_rate": 0.0015075437792928703, "loss": 2.7812, "step": 13048 }, { "epoch": 0.35, "learning_rate": 0.0015074687821408298, "loss": 2.6363, "step": 13049 }, { "epoch": 0.35, "learning_rate": 0.0015073937811442967, "loss": 2.4601, "step": 13050 }, { "epoch": 0.35, "learning_rate": 0.0015073187763038388, "loss": 2.3874, "step": 13051 }, { "epoch": 0.35, "learning_rate": 0.0015072437676200245, "loss": 2.7924, "step": 13052 }, { "epoch": 0.35, "learning_rate": 0.0015071687550934224, "loss": 2.2829, "step": 13053 }, { "epoch": 0.35, "learning_rate": 0.0015070937387246003, "loss": 2.3782, "step": 13054 }, { "epoch": 0.35, "learning_rate": 0.0015070187185141264, "loss": 2.9657, "step": 13055 }, { "epoch": 0.35, "learning_rate": 0.0015069436944625699, "loss": 2.6307, "step": 13056 }, { "epoch": 0.35, "learning_rate": 0.0015068686665704982, "loss": 2.6749, "step": 13057 }, { "epoch": 0.35, "learning_rate": 0.0015067936348384804, "loss": 2.7588, "step": 13058 }, { "epoch": 0.35, "learning_rate": 0.0015067185992670843, "loss": 2.4144, "step": 13059 }, { "epoch": 0.35, "learning_rate": 0.0015066435598568785, "loss": 2.8814, "step": 13060 }, { "epoch": 0.35, "learning_rate": 0.0015065685166084323, "loss": 2.4343, "step": 13061 }, { "epoch": 0.35, "learning_rate": 0.0015064934695223134, "loss": 2.7604, "step": 13062 }, { "epoch": 0.35, "learning_rate": 0.0015064184185990903, "loss": 2.2154, "step": 13063 }, { "epoch": 0.35, "learning_rate": 0.0015063433638393318, "loss": 2.5871, "step": 13064 }, { "epoch": 0.35, "learning_rate": 0.0015062683052436067, "loss": 2.5747, "step": 13065 }, { "epoch": 0.35, "learning_rate": 0.0015061932428124833, "loss": 2.4255, "step": 13066 }, { "epoch": 0.35, "learning_rate": 0.0015061181765465305, "loss": 2.3476, "step": 13067 }, { "epoch": 0.35, "learning_rate": 0.001506043106446317, "loss": 2.6857, "step": 13068 }, { "epoch": 0.35, "learning_rate": 0.0015059680325124113, "loss": 2.1435, "step": 13069 }, { "epoch": 0.35, "learning_rate": 0.0015058929547453817, "loss": 3.0608, "step": 13070 }, { "epoch": 0.35, "learning_rate": 0.0015058178731457983, "loss": 2.6595, "step": 13071 }, { "epoch": 0.35, "learning_rate": 0.001505742787714229, "loss": 2.693, "step": 13072 }, { "epoch": 0.35, "learning_rate": 0.0015056676984512424, "loss": 3.0387, "step": 13073 }, { "epoch": 0.35, "learning_rate": 0.001505592605357408, "loss": 3.0853, "step": 13074 }, { "epoch": 0.35, "learning_rate": 0.0015055175084332942, "loss": 2.872, "step": 13075 }, { "epoch": 0.35, "learning_rate": 0.0015054424076794701, "loss": 2.7052, "step": 13076 }, { "epoch": 0.35, "learning_rate": 0.001505367303096505, "loss": 2.5183, "step": 13077 }, { "epoch": 0.35, "learning_rate": 0.0015052921946849672, "loss": 2.212, "step": 13078 }, { "epoch": 0.35, "learning_rate": 0.0015052170824454265, "loss": 2.1854, "step": 13079 }, { "epoch": 0.35, "learning_rate": 0.0015051419663784512, "loss": 2.7053, "step": 13080 }, { "epoch": 0.35, "learning_rate": 0.0015050668464846107, "loss": 2.3208, "step": 13081 }, { "epoch": 0.35, "learning_rate": 0.0015049917227644741, "loss": 2.5228, "step": 13082 }, { "epoch": 0.35, "learning_rate": 0.0015049165952186105, "loss": 2.5577, "step": 13083 }, { "epoch": 0.35, "learning_rate": 0.001504841463847589, "loss": 2.3246, "step": 13084 }, { "epoch": 0.35, "learning_rate": 0.001504766328651979, "loss": 2.5265, "step": 13085 }, { "epoch": 0.35, "learning_rate": 0.0015046911896323494, "loss": 2.6324, "step": 13086 }, { "epoch": 0.35, "learning_rate": 0.0015046160467892694, "loss": 2.406, "step": 13087 }, { "epoch": 0.35, "learning_rate": 0.0015045409001233087, "loss": 2.2864, "step": 13088 }, { "epoch": 0.35, "learning_rate": 0.0015044657496350365, "loss": 2.6531, "step": 13089 }, { "epoch": 0.35, "learning_rate": 0.0015043905953250217, "loss": 2.621, "step": 13090 }, { "epoch": 0.35, "learning_rate": 0.0015043154371938339, "loss": 2.7654, "step": 13091 }, { "epoch": 0.35, "learning_rate": 0.0015042402752420427, "loss": 2.6441, "step": 13092 }, { "epoch": 0.35, "learning_rate": 0.0015041651094702172, "loss": 2.5315, "step": 13093 }, { "epoch": 0.35, "learning_rate": 0.0015040899398789268, "loss": 2.3816, "step": 13094 }, { "epoch": 0.35, "learning_rate": 0.0015040147664687415, "loss": 2.4542, "step": 13095 }, { "epoch": 0.35, "learning_rate": 0.00150393958924023, "loss": 2.6662, "step": 13096 }, { "epoch": 0.35, "learning_rate": 0.0015038644081939627, "loss": 2.154, "step": 13097 }, { "epoch": 0.35, "learning_rate": 0.0015037892233305086, "loss": 2.2667, "step": 13098 }, { "epoch": 0.35, "learning_rate": 0.0015037140346504372, "loss": 2.8022, "step": 13099 }, { "epoch": 0.35, "learning_rate": 0.0015036388421543186, "loss": 2.0912, "step": 13100 }, { "epoch": 0.35, "learning_rate": 0.001503563645842722, "loss": 2.4374, "step": 13101 }, { "epoch": 0.35, "learning_rate": 0.0015034884457162173, "loss": 3.0479, "step": 13102 }, { "epoch": 0.35, "learning_rate": 0.0015034132417753741, "loss": 2.5333, "step": 13103 }, { "epoch": 0.35, "learning_rate": 0.0015033380340207624, "loss": 2.4378, "step": 13104 }, { "epoch": 0.35, "learning_rate": 0.0015032628224529514, "loss": 2.7444, "step": 13105 }, { "epoch": 0.35, "learning_rate": 0.0015031876070725116, "loss": 2.1467, "step": 13106 }, { "epoch": 0.35, "learning_rate": 0.0015031123878800124, "loss": 2.2119, "step": 13107 }, { "epoch": 0.35, "learning_rate": 0.0015030371648760235, "loss": 2.7692, "step": 13108 }, { "epoch": 0.35, "learning_rate": 0.001502961938061115, "loss": 3.0026, "step": 13109 }, { "epoch": 0.35, "learning_rate": 0.0015028867074358568, "loss": 2.9172, "step": 13110 }, { "epoch": 0.35, "learning_rate": 0.0015028114730008188, "loss": 2.8751, "step": 13111 }, { "epoch": 0.35, "learning_rate": 0.0015027362347565711, "loss": 2.4664, "step": 13112 }, { "epoch": 0.35, "learning_rate": 0.0015026609927036834, "loss": 2.7103, "step": 13113 }, { "epoch": 0.35, "learning_rate": 0.001502585746842726, "loss": 2.8042, "step": 13114 }, { "epoch": 0.35, "learning_rate": 0.0015025104971742689, "loss": 2.78, "step": 13115 }, { "epoch": 0.35, "learning_rate": 0.0015024352436988817, "loss": 2.4824, "step": 13116 }, { "epoch": 0.35, "learning_rate": 0.0015023599864171352, "loss": 2.4879, "step": 13117 }, { "epoch": 0.35, "learning_rate": 0.0015022847253295995, "loss": 2.8412, "step": 13118 }, { "epoch": 0.35, "learning_rate": 0.0015022094604368443, "loss": 2.4139, "step": 13119 }, { "epoch": 0.35, "learning_rate": 0.0015021341917394403, "loss": 2.4364, "step": 13120 }, { "epoch": 0.35, "learning_rate": 0.0015020589192379567, "loss": 2.5668, "step": 13121 }, { "epoch": 0.35, "learning_rate": 0.0015019836429329653, "loss": 2.8794, "step": 13122 }, { "epoch": 0.35, "learning_rate": 0.0015019083628250351, "loss": 2.9618, "step": 13123 }, { "epoch": 0.35, "learning_rate": 0.0015018330789147369, "loss": 2.3916, "step": 13124 }, { "epoch": 0.35, "learning_rate": 0.0015017577912026412, "loss": 2.887, "step": 13125 }, { "epoch": 0.35, "learning_rate": 0.0015016824996893182, "loss": 2.3656, "step": 13126 }, { "epoch": 0.35, "learning_rate": 0.001501607204375338, "loss": 2.6753, "step": 13127 }, { "epoch": 0.35, "learning_rate": 0.0015015319052612717, "loss": 2.5459, "step": 13128 }, { "epoch": 0.35, "learning_rate": 0.001501456602347689, "loss": 2.1511, "step": 13129 }, { "epoch": 0.35, "learning_rate": 0.0015013812956351606, "loss": 2.5718, "step": 13130 }, { "epoch": 0.35, "learning_rate": 0.0015013059851242576, "loss": 2.5251, "step": 13131 }, { "epoch": 0.35, "learning_rate": 0.00150123067081555, "loss": 2.859, "step": 13132 }, { "epoch": 0.35, "learning_rate": 0.001501155352709608, "loss": 2.499, "step": 13133 }, { "epoch": 0.35, "learning_rate": 0.0015010800308070031, "loss": 2.4031, "step": 13134 }, { "epoch": 0.35, "learning_rate": 0.0015010047051083055, "loss": 2.9464, "step": 13135 }, { "epoch": 0.35, "learning_rate": 0.0015009293756140854, "loss": 2.8392, "step": 13136 }, { "epoch": 0.35, "learning_rate": 0.0015008540423249142, "loss": 2.3419, "step": 13137 }, { "epoch": 0.35, "learning_rate": 0.0015007787052413624, "loss": 2.7472, "step": 13138 }, { "epoch": 0.35, "learning_rate": 0.0015007033643640005, "loss": 2.5454, "step": 13139 }, { "epoch": 0.35, "learning_rate": 0.0015006280196933992, "loss": 2.5736, "step": 13140 }, { "epoch": 0.35, "learning_rate": 0.0015005526712301301, "loss": 2.4033, "step": 13141 }, { "epoch": 0.35, "learning_rate": 0.0015004773189747631, "loss": 2.1524, "step": 13142 }, { "epoch": 0.35, "learning_rate": 0.0015004019629278696, "loss": 2.3971, "step": 13143 }, { "epoch": 0.35, "learning_rate": 0.00150032660309002, "loss": 2.2632, "step": 13144 }, { "epoch": 0.35, "learning_rate": 0.0015002512394617857, "loss": 2.5122, "step": 13145 }, { "epoch": 0.35, "learning_rate": 0.0015001758720437372, "loss": 2.7831, "step": 13146 }, { "epoch": 0.35, "learning_rate": 0.0015001005008364464, "loss": 2.2158, "step": 13147 }, { "epoch": 0.35, "learning_rate": 0.0015000251258404829, "loss": 2.8302, "step": 13148 }, { "epoch": 0.35, "learning_rate": 0.0014999497470564184, "loss": 2.5906, "step": 13149 }, { "epoch": 0.35, "learning_rate": 0.0014998743644848245, "loss": 2.6593, "step": 13150 }, { "epoch": 0.35, "learning_rate": 0.0014997989781262717, "loss": 2.574, "step": 13151 }, { "epoch": 0.35, "learning_rate": 0.001499723587981331, "loss": 2.3619, "step": 13152 }, { "epoch": 0.35, "learning_rate": 0.0014996481940505737, "loss": 3.0532, "step": 13153 }, { "epoch": 0.35, "learning_rate": 0.0014995727963345714, "loss": 2.6014, "step": 13154 }, { "epoch": 0.35, "learning_rate": 0.0014994973948338946, "loss": 2.5563, "step": 13155 }, { "epoch": 0.35, "learning_rate": 0.0014994219895491147, "loss": 2.3613, "step": 13156 }, { "epoch": 0.35, "learning_rate": 0.0014993465804808033, "loss": 2.9505, "step": 13157 }, { "epoch": 0.35, "learning_rate": 0.0014992711676295315, "loss": 2.6048, "step": 13158 }, { "epoch": 0.35, "learning_rate": 0.0014991957509958706, "loss": 2.8606, "step": 13159 }, { "epoch": 0.35, "learning_rate": 0.0014991203305803915, "loss": 2.8229, "step": 13160 }, { "epoch": 0.35, "learning_rate": 0.0014990449063836666, "loss": 2.4484, "step": 13161 }, { "epoch": 0.35, "learning_rate": 0.0014989694784062664, "loss": 2.4178, "step": 13162 }, { "epoch": 0.35, "learning_rate": 0.0014988940466487627, "loss": 2.8185, "step": 13163 }, { "epoch": 0.35, "learning_rate": 0.001498818611111727, "loss": 2.4523, "step": 13164 }, { "epoch": 0.35, "learning_rate": 0.0014987431717957307, "loss": 2.5177, "step": 13165 }, { "epoch": 0.35, "learning_rate": 0.0014986677287013453, "loss": 2.9106, "step": 13166 }, { "epoch": 0.35, "learning_rate": 0.0014985922818291423, "loss": 2.576, "step": 13167 }, { "epoch": 0.35, "learning_rate": 0.001498516831179693, "loss": 2.9132, "step": 13168 }, { "epoch": 0.35, "learning_rate": 0.0014984413767535696, "loss": 2.4224, "step": 13169 }, { "epoch": 0.35, "learning_rate": 0.0014983659185513435, "loss": 2.4692, "step": 13170 }, { "epoch": 0.35, "learning_rate": 0.0014982904565735864, "loss": 2.3847, "step": 13171 }, { "epoch": 0.35, "learning_rate": 0.0014982149908208695, "loss": 2.5613, "step": 13172 }, { "epoch": 0.35, "learning_rate": 0.0014981395212937652, "loss": 2.2894, "step": 13173 }, { "epoch": 0.35, "learning_rate": 0.0014980640479928446, "loss": 1.7843, "step": 13174 }, { "epoch": 0.35, "learning_rate": 0.0014979885709186802, "loss": 3.1034, "step": 13175 }, { "epoch": 0.35, "learning_rate": 0.0014979130900718432, "loss": 2.4335, "step": 13176 }, { "epoch": 0.35, "learning_rate": 0.0014978376054529058, "loss": 2.5661, "step": 13177 }, { "epoch": 0.35, "learning_rate": 0.0014977621170624397, "loss": 2.549, "step": 13178 }, { "epoch": 0.35, "learning_rate": 0.0014976866249010166, "loss": 2.5554, "step": 13179 }, { "epoch": 0.35, "learning_rate": 0.0014976111289692086, "loss": 2.5159, "step": 13180 }, { "epoch": 0.35, "learning_rate": 0.001497535629267588, "loss": 2.5843, "step": 13181 }, { "epoch": 0.35, "learning_rate": 0.0014974601257967263, "loss": 2.6403, "step": 13182 }, { "epoch": 0.35, "learning_rate": 0.0014973846185571955, "loss": 2.3441, "step": 13183 }, { "epoch": 0.35, "learning_rate": 0.001497309107549568, "loss": 2.1205, "step": 13184 }, { "epoch": 0.35, "learning_rate": 0.0014972335927744154, "loss": 2.4923, "step": 13185 }, { "epoch": 0.35, "learning_rate": 0.00149715807423231, "loss": 2.0837, "step": 13186 }, { "epoch": 0.35, "learning_rate": 0.0014970825519238238, "loss": 2.5876, "step": 13187 }, { "epoch": 0.35, "learning_rate": 0.0014970070258495292, "loss": 2.3812, "step": 13188 }, { "epoch": 0.35, "learning_rate": 0.001496931496009998, "loss": 2.3942, "step": 13189 }, { "epoch": 0.35, "learning_rate": 0.0014968559624058031, "loss": 2.6454, "step": 13190 }, { "epoch": 0.35, "learning_rate": 0.0014967804250375159, "loss": 2.9111, "step": 13191 }, { "epoch": 0.35, "learning_rate": 0.001496704883905709, "loss": 2.9033, "step": 13192 }, { "epoch": 0.35, "learning_rate": 0.001496629339010955, "loss": 2.7026, "step": 13193 }, { "epoch": 0.35, "learning_rate": 0.0014965537903538259, "loss": 2.67, "step": 13194 }, { "epoch": 0.35, "learning_rate": 0.0014964782379348937, "loss": 2.6279, "step": 13195 }, { "epoch": 0.35, "learning_rate": 0.0014964026817547312, "loss": 2.4726, "step": 13196 }, { "epoch": 0.35, "learning_rate": 0.001496327121813911, "loss": 2.5354, "step": 13197 }, { "epoch": 0.35, "learning_rate": 0.0014962515581130051, "loss": 2.736, "step": 13198 }, { "epoch": 0.35, "learning_rate": 0.0014961759906525858, "loss": 2.2823, "step": 13199 }, { "epoch": 0.35, "learning_rate": 0.0014961004194332264, "loss": 2.636, "step": 13200 }, { "epoch": 0.35, "learning_rate": 0.001496024844455499, "loss": 2.293, "step": 13201 }, { "epoch": 0.35, "learning_rate": 0.0014959492657199756, "loss": 2.5987, "step": 13202 }, { "epoch": 0.35, "learning_rate": 0.0014958736832272296, "loss": 2.4203, "step": 13203 }, { "epoch": 0.35, "learning_rate": 0.001495798096977833, "loss": 2.8881, "step": 13204 }, { "epoch": 0.35, "learning_rate": 0.0014957225069723585, "loss": 2.4515, "step": 13205 }, { "epoch": 0.35, "learning_rate": 0.0014956469132113793, "loss": 2.5558, "step": 13206 }, { "epoch": 0.35, "learning_rate": 0.0014955713156954676, "loss": 2.5253, "step": 13207 }, { "epoch": 0.35, "learning_rate": 0.0014954957144251962, "loss": 2.0738, "step": 13208 }, { "epoch": 0.35, "learning_rate": 0.0014954201094011378, "loss": 2.5284, "step": 13209 }, { "epoch": 0.36, "learning_rate": 0.0014953445006238653, "loss": 2.6755, "step": 13210 }, { "epoch": 0.36, "learning_rate": 0.0014952688880939511, "loss": 2.6072, "step": 13211 }, { "epoch": 0.36, "learning_rate": 0.0014951932718119685, "loss": 2.7666, "step": 13212 }, { "epoch": 0.36, "learning_rate": 0.0014951176517784906, "loss": 2.3489, "step": 13213 }, { "epoch": 0.36, "learning_rate": 0.0014950420279940895, "loss": 2.4086, "step": 13214 }, { "epoch": 0.36, "learning_rate": 0.0014949664004593386, "loss": 2.1955, "step": 13215 }, { "epoch": 0.36, "learning_rate": 0.0014948907691748109, "loss": 2.829, "step": 13216 }, { "epoch": 0.36, "learning_rate": 0.001494815134141079, "loss": 2.458, "step": 13217 }, { "epoch": 0.36, "learning_rate": 0.001494739495358716, "loss": 2.4565, "step": 13218 }, { "epoch": 0.36, "learning_rate": 0.0014946638528282952, "loss": 2.5731, "step": 13219 }, { "epoch": 0.36, "learning_rate": 0.0014945882065503895, "loss": 2.6136, "step": 13220 }, { "epoch": 0.36, "learning_rate": 0.001494512556525572, "loss": 2.6784, "step": 13221 }, { "epoch": 0.36, "learning_rate": 0.0014944369027544155, "loss": 2.2319, "step": 13222 }, { "epoch": 0.36, "learning_rate": 0.0014943612452374938, "loss": 2.8763, "step": 13223 }, { "epoch": 0.36, "learning_rate": 0.0014942855839753797, "loss": 2.8397, "step": 13224 }, { "epoch": 0.36, "learning_rate": 0.001494209918968646, "loss": 2.7796, "step": 13225 }, { "epoch": 0.36, "learning_rate": 0.0014941342502178664, "loss": 2.7836, "step": 13226 }, { "epoch": 0.36, "learning_rate": 0.0014940585777236143, "loss": 2.8614, "step": 13227 }, { "epoch": 0.36, "learning_rate": 0.0014939829014864628, "loss": 2.3548, "step": 13228 }, { "epoch": 0.36, "learning_rate": 0.001493907221506985, "loss": 2.7021, "step": 13229 }, { "epoch": 0.36, "learning_rate": 0.0014938315377857542, "loss": 2.5886, "step": 13230 }, { "epoch": 0.36, "learning_rate": 0.0014937558503233443, "loss": 2.8871, "step": 13231 }, { "epoch": 0.36, "learning_rate": 0.001493680159120328, "loss": 2.9938, "step": 13232 }, { "epoch": 0.36, "learning_rate": 0.0014936044641772797, "loss": 2.5118, "step": 13233 }, { "epoch": 0.36, "learning_rate": 0.0014935287654947716, "loss": 2.2469, "step": 13234 }, { "epoch": 0.36, "learning_rate": 0.001493453063073378, "loss": 2.6503, "step": 13235 }, { "epoch": 0.36, "learning_rate": 0.0014933773569136724, "loss": 2.7875, "step": 13236 }, { "epoch": 0.36, "learning_rate": 0.001493301647016228, "loss": 2.7375, "step": 13237 }, { "epoch": 0.36, "learning_rate": 0.0014932259333816185, "loss": 2.0994, "step": 13238 }, { "epoch": 0.36, "learning_rate": 0.0014931502160104174, "loss": 2.5489, "step": 13239 }, { "epoch": 0.36, "learning_rate": 0.0014930744949031986, "loss": 2.4089, "step": 13240 }, { "epoch": 0.36, "learning_rate": 0.0014929987700605355, "loss": 2.6283, "step": 13241 }, { "epoch": 0.36, "learning_rate": 0.0014929230414830017, "loss": 2.2908, "step": 13242 }, { "epoch": 0.36, "learning_rate": 0.0014928473091711714, "loss": 2.7888, "step": 13243 }, { "epoch": 0.36, "learning_rate": 0.0014927715731256179, "loss": 2.8613, "step": 13244 }, { "epoch": 0.36, "learning_rate": 0.001492695833346915, "loss": 2.6274, "step": 13245 }, { "epoch": 0.36, "learning_rate": 0.0014926200898356364, "loss": 2.6628, "step": 13246 }, { "epoch": 0.36, "learning_rate": 0.0014925443425923563, "loss": 3.041, "step": 13247 }, { "epoch": 0.36, "learning_rate": 0.0014924685916176482, "loss": 2.5496, "step": 13248 }, { "epoch": 0.36, "learning_rate": 0.001492392836912086, "loss": 2.2377, "step": 13249 }, { "epoch": 0.36, "learning_rate": 0.0014923170784762441, "loss": 2.8492, "step": 13250 }, { "epoch": 0.36, "learning_rate": 0.0014922413163106958, "loss": 2.9435, "step": 13251 }, { "epoch": 0.36, "learning_rate": 0.0014921655504160152, "loss": 2.7774, "step": 13252 }, { "epoch": 0.36, "learning_rate": 0.0014920897807927762, "loss": 2.6544, "step": 13253 }, { "epoch": 0.36, "learning_rate": 0.0014920140074415533, "loss": 2.5167, "step": 13254 }, { "epoch": 0.36, "learning_rate": 0.0014919382303629203, "loss": 2.7231, "step": 13255 }, { "epoch": 0.36, "learning_rate": 0.001491862449557451, "loss": 2.6691, "step": 13256 }, { "epoch": 0.36, "learning_rate": 0.00149178666502572, "loss": 2.6664, "step": 13257 }, { "epoch": 0.36, "learning_rate": 0.0014917108767683008, "loss": 2.632, "step": 13258 }, { "epoch": 0.36, "learning_rate": 0.0014916350847857683, "loss": 2.5248, "step": 13259 }, { "epoch": 0.36, "learning_rate": 0.0014915592890786963, "loss": 2.6859, "step": 13260 }, { "epoch": 0.36, "learning_rate": 0.0014914834896476586, "loss": 2.5, "step": 13261 }, { "epoch": 0.36, "learning_rate": 0.0014914076864932298, "loss": 2.3458, "step": 13262 }, { "epoch": 0.36, "learning_rate": 0.0014913318796159847, "loss": 2.2786, "step": 13263 }, { "epoch": 0.36, "learning_rate": 0.001491256069016497, "loss": 2.6343, "step": 13264 }, { "epoch": 0.36, "learning_rate": 0.0014911802546953405, "loss": 2.8315, "step": 13265 }, { "epoch": 0.36, "learning_rate": 0.0014911044366530911, "loss": 2.4417, "step": 13266 }, { "epoch": 0.36, "learning_rate": 0.0014910286148903217, "loss": 2.7417, "step": 13267 }, { "epoch": 0.36, "learning_rate": 0.0014909527894076077, "loss": 2.5099, "step": 13268 }, { "epoch": 0.36, "learning_rate": 0.0014908769602055229, "loss": 2.179, "step": 13269 }, { "epoch": 0.36, "learning_rate": 0.001490801127284642, "loss": 2.8427, "step": 13270 }, { "epoch": 0.36, "learning_rate": 0.0014907252906455396, "loss": 2.6109, "step": 13271 }, { "epoch": 0.36, "learning_rate": 0.0014906494502887901, "loss": 2.404, "step": 13272 }, { "epoch": 0.36, "learning_rate": 0.0014905736062149682, "loss": 2.4241, "step": 13273 }, { "epoch": 0.36, "learning_rate": 0.0014904977584246483, "loss": 2.5806, "step": 13274 }, { "epoch": 0.36, "learning_rate": 0.0014904219069184048, "loss": 2.4639, "step": 13275 }, { "epoch": 0.36, "learning_rate": 0.001490346051696813, "loss": 2.4189, "step": 13276 }, { "epoch": 0.36, "learning_rate": 0.0014902701927604468, "loss": 2.8008, "step": 13277 }, { "epoch": 0.36, "learning_rate": 0.0014901943301098817, "loss": 2.7067, "step": 13278 }, { "epoch": 0.36, "learning_rate": 0.001490118463745692, "loss": 2.4432, "step": 13279 }, { "epoch": 0.36, "learning_rate": 0.001490042593668452, "loss": 2.625, "step": 13280 }, { "epoch": 0.36, "learning_rate": 0.0014899667198787373, "loss": 2.4883, "step": 13281 }, { "epoch": 0.36, "learning_rate": 0.001489890842377122, "loss": 2.1902, "step": 13282 }, { "epoch": 0.36, "learning_rate": 0.0014898149611641816, "loss": 2.8512, "step": 13283 }, { "epoch": 0.36, "learning_rate": 0.0014897390762404906, "loss": 2.6847, "step": 13284 }, { "epoch": 0.36, "learning_rate": 0.0014896631876066236, "loss": 2.5179, "step": 13285 }, { "epoch": 0.36, "learning_rate": 0.001489587295263156, "loss": 2.9308, "step": 13286 }, { "epoch": 0.36, "learning_rate": 0.0014895113992106628, "loss": 2.4331, "step": 13287 }, { "epoch": 0.36, "learning_rate": 0.0014894354994497185, "loss": 2.3142, "step": 13288 }, { "epoch": 0.36, "learning_rate": 0.0014893595959808983, "loss": 2.3724, "step": 13289 }, { "epoch": 0.36, "learning_rate": 0.0014892836888047776, "loss": 2.699, "step": 13290 }, { "epoch": 0.36, "learning_rate": 0.0014892077779219309, "loss": 2.6032, "step": 13291 }, { "epoch": 0.36, "learning_rate": 0.0014891318633329334, "loss": 2.5092, "step": 13292 }, { "epoch": 0.36, "learning_rate": 0.0014890559450383605, "loss": 2.6734, "step": 13293 }, { "epoch": 0.36, "learning_rate": 0.0014889800230387874, "loss": 2.1545, "step": 13294 }, { "epoch": 0.36, "learning_rate": 0.001488904097334789, "loss": 2.6652, "step": 13295 }, { "epoch": 0.36, "learning_rate": 0.0014888281679269401, "loss": 2.7689, "step": 13296 }, { "epoch": 0.36, "learning_rate": 0.001488752234815817, "loss": 2.7956, "step": 13297 }, { "epoch": 0.36, "learning_rate": 0.0014886762980019941, "loss": 2.3121, "step": 13298 }, { "epoch": 0.36, "learning_rate": 0.001488600357486047, "loss": 2.9148, "step": 13299 }, { "epoch": 0.36, "learning_rate": 0.0014885244132685509, "loss": 2.8377, "step": 13300 }, { "epoch": 0.36, "learning_rate": 0.0014884484653500812, "loss": 2.7769, "step": 13301 }, { "epoch": 0.36, "learning_rate": 0.0014883725137312131, "loss": 2.3875, "step": 13302 }, { "epoch": 0.36, "learning_rate": 0.0014882965584125224, "loss": 2.7934, "step": 13303 }, { "epoch": 0.36, "learning_rate": 0.0014882205993945843, "loss": 2.227, "step": 13304 }, { "epoch": 0.36, "learning_rate": 0.0014881446366779739, "loss": 2.6462, "step": 13305 }, { "epoch": 0.36, "learning_rate": 0.0014880686702632674, "loss": 2.828, "step": 13306 }, { "epoch": 0.36, "learning_rate": 0.0014879927001510396, "loss": 2.5315, "step": 13307 }, { "epoch": 0.36, "learning_rate": 0.0014879167263418664, "loss": 2.4092, "step": 13308 }, { "epoch": 0.36, "learning_rate": 0.0014878407488363235, "loss": 2.5075, "step": 13309 }, { "epoch": 0.36, "learning_rate": 0.001487764767634986, "loss": 2.5397, "step": 13310 }, { "epoch": 0.36, "learning_rate": 0.00148768878273843, "loss": 2.9005, "step": 13311 }, { "epoch": 0.36, "learning_rate": 0.0014876127941472308, "loss": 2.6292, "step": 13312 }, { "epoch": 0.36, "learning_rate": 0.0014875368018619647, "loss": 2.7656, "step": 13313 }, { "epoch": 0.36, "learning_rate": 0.0014874608058832064, "loss": 2.7111, "step": 13314 }, { "epoch": 0.36, "learning_rate": 0.0014873848062115327, "loss": 2.6958, "step": 13315 }, { "epoch": 0.36, "learning_rate": 0.0014873088028475184, "loss": 2.7763, "step": 13316 }, { "epoch": 0.36, "learning_rate": 0.0014872327957917402, "loss": 2.5983, "step": 13317 }, { "epoch": 0.36, "learning_rate": 0.001487156785044773, "loss": 2.3519, "step": 13318 }, { "epoch": 0.36, "learning_rate": 0.0014870807706071933, "loss": 2.8356, "step": 13319 }, { "epoch": 0.36, "learning_rate": 0.0014870047524795766, "loss": 2.5551, "step": 13320 }, { "epoch": 0.36, "learning_rate": 0.0014869287306624992, "loss": 2.7103, "step": 13321 }, { "epoch": 0.36, "learning_rate": 0.0014868527051565366, "loss": 2.8298, "step": 13322 }, { "epoch": 0.36, "learning_rate": 0.001486776675962265, "loss": 2.4479, "step": 13323 }, { "epoch": 0.36, "learning_rate": 0.0014867006430802604, "loss": 2.4295, "step": 13324 }, { "epoch": 0.36, "learning_rate": 0.0014866246065110987, "loss": 2.7065, "step": 13325 }, { "epoch": 0.36, "learning_rate": 0.0014865485662553563, "loss": 2.6275, "step": 13326 }, { "epoch": 0.36, "learning_rate": 0.0014864725223136083, "loss": 2.5799, "step": 13327 }, { "epoch": 0.36, "learning_rate": 0.0014863964746864317, "loss": 2.7265, "step": 13328 }, { "epoch": 0.36, "learning_rate": 0.0014863204233744028, "loss": 2.6084, "step": 13329 }, { "epoch": 0.36, "learning_rate": 0.0014862443683780968, "loss": 2.5748, "step": 13330 }, { "epoch": 0.36, "learning_rate": 0.0014861683096980905, "loss": 2.3906, "step": 13331 }, { "epoch": 0.36, "learning_rate": 0.00148609224733496, "loss": 2.9915, "step": 13332 }, { "epoch": 0.36, "learning_rate": 0.001486016181289282, "loss": 2.4511, "step": 13333 }, { "epoch": 0.36, "learning_rate": 0.0014859401115616315, "loss": 2.53, "step": 13334 }, { "epoch": 0.36, "learning_rate": 0.001485864038152586, "loss": 2.3094, "step": 13335 }, { "epoch": 0.36, "learning_rate": 0.0014857879610627217, "loss": 2.4679, "step": 13336 }, { "epoch": 0.36, "learning_rate": 0.0014857118802926142, "loss": 2.2826, "step": 13337 }, { "epoch": 0.36, "learning_rate": 0.0014856357958428405, "loss": 2.4122, "step": 13338 }, { "epoch": 0.36, "learning_rate": 0.0014855597077139766, "loss": 2.4163, "step": 13339 }, { "epoch": 0.36, "learning_rate": 0.0014854836159065997, "loss": 3.0407, "step": 13340 }, { "epoch": 0.36, "learning_rate": 0.0014854075204212853, "loss": 2.4218, "step": 13341 }, { "epoch": 0.36, "learning_rate": 0.0014853314212586106, "loss": 2.7219, "step": 13342 }, { "epoch": 0.36, "learning_rate": 0.0014852553184191515, "loss": 2.5252, "step": 13343 }, { "epoch": 0.36, "learning_rate": 0.001485179211903485, "loss": 2.4801, "step": 13344 }, { "epoch": 0.36, "learning_rate": 0.0014851031017121877, "loss": 2.5075, "step": 13345 }, { "epoch": 0.36, "learning_rate": 0.0014850269878458357, "loss": 2.6852, "step": 13346 }, { "epoch": 0.36, "learning_rate": 0.0014849508703050063, "loss": 2.7968, "step": 13347 }, { "epoch": 0.36, "learning_rate": 0.0014848747490902754, "loss": 2.7246, "step": 13348 }, { "epoch": 0.36, "learning_rate": 0.0014847986242022204, "loss": 2.4428, "step": 13349 }, { "epoch": 0.36, "learning_rate": 0.0014847224956414176, "loss": 2.3244, "step": 13350 }, { "epoch": 0.36, "learning_rate": 0.001484646363408444, "loss": 2.4483, "step": 13351 }, { "epoch": 0.36, "learning_rate": 0.001484570227503876, "loss": 2.7494, "step": 13352 }, { "epoch": 0.36, "learning_rate": 0.0014844940879282906, "loss": 2.0726, "step": 13353 }, { "epoch": 0.36, "learning_rate": 0.0014844179446822647, "loss": 2.6999, "step": 13354 }, { "epoch": 0.36, "learning_rate": 0.0014843417977663748, "loss": 2.6215, "step": 13355 }, { "epoch": 0.36, "learning_rate": 0.0014842656471811986, "loss": 3.0465, "step": 13356 }, { "epoch": 0.36, "learning_rate": 0.001484189492927312, "loss": 2.7754, "step": 13357 }, { "epoch": 0.36, "learning_rate": 0.0014841133350052924, "loss": 2.4825, "step": 13358 }, { "epoch": 0.36, "learning_rate": 0.0014840371734157168, "loss": 2.5056, "step": 13359 }, { "epoch": 0.36, "learning_rate": 0.0014839610081591622, "loss": 2.4263, "step": 13360 }, { "epoch": 0.36, "learning_rate": 0.0014838848392362053, "loss": 2.8878, "step": 13361 }, { "epoch": 0.36, "learning_rate": 0.0014838086666474233, "loss": 2.5522, "step": 13362 }, { "epoch": 0.36, "learning_rate": 0.0014837324903933938, "loss": 2.2435, "step": 13363 }, { "epoch": 0.36, "learning_rate": 0.001483656310474693, "loss": 2.7656, "step": 13364 }, { "epoch": 0.36, "learning_rate": 0.0014835801268918986, "loss": 2.7996, "step": 13365 }, { "epoch": 0.36, "learning_rate": 0.0014835039396455876, "loss": 2.7268, "step": 13366 }, { "epoch": 0.36, "learning_rate": 0.0014834277487363373, "loss": 2.315, "step": 13367 }, { "epoch": 0.36, "learning_rate": 0.0014833515541647247, "loss": 2.2887, "step": 13368 }, { "epoch": 0.36, "learning_rate": 0.0014832753559313272, "loss": 2.362, "step": 13369 }, { "epoch": 0.36, "learning_rate": 0.0014831991540367221, "loss": 2.761, "step": 13370 }, { "epoch": 0.36, "learning_rate": 0.0014831229484814862, "loss": 2.5251, "step": 13371 }, { "epoch": 0.36, "learning_rate": 0.0014830467392661975, "loss": 2.164, "step": 13372 }, { "epoch": 0.36, "learning_rate": 0.0014829705263914332, "loss": 2.5509, "step": 13373 }, { "epoch": 0.36, "learning_rate": 0.00148289430985777, "loss": 2.6637, "step": 13374 }, { "epoch": 0.36, "learning_rate": 0.0014828180896657866, "loss": 2.6299, "step": 13375 }, { "epoch": 0.36, "learning_rate": 0.0014827418658160593, "loss": 2.5512, "step": 13376 }, { "epoch": 0.36, "learning_rate": 0.001482665638309166, "loss": 2.2171, "step": 13377 }, { "epoch": 0.36, "learning_rate": 0.0014825894071456838, "loss": 2.6372, "step": 13378 }, { "epoch": 0.36, "learning_rate": 0.0014825131723261908, "loss": 2.7522, "step": 13379 }, { "epoch": 0.36, "learning_rate": 0.0014824369338512643, "loss": 2.3508, "step": 13380 }, { "epoch": 0.36, "learning_rate": 0.0014823606917214818, "loss": 2.8582, "step": 13381 }, { "epoch": 0.36, "learning_rate": 0.001482284445937421, "loss": 2.4048, "step": 13382 }, { "epoch": 0.36, "learning_rate": 0.0014822081964996595, "loss": 2.9165, "step": 13383 }, { "epoch": 0.36, "learning_rate": 0.0014821319434087745, "loss": 2.3833, "step": 13384 }, { "epoch": 0.36, "learning_rate": 0.0014820556866653447, "loss": 2.5345, "step": 13385 }, { "epoch": 0.36, "learning_rate": 0.0014819794262699469, "loss": 2.3609, "step": 13386 }, { "epoch": 0.36, "learning_rate": 0.0014819031622231589, "loss": 2.6253, "step": 13387 }, { "epoch": 0.36, "learning_rate": 0.001481826894525559, "loss": 2.5647, "step": 13388 }, { "epoch": 0.36, "learning_rate": 0.001481750623177725, "loss": 2.7466, "step": 13389 }, { "epoch": 0.36, "learning_rate": 0.0014816743481802337, "loss": 2.4069, "step": 13390 }, { "epoch": 0.36, "learning_rate": 0.001481598069533664, "loss": 2.6586, "step": 13391 }, { "epoch": 0.36, "learning_rate": 0.0014815217872385935, "loss": 2.3982, "step": 13392 }, { "epoch": 0.36, "learning_rate": 0.0014814455012956, "loss": 2.3799, "step": 13393 }, { "epoch": 0.36, "learning_rate": 0.0014813692117052614, "loss": 2.7547, "step": 13394 }, { "epoch": 0.36, "learning_rate": 0.0014812929184681556, "loss": 2.7285, "step": 13395 }, { "epoch": 0.36, "learning_rate": 0.001481216621584861, "loss": 2.1964, "step": 13396 }, { "epoch": 0.36, "learning_rate": 0.001481140321055955, "loss": 2.5248, "step": 13397 }, { "epoch": 0.36, "learning_rate": 0.001481064016882016, "loss": 2.5743, "step": 13398 }, { "epoch": 0.36, "learning_rate": 0.001480987709063622, "loss": 2.806, "step": 13399 }, { "epoch": 0.36, "learning_rate": 0.0014809113976013513, "loss": 2.7227, "step": 13400 }, { "epoch": 0.36, "learning_rate": 0.0014808350824957817, "loss": 2.1963, "step": 13401 }, { "epoch": 0.36, "learning_rate": 0.0014807587637474915, "loss": 2.8885, "step": 13402 }, { "epoch": 0.36, "learning_rate": 0.0014806824413570588, "loss": 2.4613, "step": 13403 }, { "epoch": 0.36, "learning_rate": 0.001480606115325062, "loss": 2.9959, "step": 13404 }, { "epoch": 0.36, "learning_rate": 0.001480529785652079, "loss": 2.524, "step": 13405 }, { "epoch": 0.36, "learning_rate": 0.0014804534523386885, "loss": 2.1598, "step": 13406 }, { "epoch": 0.36, "learning_rate": 0.0014803771153854683, "loss": 2.7825, "step": 13407 }, { "epoch": 0.36, "learning_rate": 0.0014803007747929973, "loss": 2.9043, "step": 13408 }, { "epoch": 0.36, "learning_rate": 0.0014802244305618531, "loss": 2.9716, "step": 13409 }, { "epoch": 0.36, "learning_rate": 0.0014801480826926146, "loss": 2.7168, "step": 13410 }, { "epoch": 0.36, "learning_rate": 0.0014800717311858602, "loss": 2.8911, "step": 13411 }, { "epoch": 0.36, "learning_rate": 0.0014799953760421683, "loss": 2.6369, "step": 13412 }, { "epoch": 0.36, "learning_rate": 0.0014799190172621168, "loss": 2.3763, "step": 13413 }, { "epoch": 0.36, "learning_rate": 0.001479842654846285, "loss": 2.5564, "step": 13414 }, { "epoch": 0.36, "learning_rate": 0.0014797662887952507, "loss": 2.4699, "step": 13415 }, { "epoch": 0.36, "learning_rate": 0.0014796899191095929, "loss": 2.0511, "step": 13416 }, { "epoch": 0.36, "learning_rate": 0.0014796135457898903, "loss": 2.4836, "step": 13417 }, { "epoch": 0.36, "learning_rate": 0.001479537168836721, "loss": 2.8676, "step": 13418 }, { "epoch": 0.36, "learning_rate": 0.001479460788250664, "loss": 2.4423, "step": 13419 }, { "epoch": 0.36, "learning_rate": 0.0014793844040322975, "loss": 2.8267, "step": 13420 }, { "epoch": 0.36, "learning_rate": 0.0014793080161822005, "loss": 2.574, "step": 13421 }, { "epoch": 0.36, "learning_rate": 0.0014792316247009521, "loss": 2.5628, "step": 13422 }, { "epoch": 0.36, "learning_rate": 0.0014791552295891303, "loss": 2.4802, "step": 13423 }, { "epoch": 0.36, "learning_rate": 0.001479078830847314, "loss": 2.7222, "step": 13424 }, { "epoch": 0.36, "learning_rate": 0.0014790024284760822, "loss": 2.6307, "step": 13425 }, { "epoch": 0.36, "learning_rate": 0.0014789260224760139, "loss": 2.3935, "step": 13426 }, { "epoch": 0.36, "learning_rate": 0.0014788496128476873, "loss": 2.6813, "step": 13427 }, { "epoch": 0.36, "learning_rate": 0.001478773199591682, "loss": 2.3858, "step": 13428 }, { "epoch": 0.36, "learning_rate": 0.0014786967827085762, "loss": 2.6829, "step": 13429 }, { "epoch": 0.36, "learning_rate": 0.0014786203621989492, "loss": 2.7429, "step": 13430 }, { "epoch": 0.36, "learning_rate": 0.0014785439380633801, "loss": 2.3978, "step": 13431 }, { "epoch": 0.36, "learning_rate": 0.0014784675103024477, "loss": 2.7218, "step": 13432 }, { "epoch": 0.36, "learning_rate": 0.0014783910789167307, "loss": 2.5578, "step": 13433 }, { "epoch": 0.36, "learning_rate": 0.0014783146439068086, "loss": 2.483, "step": 13434 }, { "epoch": 0.36, "learning_rate": 0.0014782382052732604, "loss": 2.8677, "step": 13435 }, { "epoch": 0.36, "learning_rate": 0.0014781617630166648, "loss": 2.3022, "step": 13436 }, { "epoch": 0.36, "learning_rate": 0.0014780853171376012, "loss": 2.2256, "step": 13437 }, { "epoch": 0.36, "learning_rate": 0.001478008867636649, "loss": 2.6856, "step": 13438 }, { "epoch": 0.36, "learning_rate": 0.001477932414514387, "loss": 2.5833, "step": 13439 }, { "epoch": 0.36, "learning_rate": 0.0014778559577713942, "loss": 2.511, "step": 13440 }, { "epoch": 0.36, "learning_rate": 0.00147777949740825, "loss": 2.5658, "step": 13441 }, { "epoch": 0.36, "learning_rate": 0.0014777030334255344, "loss": 2.606, "step": 13442 }, { "epoch": 0.36, "learning_rate": 0.0014776265658238254, "loss": 2.5226, "step": 13443 }, { "epoch": 0.36, "learning_rate": 0.0014775500946037031, "loss": 2.9886, "step": 13444 }, { "epoch": 0.36, "learning_rate": 0.0014774736197657467, "loss": 2.8028, "step": 13445 }, { "epoch": 0.36, "learning_rate": 0.0014773971413105356, "loss": 2.7808, "step": 13446 }, { "epoch": 0.36, "learning_rate": 0.0014773206592386492, "loss": 2.4569, "step": 13447 }, { "epoch": 0.36, "learning_rate": 0.0014772441735506666, "loss": 2.6701, "step": 13448 }, { "epoch": 0.36, "learning_rate": 0.0014771676842471675, "loss": 2.3741, "step": 13449 }, { "epoch": 0.36, "learning_rate": 0.0014770911913287313, "loss": 2.3996, "step": 13450 }, { "epoch": 0.36, "learning_rate": 0.0014770146947959378, "loss": 2.9025, "step": 13451 }, { "epoch": 0.36, "learning_rate": 0.0014769381946493658, "loss": 2.8348, "step": 13452 }, { "epoch": 0.36, "learning_rate": 0.0014768616908895956, "loss": 2.7327, "step": 13453 }, { "epoch": 0.36, "learning_rate": 0.0014767851835172064, "loss": 2.5519, "step": 13454 }, { "epoch": 0.36, "learning_rate": 0.0014767086725327781, "loss": 2.381, "step": 13455 }, { "epoch": 0.36, "learning_rate": 0.0014766321579368898, "loss": 2.8589, "step": 13456 }, { "epoch": 0.36, "learning_rate": 0.0014765556397301216, "loss": 2.4985, "step": 13457 }, { "epoch": 0.36, "learning_rate": 0.0014764791179130532, "loss": 2.643, "step": 13458 }, { "epoch": 0.36, "learning_rate": 0.001476402592486264, "loss": 2.5742, "step": 13459 }, { "epoch": 0.36, "learning_rate": 0.0014763260634503342, "loss": 2.705, "step": 13460 }, { "epoch": 0.36, "learning_rate": 0.001476249530805843, "loss": 2.329, "step": 13461 }, { "epoch": 0.36, "learning_rate": 0.0014761729945533709, "loss": 2.747, "step": 13462 }, { "epoch": 0.36, "learning_rate": 0.001476096454693497, "loss": 2.4919, "step": 13463 }, { "epoch": 0.36, "learning_rate": 0.0014760199112268013, "loss": 2.1159, "step": 13464 }, { "epoch": 0.36, "learning_rate": 0.0014759433641538641, "loss": 2.5362, "step": 13465 }, { "epoch": 0.36, "learning_rate": 0.0014758668134752652, "loss": 2.6222, "step": 13466 }, { "epoch": 0.36, "learning_rate": 0.0014757902591915843, "loss": 2.7392, "step": 13467 }, { "epoch": 0.36, "learning_rate": 0.0014757137013034014, "loss": 2.7688, "step": 13468 }, { "epoch": 0.36, "learning_rate": 0.0014756371398112966, "loss": 2.7971, "step": 13469 }, { "epoch": 0.36, "learning_rate": 0.0014755605747158499, "loss": 2.2536, "step": 13470 }, { "epoch": 0.36, "learning_rate": 0.0014754840060176408, "loss": 2.7054, "step": 13471 }, { "epoch": 0.36, "learning_rate": 0.0014754074337172507, "loss": 2.7781, "step": 13472 }, { "epoch": 0.36, "learning_rate": 0.0014753308578152585, "loss": 2.7477, "step": 13473 }, { "epoch": 0.36, "learning_rate": 0.0014752542783122446, "loss": 2.7248, "step": 13474 }, { "epoch": 0.36, "learning_rate": 0.0014751776952087892, "loss": 2.6735, "step": 13475 }, { "epoch": 0.36, "learning_rate": 0.0014751011085054725, "loss": 2.5876, "step": 13476 }, { "epoch": 0.36, "learning_rate": 0.0014750245182028753, "loss": 2.5966, "step": 13477 }, { "epoch": 0.36, "learning_rate": 0.0014749479243015768, "loss": 2.187, "step": 13478 }, { "epoch": 0.36, "learning_rate": 0.0014748713268021578, "loss": 2.7541, "step": 13479 }, { "epoch": 0.36, "learning_rate": 0.0014747947257051986, "loss": 2.7765, "step": 13480 }, { "epoch": 0.36, "learning_rate": 0.0014747181210112794, "loss": 2.9916, "step": 13481 }, { "epoch": 0.36, "learning_rate": 0.001474641512720981, "loss": 2.3426, "step": 13482 }, { "epoch": 0.36, "learning_rate": 0.0014745649008348824, "loss": 2.7753, "step": 13483 }, { "epoch": 0.36, "learning_rate": 0.0014744882853535658, "loss": 2.5191, "step": 13484 }, { "epoch": 0.36, "learning_rate": 0.0014744116662776107, "loss": 2.5317, "step": 13485 }, { "epoch": 0.36, "learning_rate": 0.0014743350436075971, "loss": 2.4612, "step": 13486 }, { "epoch": 0.36, "learning_rate": 0.0014742584173441063, "loss": 2.1882, "step": 13487 }, { "epoch": 0.36, "learning_rate": 0.0014741817874877189, "loss": 2.5088, "step": 13488 }, { "epoch": 0.36, "learning_rate": 0.0014741051540390145, "loss": 2.392, "step": 13489 }, { "epoch": 0.36, "learning_rate": 0.0014740285169985747, "loss": 2.5814, "step": 13490 }, { "epoch": 0.36, "learning_rate": 0.001473951876366979, "loss": 2.3681, "step": 13491 }, { "epoch": 0.36, "learning_rate": 0.0014738752321448092, "loss": 2.4775, "step": 13492 }, { "epoch": 0.36, "learning_rate": 0.001473798584332645, "loss": 2.1451, "step": 13493 }, { "epoch": 0.36, "learning_rate": 0.0014737219329310676, "loss": 2.7145, "step": 13494 }, { "epoch": 0.36, "learning_rate": 0.0014736452779406575, "loss": 2.7336, "step": 13495 }, { "epoch": 0.36, "learning_rate": 0.0014735686193619953, "loss": 2.2558, "step": 13496 }, { "epoch": 0.36, "learning_rate": 0.0014734919571956619, "loss": 2.9188, "step": 13497 }, { "epoch": 0.36, "learning_rate": 0.0014734152914422385, "loss": 2.4187, "step": 13498 }, { "epoch": 0.36, "learning_rate": 0.0014733386221023048, "loss": 2.9913, "step": 13499 }, { "epoch": 0.36, "learning_rate": 0.001473261949176443, "loss": 2.7127, "step": 13500 }, { "epoch": 0.36, "learning_rate": 0.001473185272665233, "loss": 2.947, "step": 13501 }, { "epoch": 0.36, "learning_rate": 0.001473108592569256, "loss": 2.5917, "step": 13502 }, { "epoch": 0.36, "learning_rate": 0.0014730319088890928, "loss": 2.8061, "step": 13503 }, { "epoch": 0.36, "learning_rate": 0.0014729552216253246, "loss": 2.5452, "step": 13504 }, { "epoch": 0.36, "learning_rate": 0.0014728785307785322, "loss": 2.4477, "step": 13505 }, { "epoch": 0.36, "learning_rate": 0.0014728018363492966, "loss": 2.6076, "step": 13506 }, { "epoch": 0.36, "learning_rate": 0.0014727251383381986, "loss": 2.5883, "step": 13507 }, { "epoch": 0.36, "learning_rate": 0.0014726484367458194, "loss": 2.8167, "step": 13508 }, { "epoch": 0.36, "learning_rate": 0.0014725717315727405, "loss": 2.5459, "step": 13509 }, { "epoch": 0.36, "learning_rate": 0.0014724950228195421, "loss": 2.5867, "step": 13510 }, { "epoch": 0.36, "learning_rate": 0.0014724183104868065, "loss": 2.8, "step": 13511 }, { "epoch": 0.36, "learning_rate": 0.001472341594575114, "loss": 2.7259, "step": 13512 }, { "epoch": 0.36, "learning_rate": 0.0014722648750850463, "loss": 2.6768, "step": 13513 }, { "epoch": 0.36, "learning_rate": 0.0014721881520171837, "loss": 2.3765, "step": 13514 }, { "epoch": 0.36, "learning_rate": 0.0014721114253721085, "loss": 2.9345, "step": 13515 }, { "epoch": 0.36, "learning_rate": 0.0014720346951504015, "loss": 2.6895, "step": 13516 }, { "epoch": 0.36, "learning_rate": 0.001471957961352644, "loss": 2.5478, "step": 13517 }, { "epoch": 0.36, "learning_rate": 0.0014718812239794174, "loss": 2.7353, "step": 13518 }, { "epoch": 0.36, "learning_rate": 0.001471804483031303, "loss": 2.3539, "step": 13519 }, { "epoch": 0.36, "learning_rate": 0.0014717277385088822, "loss": 2.2815, "step": 13520 }, { "epoch": 0.36, "learning_rate": 0.0014716509904127365, "loss": 2.8825, "step": 13521 }, { "epoch": 0.36, "learning_rate": 0.0014715742387434471, "loss": 2.8716, "step": 13522 }, { "epoch": 0.36, "learning_rate": 0.0014714974835015955, "loss": 2.501, "step": 13523 }, { "epoch": 0.36, "learning_rate": 0.0014714207246877636, "loss": 2.3438, "step": 13524 }, { "epoch": 0.36, "learning_rate": 0.0014713439623025319, "loss": 2.4386, "step": 13525 }, { "epoch": 0.36, "learning_rate": 0.0014712671963464832, "loss": 2.7243, "step": 13526 }, { "epoch": 0.36, "learning_rate": 0.0014711904268201984, "loss": 2.3751, "step": 13527 }, { "epoch": 0.36, "learning_rate": 0.001471113653724259, "loss": 2.1045, "step": 13528 }, { "epoch": 0.36, "learning_rate": 0.0014710368770592468, "loss": 2.7504, "step": 13529 }, { "epoch": 0.36, "learning_rate": 0.0014709600968257435, "loss": 2.4335, "step": 13530 }, { "epoch": 0.36, "learning_rate": 0.001470883313024331, "loss": 2.4108, "step": 13531 }, { "epoch": 0.36, "learning_rate": 0.00147080652565559, "loss": 2.739, "step": 13532 }, { "epoch": 0.36, "learning_rate": 0.0014707297347201036, "loss": 2.5479, "step": 13533 }, { "epoch": 0.36, "learning_rate": 0.0014706529402184526, "loss": 2.2869, "step": 13534 }, { "epoch": 0.36, "learning_rate": 0.001470576142151219, "loss": 2.7403, "step": 13535 }, { "epoch": 0.36, "learning_rate": 0.0014704993405189849, "loss": 2.7442, "step": 13536 }, { "epoch": 0.36, "learning_rate": 0.0014704225353223317, "loss": 3.1035, "step": 13537 }, { "epoch": 0.36, "learning_rate": 0.0014703457265618414, "loss": 2.9141, "step": 13538 }, { "epoch": 0.36, "learning_rate": 0.0014702689142380963, "loss": 2.5176, "step": 13539 }, { "epoch": 0.36, "learning_rate": 0.0014701920983516779, "loss": 2.7738, "step": 13540 }, { "epoch": 0.36, "learning_rate": 0.0014701152789031683, "loss": 2.5143, "step": 13541 }, { "epoch": 0.36, "learning_rate": 0.0014700384558931489, "loss": 2.443, "step": 13542 }, { "epoch": 0.36, "learning_rate": 0.0014699616293222025, "loss": 2.4642, "step": 13543 }, { "epoch": 0.36, "learning_rate": 0.001469884799190911, "loss": 2.522, "step": 13544 }, { "epoch": 0.36, "learning_rate": 0.001469807965499856, "loss": 2.2241, "step": 13545 }, { "epoch": 0.36, "learning_rate": 0.0014697311282496196, "loss": 2.3423, "step": 13546 }, { "epoch": 0.36, "learning_rate": 0.0014696542874407849, "loss": 2.4109, "step": 13547 }, { "epoch": 0.36, "learning_rate": 0.0014695774430739331, "loss": 2.5781, "step": 13548 }, { "epoch": 0.36, "learning_rate": 0.0014695005951496458, "loss": 2.6358, "step": 13549 }, { "epoch": 0.36, "learning_rate": 0.0014694237436685066, "loss": 2.6791, "step": 13550 }, { "epoch": 0.36, "learning_rate": 0.001469346888631097, "loss": 2.7217, "step": 13551 }, { "epoch": 0.36, "learning_rate": 0.0014692700300379992, "loss": 2.9861, "step": 13552 }, { "epoch": 0.36, "learning_rate": 0.0014691931678897953, "loss": 2.1566, "step": 13553 }, { "epoch": 0.36, "learning_rate": 0.0014691163021870685, "loss": 2.6873, "step": 13554 }, { "epoch": 0.36, "learning_rate": 0.0014690394329303998, "loss": 2.917, "step": 13555 }, { "epoch": 0.36, "learning_rate": 0.0014689625601203727, "loss": 2.8369, "step": 13556 }, { "epoch": 0.36, "learning_rate": 0.0014688856837575686, "loss": 2.2838, "step": 13557 }, { "epoch": 0.36, "learning_rate": 0.001468808803842571, "loss": 2.6469, "step": 13558 }, { "epoch": 0.36, "learning_rate": 0.001468731920375961, "loss": 2.6254, "step": 13559 }, { "epoch": 0.36, "learning_rate": 0.0014686550333583223, "loss": 2.3328, "step": 13560 }, { "epoch": 0.36, "learning_rate": 0.0014685781427902366, "loss": 2.8119, "step": 13561 }, { "epoch": 0.36, "learning_rate": 0.0014685012486722866, "loss": 2.4296, "step": 13562 }, { "epoch": 0.36, "learning_rate": 0.0014684243510050552, "loss": 2.8732, "step": 13563 }, { "epoch": 0.36, "learning_rate": 0.0014683474497891246, "loss": 2.4143, "step": 13564 }, { "epoch": 0.36, "learning_rate": 0.0014682705450250772, "loss": 2.3859, "step": 13565 }, { "epoch": 0.36, "learning_rate": 0.001468193636713496, "loss": 2.4032, "step": 13566 }, { "epoch": 0.36, "learning_rate": 0.0014681167248549638, "loss": 2.7077, "step": 13567 }, { "epoch": 0.36, "learning_rate": 0.0014680398094500627, "loss": 2.7854, "step": 13568 }, { "epoch": 0.36, "learning_rate": 0.0014679628904993756, "loss": 2.5691, "step": 13569 }, { "epoch": 0.36, "learning_rate": 0.0014678859680034855, "loss": 2.7368, "step": 13570 }, { "epoch": 0.36, "learning_rate": 0.0014678090419629748, "loss": 2.502, "step": 13571 }, { "epoch": 0.36, "learning_rate": 0.0014677321123784265, "loss": 2.5086, "step": 13572 }, { "epoch": 0.36, "learning_rate": 0.0014676551792504233, "loss": 2.649, "step": 13573 }, { "epoch": 0.36, "learning_rate": 0.0014675782425795482, "loss": 2.3885, "step": 13574 }, { "epoch": 0.36, "learning_rate": 0.0014675013023663838, "loss": 2.2886, "step": 13575 }, { "epoch": 0.36, "learning_rate": 0.0014674243586115133, "loss": 2.5227, "step": 13576 }, { "epoch": 0.36, "learning_rate": 0.0014673474113155191, "loss": 2.9263, "step": 13577 }, { "epoch": 0.36, "learning_rate": 0.0014672704604789847, "loss": 2.8072, "step": 13578 }, { "epoch": 0.36, "learning_rate": 0.0014671935061024927, "loss": 2.6556, "step": 13579 }, { "epoch": 0.36, "learning_rate": 0.0014671165481866266, "loss": 2.2746, "step": 13580 }, { "epoch": 0.36, "learning_rate": 0.0014670395867319686, "loss": 2.7554, "step": 13581 }, { "epoch": 0.36, "learning_rate": 0.0014669626217391023, "loss": 2.4848, "step": 13582 }, { "epoch": 0.37, "learning_rate": 0.0014668856532086107, "loss": 2.2784, "step": 13583 }, { "epoch": 0.37, "learning_rate": 0.0014668086811410767, "loss": 2.7935, "step": 13584 }, { "epoch": 0.37, "learning_rate": 0.0014667317055370838, "loss": 2.4229, "step": 13585 }, { "epoch": 0.37, "learning_rate": 0.001466654726397215, "loss": 2.7978, "step": 13586 }, { "epoch": 0.37, "learning_rate": 0.0014665777437220535, "loss": 2.6401, "step": 13587 }, { "epoch": 0.37, "learning_rate": 0.0014665007575121822, "loss": 2.5668, "step": 13588 }, { "epoch": 0.37, "learning_rate": 0.0014664237677681844, "loss": 2.6196, "step": 13589 }, { "epoch": 0.37, "learning_rate": 0.001466346774490644, "loss": 2.51, "step": 13590 }, { "epoch": 0.37, "learning_rate": 0.0014662697776801435, "loss": 2.7742, "step": 13591 }, { "epoch": 0.37, "learning_rate": 0.0014661927773372664, "loss": 2.4243, "step": 13592 }, { "epoch": 0.37, "learning_rate": 0.0014661157734625965, "loss": 2.5686, "step": 13593 }, { "epoch": 0.37, "learning_rate": 0.0014660387660567168, "loss": 2.3763, "step": 13594 }, { "epoch": 0.37, "learning_rate": 0.0014659617551202105, "loss": 2.3063, "step": 13595 }, { "epoch": 0.37, "learning_rate": 0.0014658847406536612, "loss": 2.2544, "step": 13596 }, { "epoch": 0.37, "learning_rate": 0.0014658077226576526, "loss": 2.4898, "step": 13597 }, { "epoch": 0.37, "learning_rate": 0.001465730701132768, "loss": 2.5567, "step": 13598 }, { "epoch": 0.37, "learning_rate": 0.0014656536760795909, "loss": 2.3492, "step": 13599 }, { "epoch": 0.37, "learning_rate": 0.0014655766474987045, "loss": 2.7357, "step": 13600 }, { "epoch": 0.37, "learning_rate": 0.001465499615390693, "loss": 2.3894, "step": 13601 }, { "epoch": 0.37, "learning_rate": 0.0014654225797561394, "loss": 2.9682, "step": 13602 }, { "epoch": 0.37, "learning_rate": 0.0014653455405956278, "loss": 2.4424, "step": 13603 }, { "epoch": 0.37, "learning_rate": 0.0014652684979097413, "loss": 2.6582, "step": 13604 }, { "epoch": 0.37, "learning_rate": 0.0014651914516990638, "loss": 2.8019, "step": 13605 }, { "epoch": 0.37, "learning_rate": 0.0014651144019641796, "loss": 2.2746, "step": 13606 }, { "epoch": 0.37, "learning_rate": 0.0014650373487056713, "loss": 2.757, "step": 13607 }, { "epoch": 0.37, "learning_rate": 0.001464960291924123, "loss": 2.7892, "step": 13608 }, { "epoch": 0.37, "learning_rate": 0.0014648832316201193, "loss": 2.8191, "step": 13609 }, { "epoch": 0.37, "learning_rate": 0.001464806167794243, "loss": 2.6188, "step": 13610 }, { "epoch": 0.37, "learning_rate": 0.0014647291004470783, "loss": 2.7715, "step": 13611 }, { "epoch": 0.37, "learning_rate": 0.001464652029579209, "loss": 2.4293, "step": 13612 }, { "epoch": 0.37, "learning_rate": 0.001464574955191219, "loss": 2.3732, "step": 13613 }, { "epoch": 0.37, "learning_rate": 0.0014644978772836922, "loss": 2.3787, "step": 13614 }, { "epoch": 0.37, "learning_rate": 0.0014644207958572127, "loss": 2.3061, "step": 13615 }, { "epoch": 0.37, "learning_rate": 0.001464343710912364, "loss": 2.1255, "step": 13616 }, { "epoch": 0.37, "learning_rate": 0.0014642666224497305, "loss": 2.7806, "step": 13617 }, { "epoch": 0.37, "learning_rate": 0.001464189530469896, "loss": 2.5873, "step": 13618 }, { "epoch": 0.37, "learning_rate": 0.001464112434973445, "loss": 2.7482, "step": 13619 }, { "epoch": 0.37, "learning_rate": 0.0014640353359609607, "loss": 2.7582, "step": 13620 }, { "epoch": 0.37, "learning_rate": 0.0014639582334330275, "loss": 2.5714, "step": 13621 }, { "epoch": 0.37, "learning_rate": 0.00146388112739023, "loss": 2.5936, "step": 13622 }, { "epoch": 0.37, "learning_rate": 0.001463804017833152, "loss": 2.6703, "step": 13623 }, { "epoch": 0.37, "learning_rate": 0.0014637269047623777, "loss": 3.2231, "step": 13624 }, { "epoch": 0.37, "learning_rate": 0.0014636497881784912, "loss": 2.26, "step": 13625 }, { "epoch": 0.37, "learning_rate": 0.0014635726680820769, "loss": 2.5635, "step": 13626 }, { "epoch": 0.37, "learning_rate": 0.0014634955444737187, "loss": 2.4793, "step": 13627 }, { "epoch": 0.37, "learning_rate": 0.0014634184173540014, "loss": 2.4849, "step": 13628 }, { "epoch": 0.37, "learning_rate": 0.001463341286723509, "loss": 2.9467, "step": 13629 }, { "epoch": 0.37, "learning_rate": 0.0014632641525828259, "loss": 2.4446, "step": 13630 }, { "epoch": 0.37, "learning_rate": 0.0014631870149325362, "loss": 2.7259, "step": 13631 }, { "epoch": 0.37, "learning_rate": 0.0014631098737732245, "loss": 2.7044, "step": 13632 }, { "epoch": 0.37, "learning_rate": 0.0014630327291054752, "loss": 2.675, "step": 13633 }, { "epoch": 0.37, "learning_rate": 0.0014629555809298727, "loss": 2.8164, "step": 13634 }, { "epoch": 0.37, "learning_rate": 0.0014628784292470014, "loss": 2.8829, "step": 13635 }, { "epoch": 0.37, "learning_rate": 0.0014628012740574463, "loss": 2.3402, "step": 13636 }, { "epoch": 0.37, "learning_rate": 0.0014627241153617914, "loss": 2.5661, "step": 13637 }, { "epoch": 0.37, "learning_rate": 0.001462646953160621, "loss": 2.5516, "step": 13638 }, { "epoch": 0.37, "learning_rate": 0.0014625697874545201, "loss": 2.8941, "step": 13639 }, { "epoch": 0.37, "learning_rate": 0.0014624926182440735, "loss": 2.6173, "step": 13640 }, { "epoch": 0.37, "learning_rate": 0.001462415445529865, "loss": 2.6803, "step": 13641 }, { "epoch": 0.37, "learning_rate": 0.00146233826931248, "loss": 2.8295, "step": 13642 }, { "epoch": 0.37, "learning_rate": 0.001462261089592503, "loss": 2.9346, "step": 13643 }, { "epoch": 0.37, "learning_rate": 0.0014621839063705187, "loss": 2.9114, "step": 13644 }, { "epoch": 0.37, "learning_rate": 0.0014621067196471113, "loss": 2.6209, "step": 13645 }, { "epoch": 0.37, "learning_rate": 0.0014620295294228668, "loss": 2.5169, "step": 13646 }, { "epoch": 0.37, "learning_rate": 0.0014619523356983683, "loss": 3.0687, "step": 13647 }, { "epoch": 0.37, "learning_rate": 0.001461875138474202, "loss": 2.5523, "step": 13648 }, { "epoch": 0.37, "learning_rate": 0.0014617979377509523, "loss": 2.3835, "step": 13649 }, { "epoch": 0.37, "learning_rate": 0.0014617207335292039, "loss": 2.3995, "step": 13650 }, { "epoch": 0.37, "learning_rate": 0.0014616435258095412, "loss": 2.712, "step": 13651 }, { "epoch": 0.37, "learning_rate": 0.0014615663145925504, "loss": 2.5907, "step": 13652 }, { "epoch": 0.37, "learning_rate": 0.0014614890998788158, "loss": 2.5078, "step": 13653 }, { "epoch": 0.37, "learning_rate": 0.0014614118816689218, "loss": 2.5945, "step": 13654 }, { "epoch": 0.37, "learning_rate": 0.001461334659963454, "loss": 2.739, "step": 13655 }, { "epoch": 0.37, "learning_rate": 0.0014612574347629974, "loss": 2.3028, "step": 13656 }, { "epoch": 0.37, "learning_rate": 0.001461180206068137, "loss": 2.5727, "step": 13657 }, { "epoch": 0.37, "learning_rate": 0.0014611029738794575, "loss": 2.3861, "step": 13658 }, { "epoch": 0.37, "learning_rate": 0.0014610257381975447, "loss": 2.2845, "step": 13659 }, { "epoch": 0.37, "learning_rate": 0.0014609484990229832, "loss": 2.8169, "step": 13660 }, { "epoch": 0.37, "learning_rate": 0.0014608712563563579, "loss": 2.8339, "step": 13661 }, { "epoch": 0.37, "learning_rate": 0.0014607940101982549, "loss": 2.703, "step": 13662 }, { "epoch": 0.37, "learning_rate": 0.0014607167605492587, "loss": 3.0687, "step": 13663 }, { "epoch": 0.37, "learning_rate": 0.0014606395074099545, "loss": 2.377, "step": 13664 }, { "epoch": 0.37, "learning_rate": 0.001460562250780928, "loss": 2.4451, "step": 13665 }, { "epoch": 0.37, "learning_rate": 0.001460484990662764, "loss": 2.8858, "step": 13666 }, { "epoch": 0.37, "learning_rate": 0.0014604077270560483, "loss": 2.5411, "step": 13667 }, { "epoch": 0.37, "learning_rate": 0.0014603304599613658, "loss": 2.9199, "step": 13668 }, { "epoch": 0.37, "learning_rate": 0.001460253189379302, "loss": 2.1347, "step": 13669 }, { "epoch": 0.37, "learning_rate": 0.0014601759153104424, "loss": 2.1376, "step": 13670 }, { "epoch": 0.37, "learning_rate": 0.0014600986377553721, "loss": 2.4198, "step": 13671 }, { "epoch": 0.37, "learning_rate": 0.0014600213567146773, "loss": 2.8316, "step": 13672 }, { "epoch": 0.37, "learning_rate": 0.0014599440721889427, "loss": 2.814, "step": 13673 }, { "epoch": 0.37, "learning_rate": 0.0014598667841787536, "loss": 2.7054, "step": 13674 }, { "epoch": 0.37, "learning_rate": 0.0014597894926846964, "loss": 2.4411, "step": 13675 }, { "epoch": 0.37, "learning_rate": 0.0014597121977073565, "loss": 2.1323, "step": 13676 }, { "epoch": 0.37, "learning_rate": 0.0014596348992473188, "loss": 2.343, "step": 13677 }, { "epoch": 0.37, "learning_rate": 0.001459557597305169, "loss": 2.4078, "step": 13678 }, { "epoch": 0.37, "learning_rate": 0.0014594802918814936, "loss": 2.202, "step": 13679 }, { "epoch": 0.37, "learning_rate": 0.0014594029829768772, "loss": 2.9595, "step": 13680 }, { "epoch": 0.37, "learning_rate": 0.0014593256705919063, "loss": 2.5336, "step": 13681 }, { "epoch": 0.37, "learning_rate": 0.0014592483547271658, "loss": 2.6117, "step": 13682 }, { "epoch": 0.37, "learning_rate": 0.0014591710353832421, "loss": 2.5229, "step": 13683 }, { "epoch": 0.37, "learning_rate": 0.0014590937125607208, "loss": 2.7398, "step": 13684 }, { "epoch": 0.37, "learning_rate": 0.0014590163862601877, "loss": 2.8559, "step": 13685 }, { "epoch": 0.37, "learning_rate": 0.0014589390564822282, "loss": 2.4718, "step": 13686 }, { "epoch": 0.37, "learning_rate": 0.0014588617232274286, "loss": 2.8064, "step": 13687 }, { "epoch": 0.37, "learning_rate": 0.0014587843864963747, "loss": 2.6413, "step": 13688 }, { "epoch": 0.37, "learning_rate": 0.0014587070462896525, "loss": 2.3288, "step": 13689 }, { "epoch": 0.37, "learning_rate": 0.0014586297026078473, "loss": 2.4294, "step": 13690 }, { "epoch": 0.37, "learning_rate": 0.0014585523554515457, "loss": 2.4786, "step": 13691 }, { "epoch": 0.37, "learning_rate": 0.0014584750048213335, "loss": 2.5954, "step": 13692 }, { "epoch": 0.37, "learning_rate": 0.0014583976507177964, "loss": 2.5026, "step": 13693 }, { "epoch": 0.37, "learning_rate": 0.0014583202931415208, "loss": 2.5477, "step": 13694 }, { "epoch": 0.37, "learning_rate": 0.0014582429320930926, "loss": 2.7684, "step": 13695 }, { "epoch": 0.37, "learning_rate": 0.0014581655675730979, "loss": 2.6543, "step": 13696 }, { "epoch": 0.37, "learning_rate": 0.0014580881995821227, "loss": 2.4305, "step": 13697 }, { "epoch": 0.37, "learning_rate": 0.0014580108281207532, "loss": 2.7293, "step": 13698 }, { "epoch": 0.37, "learning_rate": 0.0014579334531895755, "loss": 2.5086, "step": 13699 }, { "epoch": 0.37, "learning_rate": 0.0014578560747891757, "loss": 2.22, "step": 13700 }, { "epoch": 0.37, "learning_rate": 0.0014577786929201404, "loss": 3.0333, "step": 13701 }, { "epoch": 0.37, "learning_rate": 0.0014577013075830556, "loss": 2.5412, "step": 13702 }, { "epoch": 0.37, "learning_rate": 0.0014576239187785076, "loss": 2.4156, "step": 13703 }, { "epoch": 0.37, "learning_rate": 0.0014575465265070822, "loss": 2.3563, "step": 13704 }, { "epoch": 0.37, "learning_rate": 0.0014574691307693663, "loss": 2.5869, "step": 13705 }, { "epoch": 0.37, "learning_rate": 0.0014573917315659464, "loss": 2.5015, "step": 13706 }, { "epoch": 0.37, "learning_rate": 0.001457314328897408, "loss": 2.5865, "step": 13707 }, { "epoch": 0.37, "learning_rate": 0.0014572369227643382, "loss": 2.335, "step": 13708 }, { "epoch": 0.37, "learning_rate": 0.0014571595131673233, "loss": 2.3648, "step": 13709 }, { "epoch": 0.37, "learning_rate": 0.0014570821001069496, "loss": 2.7933, "step": 13710 }, { "epoch": 0.37, "learning_rate": 0.0014570046835838037, "loss": 2.7443, "step": 13711 }, { "epoch": 0.37, "learning_rate": 0.001456927263598472, "loss": 2.5379, "step": 13712 }, { "epoch": 0.37, "learning_rate": 0.0014568498401515409, "loss": 2.3035, "step": 13713 }, { "epoch": 0.37, "learning_rate": 0.0014567724132435972, "loss": 2.3949, "step": 13714 }, { "epoch": 0.37, "learning_rate": 0.0014566949828752273, "loss": 2.4003, "step": 13715 }, { "epoch": 0.37, "learning_rate": 0.0014566175490470182, "loss": 2.5213, "step": 13716 }, { "epoch": 0.37, "learning_rate": 0.0014565401117595553, "loss": 1.9833, "step": 13717 }, { "epoch": 0.37, "learning_rate": 0.001456462671013427, "loss": 2.5499, "step": 13718 }, { "epoch": 0.37, "learning_rate": 0.0014563852268092191, "loss": 2.912, "step": 13719 }, { "epoch": 0.37, "learning_rate": 0.001456307779147518, "loss": 2.7262, "step": 13720 }, { "epoch": 0.37, "learning_rate": 0.0014562303280289104, "loss": 2.7657, "step": 13721 }, { "epoch": 0.37, "learning_rate": 0.0014561528734539839, "loss": 2.5394, "step": 13722 }, { "epoch": 0.37, "learning_rate": 0.001456075415423325, "loss": 2.7461, "step": 13723 }, { "epoch": 0.37, "learning_rate": 0.0014559979539375196, "loss": 2.7787, "step": 13724 }, { "epoch": 0.37, "learning_rate": 0.0014559204889971556, "loss": 2.3565, "step": 13725 }, { "epoch": 0.37, "learning_rate": 0.0014558430206028196, "loss": 2.3817, "step": 13726 }, { "epoch": 0.37, "learning_rate": 0.0014557655487550984, "loss": 2.7546, "step": 13727 }, { "epoch": 0.37, "learning_rate": 0.0014556880734545787, "loss": 2.612, "step": 13728 }, { "epoch": 0.37, "learning_rate": 0.0014556105947018476, "loss": 2.6109, "step": 13729 }, { "epoch": 0.37, "learning_rate": 0.001455533112497492, "loss": 2.7468, "step": 13730 }, { "epoch": 0.37, "learning_rate": 0.0014554556268420993, "loss": 2.5079, "step": 13731 }, { "epoch": 0.37, "learning_rate": 0.0014553781377362558, "loss": 2.6535, "step": 13732 }, { "epoch": 0.37, "learning_rate": 0.0014553006451805495, "loss": 3.0203, "step": 13733 }, { "epoch": 0.37, "learning_rate": 0.0014552231491755665, "loss": 2.2206, "step": 13734 }, { "epoch": 0.37, "learning_rate": 0.0014551456497218945, "loss": 2.6379, "step": 13735 }, { "epoch": 0.37, "learning_rate": 0.0014550681468201202, "loss": 2.9728, "step": 13736 }, { "epoch": 0.37, "learning_rate": 0.001454990640470831, "loss": 2.3754, "step": 13737 }, { "epoch": 0.37, "learning_rate": 0.001454913130674614, "loss": 2.5612, "step": 13738 }, { "epoch": 0.37, "learning_rate": 0.001454835617432057, "loss": 2.2616, "step": 13739 }, { "epoch": 0.37, "learning_rate": 0.001454758100743746, "loss": 2.5222, "step": 13740 }, { "epoch": 0.37, "learning_rate": 0.0014546805806102694, "loss": 2.4026, "step": 13741 }, { "epoch": 0.37, "learning_rate": 0.0014546030570322139, "loss": 2.1173, "step": 13742 }, { "epoch": 0.37, "learning_rate": 0.0014545255300101667, "loss": 2.6288, "step": 13743 }, { "epoch": 0.37, "learning_rate": 0.0014544479995447154, "loss": 2.2715, "step": 13744 }, { "epoch": 0.37, "learning_rate": 0.0014543704656364476, "loss": 2.5002, "step": 13745 }, { "epoch": 0.37, "learning_rate": 0.0014542929282859503, "loss": 2.2503, "step": 13746 }, { "epoch": 0.37, "learning_rate": 0.001454215387493811, "loss": 2.3339, "step": 13747 }, { "epoch": 0.37, "learning_rate": 0.0014541378432606168, "loss": 2.7978, "step": 13748 }, { "epoch": 0.37, "learning_rate": 0.0014540602955869558, "loss": 2.8012, "step": 13749 }, { "epoch": 0.37, "learning_rate": 0.001453982744473415, "loss": 2.4053, "step": 13750 }, { "epoch": 0.37, "learning_rate": 0.0014539051899205822, "loss": 2.6314, "step": 13751 }, { "epoch": 0.37, "learning_rate": 0.0014538276319290447, "loss": 2.4409, "step": 13752 }, { "epoch": 0.37, "learning_rate": 0.0014537500704993901, "loss": 2.5922, "step": 13753 }, { "epoch": 0.37, "learning_rate": 0.0014536725056322065, "loss": 2.4458, "step": 13754 }, { "epoch": 0.37, "learning_rate": 0.001453594937328081, "loss": 2.6668, "step": 13755 }, { "epoch": 0.37, "learning_rate": 0.0014535173655876013, "loss": 2.3989, "step": 13756 }, { "epoch": 0.37, "learning_rate": 0.001453439790411355, "loss": 2.4056, "step": 13757 }, { "epoch": 0.37, "learning_rate": 0.00145336221179993, "loss": 2.2061, "step": 13758 }, { "epoch": 0.37, "learning_rate": 0.001453284629753914, "loss": 2.4408, "step": 13759 }, { "epoch": 0.37, "learning_rate": 0.0014532070442738942, "loss": 2.5378, "step": 13760 }, { "epoch": 0.37, "learning_rate": 0.0014531294553604595, "loss": 2.6614, "step": 13761 }, { "epoch": 0.37, "learning_rate": 0.001453051863014197, "loss": 2.6281, "step": 13762 }, { "epoch": 0.37, "learning_rate": 0.0014529742672356942, "loss": 2.6782, "step": 13763 }, { "epoch": 0.37, "learning_rate": 0.0014528966680255396, "loss": 2.7375, "step": 13764 }, { "epoch": 0.37, "learning_rate": 0.0014528190653843207, "loss": 2.8473, "step": 13765 }, { "epoch": 0.37, "learning_rate": 0.0014527414593126255, "loss": 2.7362, "step": 13766 }, { "epoch": 0.37, "learning_rate": 0.0014526638498110424, "loss": 2.6428, "step": 13767 }, { "epoch": 0.37, "learning_rate": 0.0014525862368801584, "loss": 2.3869, "step": 13768 }, { "epoch": 0.37, "learning_rate": 0.001452508620520562, "loss": 2.2539, "step": 13769 }, { "epoch": 0.37, "learning_rate": 0.0014524310007328412, "loss": 2.5986, "step": 13770 }, { "epoch": 0.37, "learning_rate": 0.001452353377517584, "loss": 2.8689, "step": 13771 }, { "epoch": 0.37, "learning_rate": 0.0014522757508753789, "loss": 2.5079, "step": 13772 }, { "epoch": 0.37, "learning_rate": 0.0014521981208068132, "loss": 2.4, "step": 13773 }, { "epoch": 0.37, "learning_rate": 0.0014521204873124754, "loss": 2.5337, "step": 13774 }, { "epoch": 0.37, "learning_rate": 0.0014520428503929537, "loss": 2.7344, "step": 13775 }, { "epoch": 0.37, "learning_rate": 0.0014519652100488361, "loss": 2.7295, "step": 13776 }, { "epoch": 0.37, "learning_rate": 0.001451887566280711, "loss": 2.4659, "step": 13777 }, { "epoch": 0.37, "learning_rate": 0.0014518099190891664, "loss": 2.535, "step": 13778 }, { "epoch": 0.37, "learning_rate": 0.0014517322684747906, "loss": 2.9175, "step": 13779 }, { "epoch": 0.37, "learning_rate": 0.001451654614438172, "loss": 2.469, "step": 13780 }, { "epoch": 0.37, "learning_rate": 0.0014515769569798987, "loss": 2.765, "step": 13781 }, { "epoch": 0.37, "learning_rate": 0.0014514992961005594, "loss": 2.7921, "step": 13782 }, { "epoch": 0.37, "learning_rate": 0.0014514216318007415, "loss": 2.6495, "step": 13783 }, { "epoch": 0.37, "learning_rate": 0.0014513439640810347, "loss": 2.8963, "step": 13784 }, { "epoch": 0.37, "learning_rate": 0.0014512662929420264, "loss": 2.3886, "step": 13785 }, { "epoch": 0.37, "learning_rate": 0.0014511886183843053, "loss": 2.8428, "step": 13786 }, { "epoch": 0.37, "learning_rate": 0.00145111094040846, "loss": 2.7335, "step": 13787 }, { "epoch": 0.37, "learning_rate": 0.001451033259015079, "loss": 2.4543, "step": 13788 }, { "epoch": 0.37, "learning_rate": 0.0014509555742047505, "loss": 2.5944, "step": 13789 }, { "epoch": 0.37, "learning_rate": 0.0014508778859780632, "loss": 2.5199, "step": 13790 }, { "epoch": 0.37, "learning_rate": 0.0014508001943356055, "loss": 3.0106, "step": 13791 }, { "epoch": 0.37, "learning_rate": 0.0014507224992779664, "loss": 2.1417, "step": 13792 }, { "epoch": 0.37, "learning_rate": 0.001450644800805734, "loss": 2.6353, "step": 13793 }, { "epoch": 0.37, "learning_rate": 0.0014505670989194974, "loss": 2.3671, "step": 13794 }, { "epoch": 0.37, "learning_rate": 0.0014504893936198447, "loss": 2.66, "step": 13795 }, { "epoch": 0.37, "learning_rate": 0.001450411684907365, "loss": 2.6224, "step": 13796 }, { "epoch": 0.37, "learning_rate": 0.001450333972782647, "loss": 2.7724, "step": 13797 }, { "epoch": 0.37, "learning_rate": 0.0014502562572462794, "loss": 2.7982, "step": 13798 }, { "epoch": 0.37, "learning_rate": 0.001450178538298851, "loss": 2.9111, "step": 13799 }, { "epoch": 0.37, "learning_rate": 0.00145010081594095, "loss": 2.2625, "step": 13800 }, { "epoch": 0.37, "learning_rate": 0.0014500230901731662, "loss": 2.835, "step": 13801 }, { "epoch": 0.37, "learning_rate": 0.0014499453609960879, "loss": 2.5597, "step": 13802 }, { "epoch": 0.37, "learning_rate": 0.0014498676284103033, "loss": 2.3749, "step": 13803 }, { "epoch": 0.37, "learning_rate": 0.0014497898924164027, "loss": 2.4435, "step": 13804 }, { "epoch": 0.37, "learning_rate": 0.0014497121530149739, "loss": 2.483, "step": 13805 }, { "epoch": 0.37, "learning_rate": 0.0014496344102066063, "loss": 2.8263, "step": 13806 }, { "epoch": 0.37, "learning_rate": 0.0014495566639918889, "loss": 2.3152, "step": 13807 }, { "epoch": 0.37, "learning_rate": 0.0014494789143714108, "loss": 2.5955, "step": 13808 }, { "epoch": 0.37, "learning_rate": 0.0014494011613457602, "loss": 2.7189, "step": 13809 }, { "epoch": 0.37, "learning_rate": 0.001449323404915527, "loss": 2.1884, "step": 13810 }, { "epoch": 0.37, "learning_rate": 0.0014492456450813003, "loss": 2.3807, "step": 13811 }, { "epoch": 0.37, "learning_rate": 0.001449167881843669, "loss": 2.7194, "step": 13812 }, { "epoch": 0.37, "learning_rate": 0.0014490901152032216, "loss": 2.3261, "step": 13813 }, { "epoch": 0.37, "learning_rate": 0.0014490123451605479, "loss": 2.3967, "step": 13814 }, { "epoch": 0.37, "learning_rate": 0.0014489345717162373, "loss": 2.6651, "step": 13815 }, { "epoch": 0.37, "learning_rate": 0.0014488567948708784, "loss": 2.5254, "step": 13816 }, { "epoch": 0.37, "learning_rate": 0.0014487790146250608, "loss": 2.8927, "step": 13817 }, { "epoch": 0.37, "learning_rate": 0.0014487012309793734, "loss": 1.9543, "step": 13818 }, { "epoch": 0.37, "learning_rate": 0.0014486234439344057, "loss": 2.6223, "step": 13819 }, { "epoch": 0.37, "learning_rate": 0.0014485456534907473, "loss": 2.93, "step": 13820 }, { "epoch": 0.37, "learning_rate": 0.0014484678596489871, "loss": 2.4412, "step": 13821 }, { "epoch": 0.37, "learning_rate": 0.0014483900624097145, "loss": 2.5675, "step": 13822 }, { "epoch": 0.37, "learning_rate": 0.0014483122617735187, "loss": 2.6082, "step": 13823 }, { "epoch": 0.37, "learning_rate": 0.00144823445774099, "loss": 2.5242, "step": 13824 }, { "epoch": 0.37, "learning_rate": 0.0014481566503127166, "loss": 2.5424, "step": 13825 }, { "epoch": 0.37, "learning_rate": 0.0014480788394892886, "loss": 2.7717, "step": 13826 }, { "epoch": 0.37, "learning_rate": 0.0014480010252712957, "loss": 2.7115, "step": 13827 }, { "epoch": 0.37, "learning_rate": 0.0014479232076593268, "loss": 2.4127, "step": 13828 }, { "epoch": 0.37, "learning_rate": 0.001447845386653972, "loss": 2.8983, "step": 13829 }, { "epoch": 0.37, "learning_rate": 0.0014477675622558207, "loss": 2.2714, "step": 13830 }, { "epoch": 0.37, "learning_rate": 0.0014476897344654622, "loss": 2.3627, "step": 13831 }, { "epoch": 0.37, "learning_rate": 0.0014476119032834865, "loss": 2.8632, "step": 13832 }, { "epoch": 0.37, "learning_rate": 0.0014475340687104827, "loss": 2.3915, "step": 13833 }, { "epoch": 0.37, "learning_rate": 0.0014474562307470412, "loss": 2.61, "step": 13834 }, { "epoch": 0.37, "learning_rate": 0.001447378389393751, "loss": 2.8386, "step": 13835 }, { "epoch": 0.37, "learning_rate": 0.0014473005446512023, "loss": 2.4551, "step": 13836 }, { "epoch": 0.37, "learning_rate": 0.0014472226965199847, "loss": 2.4056, "step": 13837 }, { "epoch": 0.37, "learning_rate": 0.0014471448450006877, "loss": 2.428, "step": 13838 }, { "epoch": 0.37, "learning_rate": 0.0014470669900939013, "loss": 2.8612, "step": 13839 }, { "epoch": 0.37, "learning_rate": 0.0014469891318002156, "loss": 2.8105, "step": 13840 }, { "epoch": 0.37, "learning_rate": 0.00144691127012022, "loss": 2.3426, "step": 13841 }, { "epoch": 0.37, "learning_rate": 0.0014468334050545045, "loss": 2.3719, "step": 13842 }, { "epoch": 0.37, "learning_rate": 0.0014467555366036587, "loss": 2.5615, "step": 13843 }, { "epoch": 0.37, "learning_rate": 0.0014466776647682731, "loss": 2.6459, "step": 13844 }, { "epoch": 0.37, "learning_rate": 0.0014465997895489373, "loss": 2.0144, "step": 13845 }, { "epoch": 0.37, "learning_rate": 0.0014465219109462413, "loss": 2.5995, "step": 13846 }, { "epoch": 0.37, "learning_rate": 0.0014464440289607755, "loss": 2.916, "step": 13847 }, { "epoch": 0.37, "learning_rate": 0.0014463661435931293, "loss": 2.6857, "step": 13848 }, { "epoch": 0.37, "learning_rate": 0.0014462882548438927, "loss": 3.1255, "step": 13849 }, { "epoch": 0.37, "learning_rate": 0.0014462103627136565, "loss": 2.9513, "step": 13850 }, { "epoch": 0.37, "learning_rate": 0.0014461324672030106, "loss": 2.7026, "step": 13851 }, { "epoch": 0.37, "learning_rate": 0.0014460545683125444, "loss": 2.6993, "step": 13852 }, { "epoch": 0.37, "learning_rate": 0.0014459766660428483, "loss": 2.7891, "step": 13853 }, { "epoch": 0.37, "learning_rate": 0.0014458987603945133, "loss": 2.2082, "step": 13854 }, { "epoch": 0.37, "learning_rate": 0.0014458208513681288, "loss": 2.2376, "step": 13855 }, { "epoch": 0.37, "learning_rate": 0.001445742938964285, "loss": 2.5705, "step": 13856 }, { "epoch": 0.37, "learning_rate": 0.0014456650231835725, "loss": 2.5868, "step": 13857 }, { "epoch": 0.37, "learning_rate": 0.0014455871040265818, "loss": 2.7338, "step": 13858 }, { "epoch": 0.37, "learning_rate": 0.0014455091814939026, "loss": 2.571, "step": 13859 }, { "epoch": 0.37, "learning_rate": 0.0014454312555861255, "loss": 2.6614, "step": 13860 }, { "epoch": 0.37, "learning_rate": 0.0014453533263038409, "loss": 2.5184, "step": 13861 }, { "epoch": 0.37, "learning_rate": 0.001445275393647639, "loss": 2.523, "step": 13862 }, { "epoch": 0.37, "learning_rate": 0.0014451974576181104, "loss": 2.6675, "step": 13863 }, { "epoch": 0.37, "learning_rate": 0.0014451195182158456, "loss": 2.4899, "step": 13864 }, { "epoch": 0.37, "learning_rate": 0.0014450415754414347, "loss": 2.6994, "step": 13865 }, { "epoch": 0.37, "learning_rate": 0.0014449636292954684, "loss": 2.847, "step": 13866 }, { "epoch": 0.37, "learning_rate": 0.0014448856797785372, "loss": 2.2089, "step": 13867 }, { "epoch": 0.37, "learning_rate": 0.001444807726891232, "loss": 2.5877, "step": 13868 }, { "epoch": 0.37, "learning_rate": 0.0014447297706341425, "loss": 2.6578, "step": 13869 }, { "epoch": 0.37, "learning_rate": 0.00144465181100786, "loss": 2.472, "step": 13870 }, { "epoch": 0.37, "learning_rate": 0.001444573848012975, "loss": 2.6564, "step": 13871 }, { "epoch": 0.37, "learning_rate": 0.0014444958816500774, "loss": 2.5307, "step": 13872 }, { "epoch": 0.37, "learning_rate": 0.0014444179119197588, "loss": 2.6473, "step": 13873 }, { "epoch": 0.37, "learning_rate": 0.00144433993882261, "loss": 2.653, "step": 13874 }, { "epoch": 0.37, "learning_rate": 0.0014442619623592208, "loss": 2.9573, "step": 13875 }, { "epoch": 0.37, "learning_rate": 0.0014441839825301826, "loss": 2.4848, "step": 13876 }, { "epoch": 0.37, "learning_rate": 0.0014441059993360859, "loss": 2.7538, "step": 13877 }, { "epoch": 0.37, "learning_rate": 0.0014440280127775216, "loss": 2.4041, "step": 13878 }, { "epoch": 0.37, "learning_rate": 0.00144395002285508, "loss": 2.9953, "step": 13879 }, { "epoch": 0.37, "learning_rate": 0.001443872029569353, "loss": 2.8173, "step": 13880 }, { "epoch": 0.37, "learning_rate": 0.0014437940329209305, "loss": 2.4697, "step": 13881 }, { "epoch": 0.37, "learning_rate": 0.001443716032910404, "loss": 2.3648, "step": 13882 }, { "epoch": 0.37, "learning_rate": 0.0014436380295383643, "loss": 2.3953, "step": 13883 }, { "epoch": 0.37, "learning_rate": 0.0014435600228054016, "loss": 2.7562, "step": 13884 }, { "epoch": 0.37, "learning_rate": 0.001443482012712108, "loss": 2.6015, "step": 13885 }, { "epoch": 0.37, "learning_rate": 0.0014434039992590737, "loss": 2.5195, "step": 13886 }, { "epoch": 0.37, "learning_rate": 0.00144332598244689, "loss": 2.3704, "step": 13887 }, { "epoch": 0.37, "learning_rate": 0.001443247962276148, "loss": 2.3102, "step": 13888 }, { "epoch": 0.37, "learning_rate": 0.0014431699387474387, "loss": 2.6209, "step": 13889 }, { "epoch": 0.37, "learning_rate": 0.001443091911861353, "loss": 2.7269, "step": 13890 }, { "epoch": 0.37, "learning_rate": 0.0014430138816184826, "loss": 2.6545, "step": 13891 }, { "epoch": 0.37, "learning_rate": 0.0014429358480194177, "loss": 2.3346, "step": 13892 }, { "epoch": 0.37, "learning_rate": 0.0014428578110647504, "loss": 2.4712, "step": 13893 }, { "epoch": 0.37, "learning_rate": 0.0014427797707550715, "loss": 2.5163, "step": 13894 }, { "epoch": 0.37, "learning_rate": 0.0014427017270909719, "loss": 2.3761, "step": 13895 }, { "epoch": 0.37, "learning_rate": 0.0014426236800730433, "loss": 2.5733, "step": 13896 }, { "epoch": 0.37, "learning_rate": 0.001442545629701877, "loss": 2.7811, "step": 13897 }, { "epoch": 0.37, "learning_rate": 0.001442467575978064, "loss": 2.8422, "step": 13898 }, { "epoch": 0.37, "learning_rate": 0.0014423895189021958, "loss": 2.8782, "step": 13899 }, { "epoch": 0.37, "learning_rate": 0.0014423114584748635, "loss": 2.4916, "step": 13900 }, { "epoch": 0.37, "learning_rate": 0.0014422333946966588, "loss": 2.6835, "step": 13901 }, { "epoch": 0.37, "learning_rate": 0.0014421553275681732, "loss": 2.3144, "step": 13902 }, { "epoch": 0.37, "learning_rate": 0.0014420772570899977, "loss": 2.607, "step": 13903 }, { "epoch": 0.37, "learning_rate": 0.0014419991832627238, "loss": 2.2637, "step": 13904 }, { "epoch": 0.37, "learning_rate": 0.0014419211060869431, "loss": 2.6165, "step": 13905 }, { "epoch": 0.37, "learning_rate": 0.0014418430255632472, "loss": 2.2038, "step": 13906 }, { "epoch": 0.37, "learning_rate": 0.0014417649416922278, "loss": 2.0969, "step": 13907 }, { "epoch": 0.37, "learning_rate": 0.001441686854474476, "loss": 2.3626, "step": 13908 }, { "epoch": 0.37, "learning_rate": 0.0014416087639105833, "loss": 2.4883, "step": 13909 }, { "epoch": 0.37, "learning_rate": 0.001441530670001142, "loss": 2.6686, "step": 13910 }, { "epoch": 0.37, "learning_rate": 0.001441452572746743, "loss": 2.9534, "step": 13911 }, { "epoch": 0.37, "learning_rate": 0.001441374472147978, "loss": 3.0757, "step": 13912 }, { "epoch": 0.37, "learning_rate": 0.0014412963682054391, "loss": 2.1494, "step": 13913 }, { "epoch": 0.37, "learning_rate": 0.001441218260919718, "loss": 3.0019, "step": 13914 }, { "epoch": 0.37, "learning_rate": 0.0014411401502914063, "loss": 2.5975, "step": 13915 }, { "epoch": 0.37, "learning_rate": 0.0014410620363210953, "loss": 2.611, "step": 13916 }, { "epoch": 0.37, "learning_rate": 0.0014409839190093776, "loss": 2.7502, "step": 13917 }, { "epoch": 0.37, "learning_rate": 0.001440905798356844, "loss": 3.1212, "step": 13918 }, { "epoch": 0.37, "learning_rate": 0.0014408276743640874, "loss": 2.4973, "step": 13919 }, { "epoch": 0.37, "learning_rate": 0.001440749547031699, "loss": 2.6861, "step": 13920 }, { "epoch": 0.37, "learning_rate": 0.001440671416360271, "loss": 2.6934, "step": 13921 }, { "epoch": 0.37, "learning_rate": 0.0014405932823503948, "loss": 2.16, "step": 13922 }, { "epoch": 0.37, "learning_rate": 0.0014405151450026627, "loss": 2.7317, "step": 13923 }, { "epoch": 0.37, "learning_rate": 0.001440437004317667, "loss": 2.9259, "step": 13924 }, { "epoch": 0.37, "learning_rate": 0.0014403588602959992, "loss": 2.5636, "step": 13925 }, { "epoch": 0.37, "learning_rate": 0.0014402807129382511, "loss": 3.1202, "step": 13926 }, { "epoch": 0.37, "learning_rate": 0.0014402025622450153, "loss": 2.8567, "step": 13927 }, { "epoch": 0.37, "learning_rate": 0.0014401244082168833, "loss": 2.6943, "step": 13928 }, { "epoch": 0.37, "learning_rate": 0.0014400462508544478, "loss": 2.6397, "step": 13929 }, { "epoch": 0.37, "learning_rate": 0.0014399680901583006, "loss": 2.8279, "step": 13930 }, { "epoch": 0.37, "learning_rate": 0.0014398899261290335, "loss": 2.6222, "step": 13931 }, { "epoch": 0.37, "learning_rate": 0.001439811758767239, "loss": 2.5156, "step": 13932 }, { "epoch": 0.37, "learning_rate": 0.0014397335880735095, "loss": 2.8436, "step": 13933 }, { "epoch": 0.37, "learning_rate": 0.0014396554140484368, "loss": 2.1227, "step": 13934 }, { "epoch": 0.37, "learning_rate": 0.001439577236692613, "loss": 2.537, "step": 13935 }, { "epoch": 0.37, "learning_rate": 0.001439499056006631, "loss": 2.7642, "step": 13936 }, { "epoch": 0.37, "learning_rate": 0.001439420871991083, "loss": 2.4336, "step": 13937 }, { "epoch": 0.37, "learning_rate": 0.0014393426846465605, "loss": 2.4406, "step": 13938 }, { "epoch": 0.37, "learning_rate": 0.0014392644939736562, "loss": 2.5093, "step": 13939 }, { "epoch": 0.37, "learning_rate": 0.0014391862999729632, "loss": 2.5978, "step": 13940 }, { "epoch": 0.37, "learning_rate": 0.0014391081026450731, "loss": 2.5586, "step": 13941 }, { "epoch": 0.37, "learning_rate": 0.0014390299019905787, "loss": 2.4166, "step": 13942 }, { "epoch": 0.37, "learning_rate": 0.0014389516980100718, "loss": 2.2847, "step": 13943 }, { "epoch": 0.37, "learning_rate": 0.001438873490704146, "loss": 2.4495, "step": 13944 }, { "epoch": 0.37, "learning_rate": 0.0014387952800733923, "loss": 2.789, "step": 13945 }, { "epoch": 0.37, "learning_rate": 0.0014387170661184045, "loss": 2.3575, "step": 13946 }, { "epoch": 0.37, "learning_rate": 0.0014386388488397746, "loss": 2.1975, "step": 13947 }, { "epoch": 0.37, "learning_rate": 0.001438560628238095, "loss": 2.9442, "step": 13948 }, { "epoch": 0.37, "learning_rate": 0.0014384824043139589, "loss": 2.6005, "step": 13949 }, { "epoch": 0.37, "learning_rate": 0.001438404177067958, "loss": 2.9122, "step": 13950 }, { "epoch": 0.37, "learning_rate": 0.0014383259465006856, "loss": 2.9161, "step": 13951 }, { "epoch": 0.37, "learning_rate": 0.0014382477126127341, "loss": 2.4524, "step": 13952 }, { "epoch": 0.37, "learning_rate": 0.0014381694754046967, "loss": 2.3998, "step": 13953 }, { "epoch": 0.37, "learning_rate": 0.0014380912348771653, "loss": 2.3331, "step": 13954 }, { "epoch": 0.38, "learning_rate": 0.0014380129910307332, "loss": 2.5486, "step": 13955 }, { "epoch": 0.38, "learning_rate": 0.0014379347438659932, "loss": 2.6047, "step": 13956 }, { "epoch": 0.38, "learning_rate": 0.0014378564933835375, "loss": 2.7, "step": 13957 }, { "epoch": 0.38, "learning_rate": 0.0014377782395839592, "loss": 2.6464, "step": 13958 }, { "epoch": 0.38, "learning_rate": 0.0014376999824678514, "loss": 2.6274, "step": 13959 }, { "epoch": 0.38, "learning_rate": 0.001437621722035807, "loss": 2.7139, "step": 13960 }, { "epoch": 0.38, "learning_rate": 0.0014375434582884184, "loss": 3.1125, "step": 13961 }, { "epoch": 0.38, "learning_rate": 0.001437465191226279, "loss": 2.9198, "step": 13962 }, { "epoch": 0.38, "learning_rate": 0.0014373869208499813, "loss": 2.4043, "step": 13963 }, { "epoch": 0.38, "learning_rate": 0.0014373086471601187, "loss": 2.6543, "step": 13964 }, { "epoch": 0.38, "learning_rate": 0.0014372303701572838, "loss": 2.8056, "step": 13965 }, { "epoch": 0.38, "learning_rate": 0.0014371520898420697, "loss": 2.096, "step": 13966 }, { "epoch": 0.38, "learning_rate": 0.0014370738062150696, "loss": 2.7258, "step": 13967 }, { "epoch": 0.38, "learning_rate": 0.0014369955192768766, "loss": 2.5979, "step": 13968 }, { "epoch": 0.38, "learning_rate": 0.0014369172290280838, "loss": 2.5817, "step": 13969 }, { "epoch": 0.38, "learning_rate": 0.0014368389354692838, "loss": 2.4164, "step": 13970 }, { "epoch": 0.38, "learning_rate": 0.0014367606386010703, "loss": 2.2851, "step": 13971 }, { "epoch": 0.38, "learning_rate": 0.0014366823384240363, "loss": 2.8423, "step": 13972 }, { "epoch": 0.38, "learning_rate": 0.0014366040349387751, "loss": 2.2871, "step": 13973 }, { "epoch": 0.38, "learning_rate": 0.0014365257281458797, "loss": 3.019, "step": 13974 }, { "epoch": 0.38, "learning_rate": 0.0014364474180459435, "loss": 2.5985, "step": 13975 }, { "epoch": 0.38, "learning_rate": 0.0014363691046395594, "loss": 2.4183, "step": 13976 }, { "epoch": 0.38, "learning_rate": 0.0014362907879273215, "loss": 2.3458, "step": 13977 }, { "epoch": 0.38, "learning_rate": 0.0014362124679098219, "loss": 2.5843, "step": 13978 }, { "epoch": 0.38, "learning_rate": 0.0014361341445876552, "loss": 2.5552, "step": 13979 }, { "epoch": 0.38, "learning_rate": 0.001436055817961414, "loss": 2.6778, "step": 13980 }, { "epoch": 0.38, "learning_rate": 0.0014359774880316918, "loss": 2.4085, "step": 13981 }, { "epoch": 0.38, "learning_rate": 0.001435899154799082, "loss": 2.3908, "step": 13982 }, { "epoch": 0.38, "learning_rate": 0.0014358208182641786, "loss": 2.1145, "step": 13983 }, { "epoch": 0.38, "learning_rate": 0.001435742478427574, "loss": 2.4148, "step": 13984 }, { "epoch": 0.38, "learning_rate": 0.001435664135289863, "loss": 1.9589, "step": 13985 }, { "epoch": 0.38, "learning_rate": 0.0014355857888516377, "loss": 2.1461, "step": 13986 }, { "epoch": 0.38, "learning_rate": 0.001435507439113493, "loss": 2.7503, "step": 13987 }, { "epoch": 0.38, "learning_rate": 0.001435429086076021, "loss": 2.718, "step": 13988 }, { "epoch": 0.38, "learning_rate": 0.0014353507297398167, "loss": 2.3816, "step": 13989 }, { "epoch": 0.38, "learning_rate": 0.0014352723701054728, "loss": 2.7835, "step": 13990 }, { "epoch": 0.38, "learning_rate": 0.0014351940071735834, "loss": 2.6146, "step": 13991 }, { "epoch": 0.38, "learning_rate": 0.0014351156409447422, "loss": 2.5596, "step": 13992 }, { "epoch": 0.38, "learning_rate": 0.0014350372714195423, "loss": 2.4903, "step": 13993 }, { "epoch": 0.38, "learning_rate": 0.001434958898598578, "loss": 2.9173, "step": 13994 }, { "epoch": 0.38, "learning_rate": 0.0014348805224824429, "loss": 2.4659, "step": 13995 }, { "epoch": 0.38, "learning_rate": 0.0014348021430717307, "loss": 2.755, "step": 13996 }, { "epoch": 0.38, "learning_rate": 0.0014347237603670351, "loss": 2.47, "step": 13997 }, { "epoch": 0.38, "learning_rate": 0.00143464537436895, "loss": 2.8202, "step": 13998 }, { "epoch": 0.38, "learning_rate": 0.0014345669850780694, "loss": 2.4241, "step": 13999 }, { "epoch": 0.38, "learning_rate": 0.001434488592494987, "loss": 2.5283, "step": 14000 }, { "epoch": 0.38, "learning_rate": 0.0014344101966202963, "loss": 2.7255, "step": 14001 }, { "epoch": 0.38, "learning_rate": 0.001434331797454592, "loss": 2.2646, "step": 14002 }, { "epoch": 0.38, "learning_rate": 0.0014342533949984677, "loss": 2.3918, "step": 14003 }, { "epoch": 0.38, "learning_rate": 0.0014341749892525172, "loss": 1.9612, "step": 14004 }, { "epoch": 0.38, "learning_rate": 0.0014340965802173344, "loss": 2.6323, "step": 14005 }, { "epoch": 0.38, "learning_rate": 0.001434018167893514, "loss": 2.6449, "step": 14006 }, { "epoch": 0.38, "learning_rate": 0.001433939752281649, "loss": 2.6912, "step": 14007 }, { "epoch": 0.38, "learning_rate": 0.0014338613333823346, "loss": 2.3998, "step": 14008 }, { "epoch": 0.38, "learning_rate": 0.0014337829111961639, "loss": 2.2497, "step": 14009 }, { "epoch": 0.38, "learning_rate": 0.0014337044857237315, "loss": 2.3089, "step": 14010 }, { "epoch": 0.38, "learning_rate": 0.0014336260569656316, "loss": 2.6511, "step": 14011 }, { "epoch": 0.38, "learning_rate": 0.0014335476249224583, "loss": 2.5967, "step": 14012 }, { "epoch": 0.38, "learning_rate": 0.0014334691895948053, "loss": 2.4794, "step": 14013 }, { "epoch": 0.38, "learning_rate": 0.0014333907509832674, "loss": 2.1277, "step": 14014 }, { "epoch": 0.38, "learning_rate": 0.0014333123090884388, "loss": 2.321, "step": 14015 }, { "epoch": 0.38, "learning_rate": 0.0014332338639109134, "loss": 2.3226, "step": 14016 }, { "epoch": 0.38, "learning_rate": 0.0014331554154512858, "loss": 2.4648, "step": 14017 }, { "epoch": 0.38, "learning_rate": 0.0014330769637101502, "loss": 2.9747, "step": 14018 }, { "epoch": 0.38, "learning_rate": 0.001432998508688101, "loss": 2.7971, "step": 14019 }, { "epoch": 0.38, "learning_rate": 0.0014329200503857323, "loss": 2.2418, "step": 14020 }, { "epoch": 0.38, "learning_rate": 0.001432841588803639, "loss": 2.8473, "step": 14021 }, { "epoch": 0.38, "learning_rate": 0.001432763123942415, "loss": 2.555, "step": 14022 }, { "epoch": 0.38, "learning_rate": 0.001432684655802655, "loss": 2.5619, "step": 14023 }, { "epoch": 0.38, "learning_rate": 0.0014326061843849534, "loss": 2.4191, "step": 14024 }, { "epoch": 0.38, "learning_rate": 0.0014325277096899048, "loss": 2.2538, "step": 14025 }, { "epoch": 0.38, "learning_rate": 0.0014324492317181034, "loss": 2.7286, "step": 14026 }, { "epoch": 0.38, "learning_rate": 0.001432370750470144, "loss": 2.3362, "step": 14027 }, { "epoch": 0.38, "learning_rate": 0.0014322922659466212, "loss": 2.5774, "step": 14028 }, { "epoch": 0.38, "learning_rate": 0.0014322137781481294, "loss": 2.562, "step": 14029 }, { "epoch": 0.38, "learning_rate": 0.0014321352870752635, "loss": 2.7476, "step": 14030 }, { "epoch": 0.38, "learning_rate": 0.0014320567927286177, "loss": 2.671, "step": 14031 }, { "epoch": 0.38, "learning_rate": 0.0014319782951087868, "loss": 3.0805, "step": 14032 }, { "epoch": 0.38, "learning_rate": 0.0014318997942163658, "loss": 2.0752, "step": 14033 }, { "epoch": 0.38, "learning_rate": 0.001431821290051949, "loss": 2.7634, "step": 14034 }, { "epoch": 0.38, "learning_rate": 0.0014317427826161314, "loss": 2.656, "step": 14035 }, { "epoch": 0.38, "learning_rate": 0.0014316642719095077, "loss": 2.7551, "step": 14036 }, { "epoch": 0.38, "learning_rate": 0.0014315857579326723, "loss": 2.296, "step": 14037 }, { "epoch": 0.38, "learning_rate": 0.0014315072406862208, "loss": 2.7005, "step": 14038 }, { "epoch": 0.38, "learning_rate": 0.0014314287201707477, "loss": 2.5721, "step": 14039 }, { "epoch": 0.38, "learning_rate": 0.0014313501963868474, "loss": 2.7969, "step": 14040 }, { "epoch": 0.38, "learning_rate": 0.0014312716693351151, "loss": 2.4554, "step": 14041 }, { "epoch": 0.38, "learning_rate": 0.001431193139016146, "loss": 2.5715, "step": 14042 }, { "epoch": 0.38, "learning_rate": 0.0014311146054305345, "loss": 3.1521, "step": 14043 }, { "epoch": 0.38, "learning_rate": 0.0014310360685788758, "loss": 2.5104, "step": 14044 }, { "epoch": 0.38, "learning_rate": 0.001430957528461765, "loss": 2.4975, "step": 14045 }, { "epoch": 0.38, "learning_rate": 0.0014308789850797973, "loss": 2.5645, "step": 14046 }, { "epoch": 0.38, "learning_rate": 0.001430800438433567, "loss": 2.8154, "step": 14047 }, { "epoch": 0.38, "learning_rate": 0.0014307218885236698, "loss": 2.6737, "step": 14048 }, { "epoch": 0.38, "learning_rate": 0.0014306433353507007, "loss": 3.0817, "step": 14049 }, { "epoch": 0.38, "learning_rate": 0.0014305647789152544, "loss": 2.123, "step": 14050 }, { "epoch": 0.38, "learning_rate": 0.0014304862192179267, "loss": 2.4132, "step": 14051 }, { "epoch": 0.38, "learning_rate": 0.001430407656259312, "loss": 2.3566, "step": 14052 }, { "epoch": 0.38, "learning_rate": 0.0014303290900400062, "loss": 3.0587, "step": 14053 }, { "epoch": 0.38, "learning_rate": 0.0014302505205606038, "loss": 2.979, "step": 14054 }, { "epoch": 0.38, "learning_rate": 0.0014301719478217007, "loss": 2.4464, "step": 14055 }, { "epoch": 0.38, "learning_rate": 0.0014300933718238915, "loss": 2.7463, "step": 14056 }, { "epoch": 0.38, "learning_rate": 0.0014300147925677717, "loss": 2.3922, "step": 14057 }, { "epoch": 0.38, "learning_rate": 0.0014299362100539373, "loss": 2.4027, "step": 14058 }, { "epoch": 0.38, "learning_rate": 0.0014298576242829828, "loss": 2.8717, "step": 14059 }, { "epoch": 0.38, "learning_rate": 0.0014297790352555035, "loss": 2.3536, "step": 14060 }, { "epoch": 0.38, "learning_rate": 0.0014297004429720953, "loss": 2.6391, "step": 14061 }, { "epoch": 0.38, "learning_rate": 0.0014296218474333534, "loss": 2.9391, "step": 14062 }, { "epoch": 0.38, "learning_rate": 0.001429543248639873, "loss": 2.9828, "step": 14063 }, { "epoch": 0.38, "learning_rate": 0.0014294646465922499, "loss": 2.8467, "step": 14064 }, { "epoch": 0.38, "learning_rate": 0.0014293860412910794, "loss": 2.8085, "step": 14065 }, { "epoch": 0.38, "learning_rate": 0.001429307432736957, "loss": 2.8263, "step": 14066 }, { "epoch": 0.38, "learning_rate": 0.001429228820930478, "loss": 2.4605, "step": 14067 }, { "epoch": 0.38, "learning_rate": 0.0014291502058722389, "loss": 2.2899, "step": 14068 }, { "epoch": 0.38, "learning_rate": 0.001429071587562834, "loss": 2.5133, "step": 14069 }, { "epoch": 0.38, "learning_rate": 0.0014289929660028595, "loss": 2.3196, "step": 14070 }, { "epoch": 0.38, "learning_rate": 0.001428914341192911, "loss": 2.507, "step": 14071 }, { "epoch": 0.38, "learning_rate": 0.0014288357131335843, "loss": 2.6578, "step": 14072 }, { "epoch": 0.38, "learning_rate": 0.0014287570818254747, "loss": 2.6362, "step": 14073 }, { "epoch": 0.38, "learning_rate": 0.0014286784472691784, "loss": 2.9383, "step": 14074 }, { "epoch": 0.38, "learning_rate": 0.0014285998094652904, "loss": 2.4195, "step": 14075 }, { "epoch": 0.38, "learning_rate": 0.0014285211684144073, "loss": 2.4702, "step": 14076 }, { "epoch": 0.38, "learning_rate": 0.0014284425241171239, "loss": 2.4307, "step": 14077 }, { "epoch": 0.38, "learning_rate": 0.001428363876574037, "loss": 2.3582, "step": 14078 }, { "epoch": 0.38, "learning_rate": 0.001428285225785742, "loss": 2.4987, "step": 14079 }, { "epoch": 0.38, "learning_rate": 0.0014282065717528343, "loss": 2.5285, "step": 14080 }, { "epoch": 0.38, "learning_rate": 0.0014281279144759105, "loss": 2.5763, "step": 14081 }, { "epoch": 0.38, "learning_rate": 0.001428049253955566, "loss": 2.7827, "step": 14082 }, { "epoch": 0.38, "learning_rate": 0.0014279705901923969, "loss": 2.5582, "step": 14083 }, { "epoch": 0.38, "learning_rate": 0.0014278919231869992, "loss": 2.4876, "step": 14084 }, { "epoch": 0.38, "learning_rate": 0.0014278132529399689, "loss": 2.4728, "step": 14085 }, { "epoch": 0.38, "learning_rate": 0.0014277345794519016, "loss": 2.8178, "step": 14086 }, { "epoch": 0.38, "learning_rate": 0.0014276559027233935, "loss": 2.9079, "step": 14087 }, { "epoch": 0.38, "learning_rate": 0.0014275772227550412, "loss": 2.3413, "step": 14088 }, { "epoch": 0.38, "learning_rate": 0.00142749853954744, "loss": 2.7523, "step": 14089 }, { "epoch": 0.38, "learning_rate": 0.0014274198531011863, "loss": 2.2996, "step": 14090 }, { "epoch": 0.38, "learning_rate": 0.0014273411634168763, "loss": 2.2446, "step": 14091 }, { "epoch": 0.38, "learning_rate": 0.0014272624704951063, "loss": 2.481, "step": 14092 }, { "epoch": 0.38, "learning_rate": 0.0014271837743364717, "loss": 2.5395, "step": 14093 }, { "epoch": 0.38, "learning_rate": 0.0014271050749415696, "loss": 2.5381, "step": 14094 }, { "epoch": 0.38, "learning_rate": 0.0014270263723109955, "loss": 2.7082, "step": 14095 }, { "epoch": 0.38, "learning_rate": 0.0014269476664453462, "loss": 2.1173, "step": 14096 }, { "epoch": 0.38, "learning_rate": 0.0014268689573452176, "loss": 2.6487, "step": 14097 }, { "epoch": 0.38, "learning_rate": 0.001426790245011206, "loss": 2.1398, "step": 14098 }, { "epoch": 0.38, "learning_rate": 0.001426711529443908, "loss": 2.7118, "step": 14099 }, { "epoch": 0.38, "learning_rate": 0.0014266328106439196, "loss": 2.8063, "step": 14100 }, { "epoch": 0.38, "learning_rate": 0.0014265540886118373, "loss": 2.4277, "step": 14101 }, { "epoch": 0.38, "learning_rate": 0.0014264753633482577, "loss": 2.4888, "step": 14102 }, { "epoch": 0.38, "learning_rate": 0.0014263966348537765, "loss": 2.8174, "step": 14103 }, { "epoch": 0.38, "learning_rate": 0.001426317903128991, "loss": 2.8136, "step": 14104 }, { "epoch": 0.38, "learning_rate": 0.0014262391681744973, "loss": 2.5531, "step": 14105 }, { "epoch": 0.38, "learning_rate": 0.0014261604299908917, "loss": 2.3773, "step": 14106 }, { "epoch": 0.38, "learning_rate": 0.0014260816885787709, "loss": 2.8574, "step": 14107 }, { "epoch": 0.38, "learning_rate": 0.0014260029439387316, "loss": 2.7379, "step": 14108 }, { "epoch": 0.38, "learning_rate": 0.0014259241960713701, "loss": 2.8805, "step": 14109 }, { "epoch": 0.38, "learning_rate": 0.001425845444977283, "loss": 2.6156, "step": 14110 }, { "epoch": 0.38, "learning_rate": 0.0014257666906570667, "loss": 2.9112, "step": 14111 }, { "epoch": 0.38, "learning_rate": 0.0014256879331113186, "loss": 2.5877, "step": 14112 }, { "epoch": 0.38, "learning_rate": 0.0014256091723406344, "loss": 2.5109, "step": 14113 }, { "epoch": 0.38, "learning_rate": 0.0014255304083456114, "loss": 2.4033, "step": 14114 }, { "epoch": 0.38, "learning_rate": 0.001425451641126846, "loss": 2.3657, "step": 14115 }, { "epoch": 0.38, "learning_rate": 0.001425372870684935, "loss": 2.4211, "step": 14116 }, { "epoch": 0.38, "learning_rate": 0.0014252940970204753, "loss": 3.0335, "step": 14117 }, { "epoch": 0.38, "learning_rate": 0.0014252153201340634, "loss": 2.8368, "step": 14118 }, { "epoch": 0.38, "learning_rate": 0.0014251365400262963, "loss": 2.775, "step": 14119 }, { "epoch": 0.38, "learning_rate": 0.001425057756697771, "loss": 2.4956, "step": 14120 }, { "epoch": 0.38, "learning_rate": 0.0014249789701490838, "loss": 2.5123, "step": 14121 }, { "epoch": 0.38, "learning_rate": 0.0014249001803808322, "loss": 2.4802, "step": 14122 }, { "epoch": 0.38, "learning_rate": 0.0014248213873936124, "loss": 2.6933, "step": 14123 }, { "epoch": 0.38, "learning_rate": 0.001424742591188022, "loss": 2.3045, "step": 14124 }, { "epoch": 0.38, "learning_rate": 0.0014246637917646578, "loss": 2.3284, "step": 14125 }, { "epoch": 0.38, "learning_rate": 0.0014245849891241164, "loss": 2.2444, "step": 14126 }, { "epoch": 0.38, "learning_rate": 0.001424506183266995, "loss": 2.759, "step": 14127 }, { "epoch": 0.38, "learning_rate": 0.001424427374193891, "loss": 3.2101, "step": 14128 }, { "epoch": 0.38, "learning_rate": 0.0014243485619054007, "loss": 2.8047, "step": 14129 }, { "epoch": 0.38, "learning_rate": 0.0014242697464021217, "loss": 2.7917, "step": 14130 }, { "epoch": 0.38, "learning_rate": 0.001424190927684651, "loss": 2.5878, "step": 14131 }, { "epoch": 0.38, "learning_rate": 0.0014241121057535857, "loss": 2.6008, "step": 14132 }, { "epoch": 0.38, "learning_rate": 0.001424033280609523, "loss": 2.5453, "step": 14133 }, { "epoch": 0.38, "learning_rate": 0.0014239544522530595, "loss": 2.3465, "step": 14134 }, { "epoch": 0.38, "learning_rate": 0.0014238756206847933, "loss": 2.3727, "step": 14135 }, { "epoch": 0.38, "learning_rate": 0.0014237967859053208, "loss": 2.355, "step": 14136 }, { "epoch": 0.38, "learning_rate": 0.0014237179479152401, "loss": 2.5471, "step": 14137 }, { "epoch": 0.38, "learning_rate": 0.0014236391067151478, "loss": 2.3022, "step": 14138 }, { "epoch": 0.38, "learning_rate": 0.0014235602623056413, "loss": 2.4862, "step": 14139 }, { "epoch": 0.38, "learning_rate": 0.001423481414687318, "loss": 2.8672, "step": 14140 }, { "epoch": 0.38, "learning_rate": 0.0014234025638607752, "loss": 2.3225, "step": 14141 }, { "epoch": 0.38, "learning_rate": 0.0014233237098266102, "loss": 2.6456, "step": 14142 }, { "epoch": 0.38, "learning_rate": 0.0014232448525854206, "loss": 2.7519, "step": 14143 }, { "epoch": 0.38, "learning_rate": 0.0014231659921378037, "loss": 2.6827, "step": 14144 }, { "epoch": 0.38, "learning_rate": 0.0014230871284843568, "loss": 2.3534, "step": 14145 }, { "epoch": 0.38, "learning_rate": 0.0014230082616256774, "loss": 2.3963, "step": 14146 }, { "epoch": 0.38, "learning_rate": 0.0014229293915623631, "loss": 2.7914, "step": 14147 }, { "epoch": 0.38, "learning_rate": 0.0014228505182950115, "loss": 2.8908, "step": 14148 }, { "epoch": 0.38, "learning_rate": 0.0014227716418242198, "loss": 2.1251, "step": 14149 }, { "epoch": 0.38, "learning_rate": 0.0014226927621505856, "loss": 2.6183, "step": 14150 }, { "epoch": 0.38, "learning_rate": 0.001422613879274707, "loss": 2.8141, "step": 14151 }, { "epoch": 0.38, "learning_rate": 0.0014225349931971808, "loss": 2.9382, "step": 14152 }, { "epoch": 0.38, "learning_rate": 0.0014224561039186052, "loss": 2.583, "step": 14153 }, { "epoch": 0.38, "learning_rate": 0.0014223772114395777, "loss": 2.6788, "step": 14154 }, { "epoch": 0.38, "learning_rate": 0.001422298315760696, "loss": 2.5298, "step": 14155 }, { "epoch": 0.38, "learning_rate": 0.0014222194168825577, "loss": 2.9283, "step": 14156 }, { "epoch": 0.38, "learning_rate": 0.0014221405148057604, "loss": 2.528, "step": 14157 }, { "epoch": 0.38, "learning_rate": 0.0014220616095309024, "loss": 2.611, "step": 14158 }, { "epoch": 0.38, "learning_rate": 0.0014219827010585808, "loss": 2.3703, "step": 14159 }, { "epoch": 0.38, "learning_rate": 0.001421903789389394, "loss": 2.4706, "step": 14160 }, { "epoch": 0.38, "learning_rate": 0.0014218248745239393, "loss": 2.4173, "step": 14161 }, { "epoch": 0.38, "learning_rate": 0.0014217459564628148, "loss": 2.4762, "step": 14162 }, { "epoch": 0.38, "learning_rate": 0.0014216670352066184, "loss": 2.4756, "step": 14163 }, { "epoch": 0.38, "learning_rate": 0.001421588110755948, "loss": 2.6739, "step": 14164 }, { "epoch": 0.38, "learning_rate": 0.001421509183111401, "loss": 2.3358, "step": 14165 }, { "epoch": 0.38, "learning_rate": 0.001421430252273576, "loss": 2.6671, "step": 14166 }, { "epoch": 0.38, "learning_rate": 0.0014213513182430712, "loss": 2.3723, "step": 14167 }, { "epoch": 0.38, "learning_rate": 0.0014212723810204837, "loss": 2.5049, "step": 14168 }, { "epoch": 0.38, "learning_rate": 0.0014211934406064119, "loss": 2.4481, "step": 14169 }, { "epoch": 0.38, "learning_rate": 0.0014211144970014541, "loss": 2.6156, "step": 14170 }, { "epoch": 0.38, "learning_rate": 0.0014210355502062082, "loss": 2.7962, "step": 14171 }, { "epoch": 0.38, "learning_rate": 0.0014209566002212721, "loss": 2.8562, "step": 14172 }, { "epoch": 0.38, "learning_rate": 0.001420877647047244, "loss": 2.4437, "step": 14173 }, { "epoch": 0.38, "learning_rate": 0.0014207986906847223, "loss": 2.4466, "step": 14174 }, { "epoch": 0.38, "learning_rate": 0.001420719731134305, "loss": 2.5896, "step": 14175 }, { "epoch": 0.38, "learning_rate": 0.00142064076839659, "loss": 2.7014, "step": 14176 }, { "epoch": 0.38, "learning_rate": 0.0014205618024721758, "loss": 3.0222, "step": 14177 }, { "epoch": 0.38, "learning_rate": 0.0014204828333616608, "loss": 2.4151, "step": 14178 }, { "epoch": 0.38, "learning_rate": 0.0014204038610656426, "loss": 2.2475, "step": 14179 }, { "epoch": 0.38, "learning_rate": 0.00142032488558472, "loss": 2.5595, "step": 14180 }, { "epoch": 0.38, "learning_rate": 0.0014202459069194914, "loss": 2.8052, "step": 14181 }, { "epoch": 0.38, "learning_rate": 0.001420166925070555, "loss": 2.856, "step": 14182 }, { "epoch": 0.38, "learning_rate": 0.001420087940038509, "loss": 2.5216, "step": 14183 }, { "epoch": 0.38, "learning_rate": 0.0014200089518239519, "loss": 2.1738, "step": 14184 }, { "epoch": 0.38, "learning_rate": 0.0014199299604274822, "loss": 2.956, "step": 14185 }, { "epoch": 0.38, "learning_rate": 0.0014198509658496978, "loss": 2.2986, "step": 14186 }, { "epoch": 0.38, "learning_rate": 0.001419771968091198, "loss": 3.0927, "step": 14187 }, { "epoch": 0.38, "learning_rate": 0.0014196929671525804, "loss": 2.369, "step": 14188 }, { "epoch": 0.38, "learning_rate": 0.0014196139630344442, "loss": 2.396, "step": 14189 }, { "epoch": 0.38, "learning_rate": 0.0014195349557373875, "loss": 2.3455, "step": 14190 }, { "epoch": 0.38, "learning_rate": 0.0014194559452620093, "loss": 2.4976, "step": 14191 }, { "epoch": 0.38, "learning_rate": 0.0014193769316089076, "loss": 3.1285, "step": 14192 }, { "epoch": 0.38, "learning_rate": 0.0014192979147786811, "loss": 2.7398, "step": 14193 }, { "epoch": 0.38, "learning_rate": 0.0014192188947719287, "loss": 2.6321, "step": 14194 }, { "epoch": 0.38, "learning_rate": 0.0014191398715892487, "loss": 2.7137, "step": 14195 }, { "epoch": 0.38, "learning_rate": 0.0014190608452312402, "loss": 2.3988, "step": 14196 }, { "epoch": 0.38, "learning_rate": 0.0014189818156985017, "loss": 2.7001, "step": 14197 }, { "epoch": 0.38, "learning_rate": 0.001418902782991632, "loss": 2.4619, "step": 14198 }, { "epoch": 0.38, "learning_rate": 0.0014188237471112293, "loss": 2.574, "step": 14199 }, { "epoch": 0.38, "learning_rate": 0.0014187447080578927, "loss": 2.8307, "step": 14200 }, { "epoch": 0.38, "learning_rate": 0.0014186656658322218, "loss": 2.5214, "step": 14201 }, { "epoch": 0.38, "learning_rate": 0.0014185866204348139, "loss": 2.4383, "step": 14202 }, { "epoch": 0.38, "learning_rate": 0.001418507571866269, "loss": 2.6049, "step": 14203 }, { "epoch": 0.38, "learning_rate": 0.0014184285201271855, "loss": 2.8189, "step": 14204 }, { "epoch": 0.38, "learning_rate": 0.0014183494652181623, "loss": 2.9636, "step": 14205 }, { "epoch": 0.38, "learning_rate": 0.0014182704071397983, "loss": 2.8453, "step": 14206 }, { "epoch": 0.38, "learning_rate": 0.0014181913458926926, "loss": 2.4157, "step": 14207 }, { "epoch": 0.38, "learning_rate": 0.0014181122814774438, "loss": 2.5427, "step": 14208 }, { "epoch": 0.38, "learning_rate": 0.0014180332138946513, "loss": 2.7738, "step": 14209 }, { "epoch": 0.38, "learning_rate": 0.0014179541431449136, "loss": 2.8322, "step": 14210 }, { "epoch": 0.38, "learning_rate": 0.0014178750692288306, "loss": 2.6001, "step": 14211 }, { "epoch": 0.38, "learning_rate": 0.001417795992147, "loss": 2.3763, "step": 14212 }, { "epoch": 0.38, "learning_rate": 0.0014177169119000224, "loss": 2.0878, "step": 14213 }, { "epoch": 0.38, "learning_rate": 0.0014176378284884961, "loss": 2.7001, "step": 14214 }, { "epoch": 0.38, "learning_rate": 0.0014175587419130197, "loss": 2.8133, "step": 14215 }, { "epoch": 0.38, "learning_rate": 0.0014174796521741935, "loss": 2.5298, "step": 14216 }, { "epoch": 0.38, "learning_rate": 0.001417400559272616, "loss": 2.6159, "step": 14217 }, { "epoch": 0.38, "learning_rate": 0.0014173214632088864, "loss": 2.6, "step": 14218 }, { "epoch": 0.38, "learning_rate": 0.0014172423639836037, "loss": 2.2197, "step": 14219 }, { "epoch": 0.38, "learning_rate": 0.0014171632615973678, "loss": 2.2561, "step": 14220 }, { "epoch": 0.38, "learning_rate": 0.0014170841560507776, "loss": 2.2417, "step": 14221 }, { "epoch": 0.38, "learning_rate": 0.0014170050473444322, "loss": 2.6309, "step": 14222 }, { "epoch": 0.38, "learning_rate": 0.0014169259354789312, "loss": 2.7053, "step": 14223 }, { "epoch": 0.38, "learning_rate": 0.0014168468204548742, "loss": 2.3505, "step": 14224 }, { "epoch": 0.38, "learning_rate": 0.0014167677022728596, "loss": 2.1571, "step": 14225 }, { "epoch": 0.38, "learning_rate": 0.0014166885809334879, "loss": 2.4962, "step": 14226 }, { "epoch": 0.38, "learning_rate": 0.0014166094564373576, "loss": 2.1623, "step": 14227 }, { "epoch": 0.38, "learning_rate": 0.001416530328785069, "loss": 2.5939, "step": 14228 }, { "epoch": 0.38, "learning_rate": 0.0014164511979772208, "loss": 2.8734, "step": 14229 }, { "epoch": 0.38, "learning_rate": 0.0014163720640144129, "loss": 2.2721, "step": 14230 }, { "epoch": 0.38, "learning_rate": 0.0014162929268972447, "loss": 2.7266, "step": 14231 }, { "epoch": 0.38, "learning_rate": 0.0014162137866263155, "loss": 2.687, "step": 14232 }, { "epoch": 0.38, "learning_rate": 0.0014161346432022253, "loss": 2.6509, "step": 14233 }, { "epoch": 0.38, "learning_rate": 0.0014160554966255734, "loss": 3.0868, "step": 14234 }, { "epoch": 0.38, "learning_rate": 0.001415976346896959, "loss": 2.7695, "step": 14235 }, { "epoch": 0.38, "learning_rate": 0.0014158971940169828, "loss": 2.4906, "step": 14236 }, { "epoch": 0.38, "learning_rate": 0.0014158180379862436, "loss": 2.5717, "step": 14237 }, { "epoch": 0.38, "learning_rate": 0.0014157388788053412, "loss": 2.847, "step": 14238 }, { "epoch": 0.38, "learning_rate": 0.0014156597164748752, "loss": 2.6415, "step": 14239 }, { "epoch": 0.38, "learning_rate": 0.001415580550995446, "loss": 2.7473, "step": 14240 }, { "epoch": 0.38, "learning_rate": 0.0014155013823676525, "loss": 2.8314, "step": 14241 }, { "epoch": 0.38, "learning_rate": 0.001415422210592095, "loss": 2.766, "step": 14242 }, { "epoch": 0.38, "learning_rate": 0.0014153430356693727, "loss": 3.1398, "step": 14243 }, { "epoch": 0.38, "learning_rate": 0.0014152638576000862, "loss": 2.5413, "step": 14244 }, { "epoch": 0.38, "learning_rate": 0.0014151846763848347, "loss": 2.4894, "step": 14245 }, { "epoch": 0.38, "learning_rate": 0.0014151054920242187, "loss": 2.6616, "step": 14246 }, { "epoch": 0.38, "learning_rate": 0.0014150263045188374, "loss": 2.5802, "step": 14247 }, { "epoch": 0.38, "learning_rate": 0.0014149471138692911, "loss": 2.5843, "step": 14248 }, { "epoch": 0.38, "learning_rate": 0.0014148679200761797, "loss": 2.6434, "step": 14249 }, { "epoch": 0.38, "learning_rate": 0.001414788723140103, "loss": 2.2436, "step": 14250 }, { "epoch": 0.38, "learning_rate": 0.0014147095230616614, "loss": 2.4193, "step": 14251 }, { "epoch": 0.38, "learning_rate": 0.0014146303198414542, "loss": 2.8862, "step": 14252 }, { "epoch": 0.38, "learning_rate": 0.001414551113480082, "loss": 2.7564, "step": 14253 }, { "epoch": 0.38, "learning_rate": 0.0014144719039781446, "loss": 2.5717, "step": 14254 }, { "epoch": 0.38, "learning_rate": 0.0014143926913362422, "loss": 2.8659, "step": 14255 }, { "epoch": 0.38, "learning_rate": 0.001414313475554975, "loss": 2.9028, "step": 14256 }, { "epoch": 0.38, "learning_rate": 0.0014142342566349428, "loss": 2.5881, "step": 14257 }, { "epoch": 0.38, "learning_rate": 0.001414155034576746, "loss": 2.0863, "step": 14258 }, { "epoch": 0.38, "learning_rate": 0.0014140758093809844, "loss": 2.5029, "step": 14259 }, { "epoch": 0.38, "learning_rate": 0.001413996581048259, "loss": 2.8115, "step": 14260 }, { "epoch": 0.38, "learning_rate": 0.0014139173495791692, "loss": 2.3217, "step": 14261 }, { "epoch": 0.38, "learning_rate": 0.0014138381149743156, "loss": 2.5061, "step": 14262 }, { "epoch": 0.38, "learning_rate": 0.0014137588772342986, "loss": 2.2662, "step": 14263 }, { "epoch": 0.38, "learning_rate": 0.0014136796363597183, "loss": 2.8573, "step": 14264 }, { "epoch": 0.38, "learning_rate": 0.0014136003923511749, "loss": 2.5432, "step": 14265 }, { "epoch": 0.38, "learning_rate": 0.001413521145209269, "loss": 2.7355, "step": 14266 }, { "epoch": 0.38, "learning_rate": 0.0014134418949346007, "loss": 2.7499, "step": 14267 }, { "epoch": 0.38, "learning_rate": 0.0014133626415277704, "loss": 2.2767, "step": 14268 }, { "epoch": 0.38, "learning_rate": 0.001413283384989379, "loss": 2.2541, "step": 14269 }, { "epoch": 0.38, "learning_rate": 0.0014132041253200262, "loss": 2.2885, "step": 14270 }, { "epoch": 0.38, "learning_rate": 0.0014131248625203132, "loss": 2.6164, "step": 14271 }, { "epoch": 0.38, "learning_rate": 0.0014130455965908398, "loss": 2.3829, "step": 14272 }, { "epoch": 0.38, "learning_rate": 0.001412966327532207, "loss": 2.4362, "step": 14273 }, { "epoch": 0.38, "learning_rate": 0.0014128870553450149, "loss": 2.1354, "step": 14274 }, { "epoch": 0.38, "learning_rate": 0.0014128077800298641, "loss": 2.6443, "step": 14275 }, { "epoch": 0.38, "learning_rate": 0.0014127285015873559, "loss": 2.7726, "step": 14276 }, { "epoch": 0.38, "learning_rate": 0.0014126492200180903, "loss": 2.6347, "step": 14277 }, { "epoch": 0.38, "learning_rate": 0.0014125699353226674, "loss": 2.5511, "step": 14278 }, { "epoch": 0.38, "learning_rate": 0.0014124906475016892, "loss": 2.5385, "step": 14279 }, { "epoch": 0.38, "learning_rate": 0.0014124113565557553, "loss": 2.4195, "step": 14280 }, { "epoch": 0.38, "learning_rate": 0.0014123320624854665, "loss": 3.0874, "step": 14281 }, { "epoch": 0.38, "learning_rate": 0.0014122527652914237, "loss": 2.5873, "step": 14282 }, { "epoch": 0.38, "learning_rate": 0.001412173464974228, "loss": 2.4143, "step": 14283 }, { "epoch": 0.38, "learning_rate": 0.0014120941615344798, "loss": 2.5207, "step": 14284 }, { "epoch": 0.38, "learning_rate": 0.0014120148549727795, "loss": 2.7741, "step": 14285 }, { "epoch": 0.38, "learning_rate": 0.0014119355452897287, "loss": 3.0015, "step": 14286 }, { "epoch": 0.38, "learning_rate": 0.0014118562324859276, "loss": 2.9582, "step": 14287 }, { "epoch": 0.38, "learning_rate": 0.0014117769165619774, "loss": 2.4263, "step": 14288 }, { "epoch": 0.38, "learning_rate": 0.0014116975975184789, "loss": 2.4827, "step": 14289 }, { "epoch": 0.38, "learning_rate": 0.0014116182753560332, "loss": 2.5041, "step": 14290 }, { "epoch": 0.38, "learning_rate": 0.0014115389500752406, "loss": 2.8545, "step": 14291 }, { "epoch": 0.38, "learning_rate": 0.0014114596216767028, "loss": 2.5188, "step": 14292 }, { "epoch": 0.38, "learning_rate": 0.0014113802901610205, "loss": 2.4297, "step": 14293 }, { "epoch": 0.38, "learning_rate": 0.0014113009555287946, "loss": 2.7245, "step": 14294 }, { "epoch": 0.38, "learning_rate": 0.0014112216177806262, "loss": 2.3979, "step": 14295 }, { "epoch": 0.38, "learning_rate": 0.0014111422769171164, "loss": 2.7215, "step": 14296 }, { "epoch": 0.38, "learning_rate": 0.001411062932938866, "loss": 2.8508, "step": 14297 }, { "epoch": 0.38, "learning_rate": 0.0014109835858464766, "loss": 2.8416, "step": 14298 }, { "epoch": 0.38, "learning_rate": 0.0014109042356405489, "loss": 2.7367, "step": 14299 }, { "epoch": 0.38, "learning_rate": 0.0014108248823216842, "loss": 2.4099, "step": 14300 }, { "epoch": 0.38, "learning_rate": 0.0014107455258904836, "loss": 2.5565, "step": 14301 }, { "epoch": 0.38, "learning_rate": 0.0014106661663475482, "loss": 2.3262, "step": 14302 }, { "epoch": 0.38, "learning_rate": 0.0014105868036934797, "loss": 2.4429, "step": 14303 }, { "epoch": 0.38, "learning_rate": 0.0014105074379288786, "loss": 2.4433, "step": 14304 }, { "epoch": 0.38, "learning_rate": 0.0014104280690543467, "loss": 2.5778, "step": 14305 }, { "epoch": 0.38, "learning_rate": 0.0014103486970704852, "loss": 2.4481, "step": 14306 }, { "epoch": 0.38, "learning_rate": 0.0014102693219778953, "loss": 2.535, "step": 14307 }, { "epoch": 0.38, "learning_rate": 0.0014101899437771782, "loss": 2.4921, "step": 14308 }, { "epoch": 0.38, "learning_rate": 0.0014101105624689354, "loss": 2.3269, "step": 14309 }, { "epoch": 0.38, "learning_rate": 0.0014100311780537687, "loss": 2.6487, "step": 14310 }, { "epoch": 0.38, "learning_rate": 0.0014099517905322787, "loss": 2.5821, "step": 14311 }, { "epoch": 0.38, "learning_rate": 0.0014098723999050676, "loss": 2.5487, "step": 14312 }, { "epoch": 0.38, "learning_rate": 0.0014097930061727363, "loss": 2.2504, "step": 14313 }, { "epoch": 0.38, "learning_rate": 0.0014097136093358862, "loss": 2.4519, "step": 14314 }, { "epoch": 0.38, "learning_rate": 0.0014096342093951194, "loss": 2.7834, "step": 14315 }, { "epoch": 0.38, "learning_rate": 0.001409554806351037, "loss": 2.6341, "step": 14316 }, { "epoch": 0.38, "learning_rate": 0.0014094754002042405, "loss": 2.2817, "step": 14317 }, { "epoch": 0.38, "learning_rate": 0.0014093959909553314, "loss": 2.5668, "step": 14318 }, { "epoch": 0.38, "learning_rate": 0.001409316578604912, "loss": 2.5619, "step": 14319 }, { "epoch": 0.38, "learning_rate": 0.001409237163153583, "loss": 2.4368, "step": 14320 }, { "epoch": 0.38, "learning_rate": 0.0014091577446019461, "loss": 2.5696, "step": 14321 }, { "epoch": 0.38, "learning_rate": 0.0014090783229506038, "loss": 2.2202, "step": 14322 }, { "epoch": 0.38, "learning_rate": 0.0014089988982001571, "loss": 2.4224, "step": 14323 }, { "epoch": 0.38, "learning_rate": 0.0014089194703512079, "loss": 3.0175, "step": 14324 }, { "epoch": 0.38, "learning_rate": 0.0014088400394043578, "loss": 2.6127, "step": 14325 }, { "epoch": 0.38, "learning_rate": 0.0014087606053602086, "loss": 2.73, "step": 14326 }, { "epoch": 0.39, "learning_rate": 0.0014086811682193622, "loss": 2.4119, "step": 14327 }, { "epoch": 0.39, "learning_rate": 0.0014086017279824204, "loss": 2.4705, "step": 14328 }, { "epoch": 0.39, "learning_rate": 0.001408522284649985, "loss": 2.7375, "step": 14329 }, { "epoch": 0.39, "learning_rate": 0.001408442838222658, "loss": 2.5748, "step": 14330 }, { "epoch": 0.39, "learning_rate": 0.0014083633887010407, "loss": 2.8909, "step": 14331 }, { "epoch": 0.39, "learning_rate": 0.0014082839360857356, "loss": 2.8754, "step": 14332 }, { "epoch": 0.39, "learning_rate": 0.0014082044803773442, "loss": 2.7552, "step": 14333 }, { "epoch": 0.39, "learning_rate": 0.0014081250215764688, "loss": 2.8367, "step": 14334 }, { "epoch": 0.39, "learning_rate": 0.0014080455596837112, "loss": 2.715, "step": 14335 }, { "epoch": 0.39, "learning_rate": 0.0014079660946996733, "loss": 2.5139, "step": 14336 }, { "epoch": 0.39, "learning_rate": 0.0014078866266249573, "loss": 2.3041, "step": 14337 }, { "epoch": 0.39, "learning_rate": 0.001407807155460165, "loss": 2.9358, "step": 14338 }, { "epoch": 0.39, "learning_rate": 0.0014077276812058989, "loss": 2.4953, "step": 14339 }, { "epoch": 0.39, "learning_rate": 0.0014076482038627605, "loss": 2.5648, "step": 14340 }, { "epoch": 0.39, "learning_rate": 0.001407568723431352, "loss": 2.6946, "step": 14341 }, { "epoch": 0.39, "learning_rate": 0.0014074892399122763, "loss": 2.611, "step": 14342 }, { "epoch": 0.39, "learning_rate": 0.0014074097533061348, "loss": 2.5904, "step": 14343 }, { "epoch": 0.39, "learning_rate": 0.0014073302636135293, "loss": 2.5942, "step": 14344 }, { "epoch": 0.39, "learning_rate": 0.001407250770835063, "loss": 2.3672, "step": 14345 }, { "epoch": 0.39, "learning_rate": 0.0014071712749713376, "loss": 2.8271, "step": 14346 }, { "epoch": 0.39, "learning_rate": 0.0014070917760229556, "loss": 2.396, "step": 14347 }, { "epoch": 0.39, "learning_rate": 0.0014070122739905187, "loss": 2.9613, "step": 14348 }, { "epoch": 0.39, "learning_rate": 0.0014069327688746298, "loss": 2.4507, "step": 14349 }, { "epoch": 0.39, "learning_rate": 0.0014068532606758913, "loss": 2.4193, "step": 14350 }, { "epoch": 0.39, "learning_rate": 0.0014067737493949047, "loss": 2.4802, "step": 14351 }, { "epoch": 0.39, "learning_rate": 0.0014066942350322732, "loss": 2.817, "step": 14352 }, { "epoch": 0.39, "learning_rate": 0.0014066147175885988, "loss": 2.7075, "step": 14353 }, { "epoch": 0.39, "learning_rate": 0.0014065351970644839, "loss": 2.5367, "step": 14354 }, { "epoch": 0.39, "learning_rate": 0.001406455673460531, "loss": 2.4523, "step": 14355 }, { "epoch": 0.39, "learning_rate": 0.0014063761467773429, "loss": 2.8621, "step": 14356 }, { "epoch": 0.39, "learning_rate": 0.0014062966170155216, "loss": 2.9687, "step": 14357 }, { "epoch": 0.39, "learning_rate": 0.0014062170841756699, "loss": 2.7416, "step": 14358 }, { "epoch": 0.39, "learning_rate": 0.00140613754825839, "loss": 2.4964, "step": 14359 }, { "epoch": 0.39, "learning_rate": 0.0014060580092642848, "loss": 2.3876, "step": 14360 }, { "epoch": 0.39, "learning_rate": 0.0014059784671939565, "loss": 2.5631, "step": 14361 }, { "epoch": 0.39, "learning_rate": 0.0014058989220480079, "loss": 2.4801, "step": 14362 }, { "epoch": 0.39, "learning_rate": 0.001405819373827042, "loss": 2.6556, "step": 14363 }, { "epoch": 0.39, "learning_rate": 0.0014057398225316604, "loss": 2.5085, "step": 14364 }, { "epoch": 0.39, "learning_rate": 0.001405660268162467, "loss": 2.5437, "step": 14365 }, { "epoch": 0.39, "learning_rate": 0.001405580710720064, "loss": 2.8941, "step": 14366 }, { "epoch": 0.39, "learning_rate": 0.0014055011502050539, "loss": 2.9573, "step": 14367 }, { "epoch": 0.39, "learning_rate": 0.0014054215866180393, "loss": 2.998, "step": 14368 }, { "epoch": 0.39, "learning_rate": 0.0014053420199596235, "loss": 2.4592, "step": 14369 }, { "epoch": 0.39, "learning_rate": 0.001405262450230409, "loss": 2.5085, "step": 14370 }, { "epoch": 0.39, "learning_rate": 0.0014051828774309986, "loss": 2.1471, "step": 14371 }, { "epoch": 0.39, "learning_rate": 0.0014051033015619954, "loss": 2.203, "step": 14372 }, { "epoch": 0.39, "learning_rate": 0.001405023722624002, "loss": 2.1898, "step": 14373 }, { "epoch": 0.39, "learning_rate": 0.0014049441406176208, "loss": 2.2819, "step": 14374 }, { "epoch": 0.39, "learning_rate": 0.0014048645555434554, "loss": 2.8003, "step": 14375 }, { "epoch": 0.39, "learning_rate": 0.0014047849674021088, "loss": 2.5476, "step": 14376 }, { "epoch": 0.39, "learning_rate": 0.0014047053761941832, "loss": 2.4301, "step": 14377 }, { "epoch": 0.39, "learning_rate": 0.0014046257819202825, "loss": 2.7404, "step": 14378 }, { "epoch": 0.39, "learning_rate": 0.0014045461845810091, "loss": 2.5601, "step": 14379 }, { "epoch": 0.39, "learning_rate": 0.001404466584176966, "loss": 2.5946, "step": 14380 }, { "epoch": 0.39, "learning_rate": 0.0014043869807087563, "loss": 2.5389, "step": 14381 }, { "epoch": 0.39, "learning_rate": 0.0014043073741769835, "loss": 2.7879, "step": 14382 }, { "epoch": 0.39, "learning_rate": 0.0014042277645822498, "loss": 2.9772, "step": 14383 }, { "epoch": 0.39, "learning_rate": 0.001404148151925159, "loss": 2.2874, "step": 14384 }, { "epoch": 0.39, "learning_rate": 0.0014040685362063142, "loss": 2.5884, "step": 14385 }, { "epoch": 0.39, "learning_rate": 0.0014039889174263186, "loss": 2.4551, "step": 14386 }, { "epoch": 0.39, "learning_rate": 0.0014039092955857747, "loss": 2.3256, "step": 14387 }, { "epoch": 0.39, "learning_rate": 0.0014038296706852865, "loss": 2.9123, "step": 14388 }, { "epoch": 0.39, "learning_rate": 0.001403750042725457, "loss": 2.3509, "step": 14389 }, { "epoch": 0.39, "learning_rate": 0.001403670411706889, "loss": 2.7531, "step": 14390 }, { "epoch": 0.39, "learning_rate": 0.001403590777630186, "loss": 2.5801, "step": 14391 }, { "epoch": 0.39, "learning_rate": 0.001403511140495952, "loss": 2.475, "step": 14392 }, { "epoch": 0.39, "learning_rate": 0.0014034315003047895, "loss": 2.5686, "step": 14393 }, { "epoch": 0.39, "learning_rate": 0.001403351857057302, "loss": 2.583, "step": 14394 }, { "epoch": 0.39, "learning_rate": 0.001403272210754093, "loss": 2.3678, "step": 14395 }, { "epoch": 0.39, "learning_rate": 0.001403192561395766, "loss": 2.5141, "step": 14396 }, { "epoch": 0.39, "learning_rate": 0.001403112908982924, "loss": 2.6172, "step": 14397 }, { "epoch": 0.39, "learning_rate": 0.0014030332535161707, "loss": 2.4777, "step": 14398 }, { "epoch": 0.39, "learning_rate": 0.0014029535949961096, "loss": 2.4958, "step": 14399 }, { "epoch": 0.39, "learning_rate": 0.001402873933423344, "loss": 2.2538, "step": 14400 }, { "epoch": 0.39, "learning_rate": 0.0014027942687984776, "loss": 2.3236, "step": 14401 }, { "epoch": 0.39, "learning_rate": 0.001402714601122114, "loss": 2.3763, "step": 14402 }, { "epoch": 0.39, "learning_rate": 0.0014026349303948563, "loss": 2.5984, "step": 14403 }, { "epoch": 0.39, "learning_rate": 0.0014025552566173083, "loss": 2.1048, "step": 14404 }, { "epoch": 0.39, "learning_rate": 0.001402475579790074, "loss": 2.6402, "step": 14405 }, { "epoch": 0.39, "learning_rate": 0.0014023958999137562, "loss": 2.5797, "step": 14406 }, { "epoch": 0.39, "learning_rate": 0.0014023162169889594, "loss": 2.1214, "step": 14407 }, { "epoch": 0.39, "learning_rate": 0.0014022365310162868, "loss": 2.5212, "step": 14408 }, { "epoch": 0.39, "learning_rate": 0.0014021568419963421, "loss": 2.7813, "step": 14409 }, { "epoch": 0.39, "learning_rate": 0.0014020771499297288, "loss": 2.639, "step": 14410 }, { "epoch": 0.39, "learning_rate": 0.0014019974548170513, "loss": 2.6556, "step": 14411 }, { "epoch": 0.39, "learning_rate": 0.001401917756658913, "loss": 2.6106, "step": 14412 }, { "epoch": 0.39, "learning_rate": 0.0014018380554559173, "loss": 2.0645, "step": 14413 }, { "epoch": 0.39, "learning_rate": 0.0014017583512086684, "loss": 2.6591, "step": 14414 }, { "epoch": 0.39, "learning_rate": 0.0014016786439177702, "loss": 2.6435, "step": 14415 }, { "epoch": 0.39, "learning_rate": 0.0014015989335838263, "loss": 2.3331, "step": 14416 }, { "epoch": 0.39, "learning_rate": 0.0014015192202074408, "loss": 2.9478, "step": 14417 }, { "epoch": 0.39, "learning_rate": 0.0014014395037892174, "loss": 2.5772, "step": 14418 }, { "epoch": 0.39, "learning_rate": 0.00140135978432976, "loss": 2.4632, "step": 14419 }, { "epoch": 0.39, "learning_rate": 0.0014012800618296729, "loss": 3.07, "step": 14420 }, { "epoch": 0.39, "learning_rate": 0.0014012003362895596, "loss": 2.4242, "step": 14421 }, { "epoch": 0.39, "learning_rate": 0.001401120607710024, "loss": 2.5143, "step": 14422 }, { "epoch": 0.39, "learning_rate": 0.0014010408760916707, "loss": 1.9741, "step": 14423 }, { "epoch": 0.39, "learning_rate": 0.0014009611414351035, "loss": 2.4079, "step": 14424 }, { "epoch": 0.39, "learning_rate": 0.0014008814037409264, "loss": 2.646, "step": 14425 }, { "epoch": 0.39, "learning_rate": 0.0014008016630097432, "loss": 2.5918, "step": 14426 }, { "epoch": 0.39, "learning_rate": 0.0014007219192421583, "loss": 2.4667, "step": 14427 }, { "epoch": 0.39, "learning_rate": 0.0014006421724387758, "loss": 2.1364, "step": 14428 }, { "epoch": 0.39, "learning_rate": 0.0014005624226002, "loss": 2.8244, "step": 14429 }, { "epoch": 0.39, "learning_rate": 0.0014004826697270347, "loss": 2.4604, "step": 14430 }, { "epoch": 0.39, "learning_rate": 0.0014004029138198844, "loss": 2.5113, "step": 14431 }, { "epoch": 0.39, "learning_rate": 0.0014003231548793535, "loss": 2.5962, "step": 14432 }, { "epoch": 0.39, "learning_rate": 0.0014002433929060454, "loss": 2.3446, "step": 14433 }, { "epoch": 0.39, "learning_rate": 0.0014001636279005652, "loss": 2.6736, "step": 14434 }, { "epoch": 0.39, "learning_rate": 0.0014000838598635169, "loss": 2.7441, "step": 14435 }, { "epoch": 0.39, "learning_rate": 0.0014000040887955049, "loss": 2.3473, "step": 14436 }, { "epoch": 0.39, "learning_rate": 0.0013999243146971332, "loss": 2.1465, "step": 14437 }, { "epoch": 0.39, "learning_rate": 0.0013998445375690064, "loss": 2.6414, "step": 14438 }, { "epoch": 0.39, "learning_rate": 0.0013997647574117292, "loss": 2.3715, "step": 14439 }, { "epoch": 0.39, "learning_rate": 0.0013996849742259052, "loss": 2.9624, "step": 14440 }, { "epoch": 0.39, "learning_rate": 0.0013996051880121394, "loss": 2.7632, "step": 14441 }, { "epoch": 0.39, "learning_rate": 0.0013995253987710364, "loss": 2.2125, "step": 14442 }, { "epoch": 0.39, "learning_rate": 0.0013994456065032001, "loss": 2.4616, "step": 14443 }, { "epoch": 0.39, "learning_rate": 0.0013993658112092357, "loss": 2.4686, "step": 14444 }, { "epoch": 0.39, "learning_rate": 0.001399286012889747, "loss": 2.4297, "step": 14445 }, { "epoch": 0.39, "learning_rate": 0.001399206211545339, "loss": 2.6764, "step": 14446 }, { "epoch": 0.39, "learning_rate": 0.0013991264071766159, "loss": 2.4044, "step": 14447 }, { "epoch": 0.39, "learning_rate": 0.0013990465997841828, "loss": 2.8896, "step": 14448 }, { "epoch": 0.39, "learning_rate": 0.0013989667893686438, "loss": 2.3055, "step": 14449 }, { "epoch": 0.39, "learning_rate": 0.0013988869759306035, "loss": 2.6053, "step": 14450 }, { "epoch": 0.39, "learning_rate": 0.0013988071594706673, "loss": 2.7955, "step": 14451 }, { "epoch": 0.39, "learning_rate": 0.0013987273399894394, "loss": 2.6758, "step": 14452 }, { "epoch": 0.39, "learning_rate": 0.0013986475174875238, "loss": 2.5908, "step": 14453 }, { "epoch": 0.39, "learning_rate": 0.0013985676919655264, "loss": 2.4428, "step": 14454 }, { "epoch": 0.39, "learning_rate": 0.0013984878634240513, "loss": 2.6412, "step": 14455 }, { "epoch": 0.39, "learning_rate": 0.0013984080318637034, "loss": 2.5273, "step": 14456 }, { "epoch": 0.39, "learning_rate": 0.0013983281972850873, "loss": 2.5651, "step": 14457 }, { "epoch": 0.39, "learning_rate": 0.0013982483596888082, "loss": 2.4119, "step": 14458 }, { "epoch": 0.39, "learning_rate": 0.0013981685190754707, "loss": 2.6447, "step": 14459 }, { "epoch": 0.39, "learning_rate": 0.0013980886754456797, "loss": 2.7484, "step": 14460 }, { "epoch": 0.39, "learning_rate": 0.00139800882880004, "loss": 2.9304, "step": 14461 }, { "epoch": 0.39, "learning_rate": 0.0013979289791391568, "loss": 2.2356, "step": 14462 }, { "epoch": 0.39, "learning_rate": 0.0013978491264636343, "loss": 2.4988, "step": 14463 }, { "epoch": 0.39, "learning_rate": 0.0013977692707740784, "loss": 2.4399, "step": 14464 }, { "epoch": 0.39, "learning_rate": 0.0013976894120710935, "loss": 2.9313, "step": 14465 }, { "epoch": 0.39, "learning_rate": 0.0013976095503552845, "loss": 2.7796, "step": 14466 }, { "epoch": 0.39, "learning_rate": 0.0013975296856272568, "loss": 2.2909, "step": 14467 }, { "epoch": 0.39, "learning_rate": 0.0013974498178876153, "loss": 2.6217, "step": 14468 }, { "epoch": 0.39, "learning_rate": 0.0013973699471369653, "loss": 2.8572, "step": 14469 }, { "epoch": 0.39, "learning_rate": 0.001397290073375911, "loss": 2.3389, "step": 14470 }, { "epoch": 0.39, "learning_rate": 0.0013972101966050585, "loss": 2.6934, "step": 14471 }, { "epoch": 0.39, "learning_rate": 0.0013971303168250127, "loss": 2.6352, "step": 14472 }, { "epoch": 0.39, "learning_rate": 0.0013970504340363782, "loss": 2.6147, "step": 14473 }, { "epoch": 0.39, "learning_rate": 0.001396970548239761, "loss": 2.787, "step": 14474 }, { "epoch": 0.39, "learning_rate": 0.001396890659435766, "loss": 2.2475, "step": 14475 }, { "epoch": 0.39, "learning_rate": 0.0013968107676249977, "loss": 2.6073, "step": 14476 }, { "epoch": 0.39, "learning_rate": 0.0013967308728080623, "loss": 3.0661, "step": 14477 }, { "epoch": 0.39, "learning_rate": 0.0013966509749855649, "loss": 2.5313, "step": 14478 }, { "epoch": 0.39, "learning_rate": 0.0013965710741581105, "loss": 2.4363, "step": 14479 }, { "epoch": 0.39, "learning_rate": 0.0013964911703263044, "loss": 2.5236, "step": 14480 }, { "epoch": 0.39, "learning_rate": 0.0013964112634907524, "loss": 2.5568, "step": 14481 }, { "epoch": 0.39, "learning_rate": 0.0013963313536520595, "loss": 2.6377, "step": 14482 }, { "epoch": 0.39, "learning_rate": 0.0013962514408108308, "loss": 2.8332, "step": 14483 }, { "epoch": 0.39, "learning_rate": 0.0013961715249676723, "loss": 2.8763, "step": 14484 }, { "epoch": 0.39, "learning_rate": 0.001396091606123189, "loss": 3.0124, "step": 14485 }, { "epoch": 0.39, "learning_rate": 0.0013960116842779867, "loss": 2.6527, "step": 14486 }, { "epoch": 0.39, "learning_rate": 0.0013959317594326706, "loss": 3.0442, "step": 14487 }, { "epoch": 0.39, "learning_rate": 0.0013958518315878461, "loss": 2.6548, "step": 14488 }, { "epoch": 0.39, "learning_rate": 0.001395771900744119, "loss": 2.5111, "step": 14489 }, { "epoch": 0.39, "learning_rate": 0.001395691966902095, "loss": 2.8024, "step": 14490 }, { "epoch": 0.39, "learning_rate": 0.001395612030062379, "loss": 2.4498, "step": 14491 }, { "epoch": 0.39, "learning_rate": 0.0013955320902255771, "loss": 2.2739, "step": 14492 }, { "epoch": 0.39, "learning_rate": 0.0013954521473922947, "loss": 2.4879, "step": 14493 }, { "epoch": 0.39, "learning_rate": 0.001395372201563138, "loss": 2.7249, "step": 14494 }, { "epoch": 0.39, "learning_rate": 0.001395292252738712, "loss": 3.2681, "step": 14495 }, { "epoch": 0.39, "learning_rate": 0.001395212300919622, "loss": 2.4396, "step": 14496 }, { "epoch": 0.39, "learning_rate": 0.001395132346106475, "loss": 2.7234, "step": 14497 }, { "epoch": 0.39, "learning_rate": 0.0013950523882998755, "loss": 2.5228, "step": 14498 }, { "epoch": 0.39, "learning_rate": 0.00139497242750043, "loss": 2.6522, "step": 14499 }, { "epoch": 0.39, "learning_rate": 0.001394892463708744, "loss": 2.6632, "step": 14500 }, { "epoch": 0.39, "learning_rate": 0.0013948124969254232, "loss": 2.698, "step": 14501 }, { "epoch": 0.39, "learning_rate": 0.0013947325271510733, "loss": 2.4607, "step": 14502 }, { "epoch": 0.39, "learning_rate": 0.0013946525543863009, "loss": 2.8417, "step": 14503 }, { "epoch": 0.39, "learning_rate": 0.0013945725786317109, "loss": 2.4668, "step": 14504 }, { "epoch": 0.39, "learning_rate": 0.0013944925998879097, "loss": 2.2024, "step": 14505 }, { "epoch": 0.39, "learning_rate": 0.001394412618155503, "loss": 2.7188, "step": 14506 }, { "epoch": 0.39, "learning_rate": 0.001394332633435097, "loss": 2.6226, "step": 14507 }, { "epoch": 0.39, "learning_rate": 0.0013942526457272973, "loss": 2.6361, "step": 14508 }, { "epoch": 0.39, "learning_rate": 0.00139417265503271, "loss": 2.603, "step": 14509 }, { "epoch": 0.39, "learning_rate": 0.0013940926613519413, "loss": 1.99, "step": 14510 }, { "epoch": 0.39, "learning_rate": 0.0013940126646855974, "loss": 2.5252, "step": 14511 }, { "epoch": 0.39, "learning_rate": 0.0013939326650342831, "loss": 2.4562, "step": 14512 }, { "epoch": 0.39, "learning_rate": 0.001393852662398606, "loss": 2.5728, "step": 14513 }, { "epoch": 0.39, "learning_rate": 0.0013937726567791713, "loss": 2.5953, "step": 14514 }, { "epoch": 0.39, "learning_rate": 0.0013936926481765855, "loss": 2.5417, "step": 14515 }, { "epoch": 0.39, "learning_rate": 0.0013936126365914543, "loss": 2.5533, "step": 14516 }, { "epoch": 0.39, "learning_rate": 0.0013935326220243845, "loss": 2.8939, "step": 14517 }, { "epoch": 0.39, "learning_rate": 0.001393452604475982, "loss": 2.3498, "step": 14518 }, { "epoch": 0.39, "learning_rate": 0.0013933725839468524, "loss": 2.2203, "step": 14519 }, { "epoch": 0.39, "learning_rate": 0.0013932925604376028, "loss": 2.5413, "step": 14520 }, { "epoch": 0.39, "learning_rate": 0.0013932125339488391, "loss": 2.941, "step": 14521 }, { "epoch": 0.39, "learning_rate": 0.0013931325044811674, "loss": 2.6151, "step": 14522 }, { "epoch": 0.39, "learning_rate": 0.001393052472035194, "loss": 2.5998, "step": 14523 }, { "epoch": 0.39, "learning_rate": 0.0013929724366115255, "loss": 2.7697, "step": 14524 }, { "epoch": 0.39, "learning_rate": 0.0013928923982107681, "loss": 2.3616, "step": 14525 }, { "epoch": 0.39, "learning_rate": 0.0013928123568335282, "loss": 2.6564, "step": 14526 }, { "epoch": 0.39, "learning_rate": 0.0013927323124804118, "loss": 2.322, "step": 14527 }, { "epoch": 0.39, "learning_rate": 0.001392652265152026, "loss": 2.665, "step": 14528 }, { "epoch": 0.39, "learning_rate": 0.0013925722148489768, "loss": 2.5031, "step": 14529 }, { "epoch": 0.39, "learning_rate": 0.0013924921615718706, "loss": 2.6826, "step": 14530 }, { "epoch": 0.39, "learning_rate": 0.001392412105321314, "loss": 2.6478, "step": 14531 }, { "epoch": 0.39, "learning_rate": 0.0013923320460979133, "loss": 2.3456, "step": 14532 }, { "epoch": 0.39, "learning_rate": 0.0013922519839022751, "loss": 2.5624, "step": 14533 }, { "epoch": 0.39, "learning_rate": 0.0013921719187350065, "loss": 2.828, "step": 14534 }, { "epoch": 0.39, "learning_rate": 0.0013920918505967129, "loss": 2.6796, "step": 14535 }, { "epoch": 0.39, "learning_rate": 0.0013920117794880018, "loss": 2.104, "step": 14536 }, { "epoch": 0.39, "learning_rate": 0.0013919317054094799, "loss": 2.3326, "step": 14537 }, { "epoch": 0.39, "learning_rate": 0.001391851628361753, "loss": 2.9643, "step": 14538 }, { "epoch": 0.39, "learning_rate": 0.001391771548345428, "loss": 2.9795, "step": 14539 }, { "epoch": 0.39, "learning_rate": 0.0013916914653611123, "loss": 2.9946, "step": 14540 }, { "epoch": 0.39, "learning_rate": 0.0013916113794094122, "loss": 2.5848, "step": 14541 }, { "epoch": 0.39, "learning_rate": 0.001391531290490934, "loss": 2.141, "step": 14542 }, { "epoch": 0.39, "learning_rate": 0.0013914511986062846, "loss": 2.3134, "step": 14543 }, { "epoch": 0.39, "learning_rate": 0.0013913711037560712, "loss": 2.2301, "step": 14544 }, { "epoch": 0.39, "learning_rate": 0.0013912910059409001, "loss": 2.1485, "step": 14545 }, { "epoch": 0.39, "learning_rate": 0.0013912109051613783, "loss": 2.4208, "step": 14546 }, { "epoch": 0.39, "learning_rate": 0.0013911308014181128, "loss": 2.3872, "step": 14547 }, { "epoch": 0.39, "learning_rate": 0.0013910506947117103, "loss": 2.3744, "step": 14548 }, { "epoch": 0.39, "learning_rate": 0.0013909705850427773, "loss": 2.5685, "step": 14549 }, { "epoch": 0.39, "learning_rate": 0.0013908904724119213, "loss": 2.7416, "step": 14550 }, { "epoch": 0.39, "learning_rate": 0.001390810356819749, "loss": 2.7168, "step": 14551 }, { "epoch": 0.39, "learning_rate": 0.0013907302382668671, "loss": 2.6712, "step": 14552 }, { "epoch": 0.39, "learning_rate": 0.0013906501167538833, "loss": 2.5328, "step": 14553 }, { "epoch": 0.39, "learning_rate": 0.0013905699922814034, "loss": 3.0115, "step": 14554 }, { "epoch": 0.39, "learning_rate": 0.0013904898648500355, "loss": 3.1083, "step": 14555 }, { "epoch": 0.39, "learning_rate": 0.001390409734460386, "loss": 2.7863, "step": 14556 }, { "epoch": 0.39, "learning_rate": 0.0013903296011130621, "loss": 2.3877, "step": 14557 }, { "epoch": 0.39, "learning_rate": 0.001390249464808671, "loss": 2.2919, "step": 14558 }, { "epoch": 0.39, "learning_rate": 0.0013901693255478195, "loss": 2.7969, "step": 14559 }, { "epoch": 0.39, "learning_rate": 0.0013900891833311156, "loss": 2.2441, "step": 14560 }, { "epoch": 0.39, "learning_rate": 0.0013900090381591655, "loss": 2.8449, "step": 14561 }, { "epoch": 0.39, "learning_rate": 0.0013899288900325762, "loss": 2.3331, "step": 14562 }, { "epoch": 0.39, "learning_rate": 0.0013898487389519556, "loss": 2.7893, "step": 14563 }, { "epoch": 0.39, "learning_rate": 0.001389768584917911, "loss": 2.8525, "step": 14564 }, { "epoch": 0.39, "learning_rate": 0.001389688427931049, "loss": 2.4321, "step": 14565 }, { "epoch": 0.39, "learning_rate": 0.001389608267991977, "loss": 2.8274, "step": 14566 }, { "epoch": 0.39, "learning_rate": 0.0013895281051013028, "loss": 2.5902, "step": 14567 }, { "epoch": 0.39, "learning_rate": 0.0013894479392596328, "loss": 2.7558, "step": 14568 }, { "epoch": 0.39, "learning_rate": 0.001389367770467575, "loss": 2.9059, "step": 14569 }, { "epoch": 0.39, "learning_rate": 0.0013892875987257366, "loss": 2.8346, "step": 14570 }, { "epoch": 0.39, "learning_rate": 0.0013892074240347255, "loss": 2.9698, "step": 14571 }, { "epoch": 0.39, "learning_rate": 0.001389127246395148, "loss": 2.7797, "step": 14572 }, { "epoch": 0.39, "learning_rate": 0.0013890470658076122, "loss": 2.6391, "step": 14573 }, { "epoch": 0.39, "learning_rate": 0.001388966882272725, "loss": 2.6359, "step": 14574 }, { "epoch": 0.39, "learning_rate": 0.0013888866957910946, "loss": 2.5766, "step": 14575 }, { "epoch": 0.39, "learning_rate": 0.0013888065063633282, "loss": 2.0582, "step": 14576 }, { "epoch": 0.39, "learning_rate": 0.0013887263139900333, "loss": 2.5853, "step": 14577 }, { "epoch": 0.39, "learning_rate": 0.0013886461186718168, "loss": 2.3395, "step": 14578 }, { "epoch": 0.39, "learning_rate": 0.0013885659204092872, "loss": 2.6089, "step": 14579 }, { "epoch": 0.39, "learning_rate": 0.0013884857192030518, "loss": 2.4261, "step": 14580 }, { "epoch": 0.39, "learning_rate": 0.0013884055150537177, "loss": 2.9176, "step": 14581 }, { "epoch": 0.39, "learning_rate": 0.001388325307961893, "loss": 2.9401, "step": 14582 }, { "epoch": 0.39, "learning_rate": 0.0013882450979281853, "loss": 2.7206, "step": 14583 }, { "epoch": 0.39, "learning_rate": 0.001388164884953202, "loss": 2.5692, "step": 14584 }, { "epoch": 0.39, "learning_rate": 0.001388084669037551, "loss": 2.7439, "step": 14585 }, { "epoch": 0.39, "learning_rate": 0.00138800445018184, "loss": 2.2084, "step": 14586 }, { "epoch": 0.39, "learning_rate": 0.0013879242283866763, "loss": 2.4201, "step": 14587 }, { "epoch": 0.39, "learning_rate": 0.0013878440036526683, "loss": 2.5951, "step": 14588 }, { "epoch": 0.39, "learning_rate": 0.0013877637759804233, "loss": 2.5562, "step": 14589 }, { "epoch": 0.39, "learning_rate": 0.0013876835453705497, "loss": 2.3993, "step": 14590 }, { "epoch": 0.39, "learning_rate": 0.0013876033118236544, "loss": 2.6286, "step": 14591 }, { "epoch": 0.39, "learning_rate": 0.0013875230753403458, "loss": 2.8216, "step": 14592 }, { "epoch": 0.39, "learning_rate": 0.0013874428359212316, "loss": 2.6612, "step": 14593 }, { "epoch": 0.39, "learning_rate": 0.00138736259356692, "loss": 2.3996, "step": 14594 }, { "epoch": 0.39, "learning_rate": 0.0013872823482780185, "loss": 2.3085, "step": 14595 }, { "epoch": 0.39, "learning_rate": 0.0013872021000551353, "loss": 2.2833, "step": 14596 }, { "epoch": 0.39, "learning_rate": 0.001387121848898878, "loss": 2.2456, "step": 14597 }, { "epoch": 0.39, "learning_rate": 0.0013870415948098547, "loss": 2.263, "step": 14598 }, { "epoch": 0.39, "learning_rate": 0.001386961337788674, "loss": 2.6439, "step": 14599 }, { "epoch": 0.39, "learning_rate": 0.0013868810778359432, "loss": 2.4806, "step": 14600 }, { "epoch": 0.39, "learning_rate": 0.0013868008149522703, "loss": 2.384, "step": 14601 }, { "epoch": 0.39, "learning_rate": 0.0013867205491382632, "loss": 2.3332, "step": 14602 }, { "epoch": 0.39, "learning_rate": 0.0013866402803945311, "loss": 2.8029, "step": 14603 }, { "epoch": 0.39, "learning_rate": 0.0013865600087216812, "loss": 2.3292, "step": 14604 }, { "epoch": 0.39, "learning_rate": 0.0013864797341203213, "loss": 2.4082, "step": 14605 }, { "epoch": 0.39, "learning_rate": 0.0013863994565910605, "loss": 2.5965, "step": 14606 }, { "epoch": 0.39, "learning_rate": 0.0013863191761345065, "loss": 2.6618, "step": 14607 }, { "epoch": 0.39, "learning_rate": 0.0013862388927512671, "loss": 2.4624, "step": 14608 }, { "epoch": 0.39, "learning_rate": 0.0013861586064419513, "loss": 2.3913, "step": 14609 }, { "epoch": 0.39, "learning_rate": 0.0013860783172071668, "loss": 2.8667, "step": 14610 }, { "epoch": 0.39, "learning_rate": 0.0013859980250475218, "loss": 2.6472, "step": 14611 }, { "epoch": 0.39, "learning_rate": 0.001385917729963625, "loss": 2.6648, "step": 14612 }, { "epoch": 0.39, "learning_rate": 0.0013858374319560846, "loss": 2.4721, "step": 14613 }, { "epoch": 0.39, "learning_rate": 0.0013857571310255086, "loss": 2.4934, "step": 14614 }, { "epoch": 0.39, "learning_rate": 0.0013856768271725056, "loss": 2.3222, "step": 14615 }, { "epoch": 0.39, "learning_rate": 0.0013855965203976842, "loss": 3.1044, "step": 14616 }, { "epoch": 0.39, "learning_rate": 0.001385516210701652, "loss": 2.6237, "step": 14617 }, { "epoch": 0.39, "learning_rate": 0.001385435898085018, "loss": 2.5293, "step": 14618 }, { "epoch": 0.39, "learning_rate": 0.0013853555825483906, "loss": 2.4526, "step": 14619 }, { "epoch": 0.39, "learning_rate": 0.0013852752640923784, "loss": 2.6434, "step": 14620 }, { "epoch": 0.39, "learning_rate": 0.0013851949427175897, "loss": 2.6893, "step": 14621 }, { "epoch": 0.39, "learning_rate": 0.0013851146184246327, "loss": 2.1745, "step": 14622 }, { "epoch": 0.39, "learning_rate": 0.0013850342912141162, "loss": 2.5868, "step": 14623 }, { "epoch": 0.39, "learning_rate": 0.0013849539610866488, "loss": 2.1844, "step": 14624 }, { "epoch": 0.39, "learning_rate": 0.0013848736280428389, "loss": 2.4869, "step": 14625 }, { "epoch": 0.39, "learning_rate": 0.0013847932920832955, "loss": 2.3656, "step": 14626 }, { "epoch": 0.39, "learning_rate": 0.001384712953208627, "loss": 2.6321, "step": 14627 }, { "epoch": 0.39, "learning_rate": 0.0013846326114194413, "loss": 2.1448, "step": 14628 }, { "epoch": 0.39, "learning_rate": 0.0013845522667163483, "loss": 2.5312, "step": 14629 }, { "epoch": 0.39, "learning_rate": 0.0013844719190999563, "loss": 2.6441, "step": 14630 }, { "epoch": 0.39, "learning_rate": 0.001384391568570873, "loss": 2.2488, "step": 14631 }, { "epoch": 0.39, "learning_rate": 0.0013843112151297084, "loss": 2.5789, "step": 14632 }, { "epoch": 0.39, "learning_rate": 0.0013842308587770707, "loss": 2.4343, "step": 14633 }, { "epoch": 0.39, "learning_rate": 0.0013841504995135688, "loss": 2.6752, "step": 14634 }, { "epoch": 0.39, "learning_rate": 0.001384070137339811, "loss": 2.2142, "step": 14635 }, { "epoch": 0.39, "learning_rate": 0.0013839897722564068, "loss": 2.6947, "step": 14636 }, { "epoch": 0.39, "learning_rate": 0.0013839094042639645, "loss": 2.8271, "step": 14637 }, { "epoch": 0.39, "learning_rate": 0.0013838290333630936, "loss": 2.6543, "step": 14638 }, { "epoch": 0.39, "learning_rate": 0.0013837486595544024, "loss": 2.4576, "step": 14639 }, { "epoch": 0.39, "learning_rate": 0.0013836682828384998, "loss": 2.5281, "step": 14640 }, { "epoch": 0.39, "learning_rate": 0.0013835879032159948, "loss": 2.3385, "step": 14641 }, { "epoch": 0.39, "learning_rate": 0.0013835075206874968, "loss": 2.3493, "step": 14642 }, { "epoch": 0.39, "learning_rate": 0.0013834271352536143, "loss": 3.1305, "step": 14643 }, { "epoch": 0.39, "learning_rate": 0.001383346746914956, "loss": 2.6002, "step": 14644 }, { "epoch": 0.39, "learning_rate": 0.0013832663556721317, "loss": 2.2295, "step": 14645 }, { "epoch": 0.39, "learning_rate": 0.0013831859615257497, "loss": 2.7629, "step": 14646 }, { "epoch": 0.39, "learning_rate": 0.00138310556447642, "loss": 2.4585, "step": 14647 }, { "epoch": 0.39, "learning_rate": 0.0013830251645247503, "loss": 2.7213, "step": 14648 }, { "epoch": 0.39, "learning_rate": 0.0013829447616713507, "loss": 2.8109, "step": 14649 }, { "epoch": 0.39, "learning_rate": 0.0013828643559168302, "loss": 2.7307, "step": 14650 }, { "epoch": 0.39, "learning_rate": 0.0013827839472617973, "loss": 2.3433, "step": 14651 }, { "epoch": 0.39, "learning_rate": 0.001382703535706862, "loss": 2.1785, "step": 14652 }, { "epoch": 0.39, "learning_rate": 0.0013826231212526333, "loss": 2.6819, "step": 14653 }, { "epoch": 0.39, "learning_rate": 0.0013825427038997198, "loss": 2.7541, "step": 14654 }, { "epoch": 0.39, "learning_rate": 0.0013824622836487318, "loss": 2.1923, "step": 14655 }, { "epoch": 0.39, "learning_rate": 0.0013823818605002774, "loss": 2.3764, "step": 14656 }, { "epoch": 0.39, "learning_rate": 0.0013823014344549664, "loss": 2.3993, "step": 14657 }, { "epoch": 0.39, "learning_rate": 0.0013822210055134084, "loss": 2.8094, "step": 14658 }, { "epoch": 0.39, "learning_rate": 0.001382140573676212, "loss": 2.6739, "step": 14659 }, { "epoch": 0.39, "learning_rate": 0.0013820601389439872, "loss": 2.7196, "step": 14660 }, { "epoch": 0.39, "learning_rate": 0.001381979701317343, "loss": 2.5744, "step": 14661 }, { "epoch": 0.39, "learning_rate": 0.001381899260796889, "loss": 2.4512, "step": 14662 }, { "epoch": 0.39, "learning_rate": 0.0013818188173832342, "loss": 2.6565, "step": 14663 }, { "epoch": 0.39, "learning_rate": 0.0013817383710769886, "loss": 2.381, "step": 14664 }, { "epoch": 0.39, "learning_rate": 0.0013816579218787614, "loss": 2.8188, "step": 14665 }, { "epoch": 0.39, "learning_rate": 0.001381577469789162, "loss": 2.6221, "step": 14666 }, { "epoch": 0.39, "learning_rate": 0.0013814970148087996, "loss": 2.7455, "step": 14667 }, { "epoch": 0.39, "learning_rate": 0.001381416556938284, "loss": 2.6832, "step": 14668 }, { "epoch": 0.39, "learning_rate": 0.001381336096178225, "loss": 2.5111, "step": 14669 }, { "epoch": 0.39, "learning_rate": 0.001381255632529232, "loss": 2.8222, "step": 14670 }, { "epoch": 0.39, "learning_rate": 0.0013811751659919141, "loss": 2.2766, "step": 14671 }, { "epoch": 0.39, "learning_rate": 0.0013810946965668817, "loss": 2.5226, "step": 14672 }, { "epoch": 0.39, "learning_rate": 0.001381014224254744, "loss": 2.4214, "step": 14673 }, { "epoch": 0.39, "learning_rate": 0.0013809337490561103, "loss": 2.2813, "step": 14674 }, { "epoch": 0.39, "learning_rate": 0.0013808532709715907, "loss": 2.7107, "step": 14675 }, { "epoch": 0.39, "learning_rate": 0.001380772790001795, "loss": 2.2584, "step": 14676 }, { "epoch": 0.39, "learning_rate": 0.0013806923061473327, "loss": 2.8462, "step": 14677 }, { "epoch": 0.39, "learning_rate": 0.0013806118194088135, "loss": 2.6184, "step": 14678 }, { "epoch": 0.39, "learning_rate": 0.001380531329786847, "loss": 2.1608, "step": 14679 }, { "epoch": 0.39, "learning_rate": 0.0013804508372820437, "loss": 2.4465, "step": 14680 }, { "epoch": 0.39, "learning_rate": 0.0013803703418950124, "loss": 2.6555, "step": 14681 }, { "epoch": 0.39, "learning_rate": 0.0013802898436263637, "loss": 2.7708, "step": 14682 }, { "epoch": 0.39, "learning_rate": 0.0013802093424767068, "loss": 2.6258, "step": 14683 }, { "epoch": 0.39, "learning_rate": 0.0013801288384466522, "loss": 2.4965, "step": 14684 }, { "epoch": 0.39, "learning_rate": 0.0013800483315368093, "loss": 2.5449, "step": 14685 }, { "epoch": 0.39, "learning_rate": 0.0013799678217477885, "loss": 2.4232, "step": 14686 }, { "epoch": 0.39, "learning_rate": 0.001379887309080199, "loss": 2.4521, "step": 14687 }, { "epoch": 0.39, "learning_rate": 0.0013798067935346513, "loss": 2.6834, "step": 14688 }, { "epoch": 0.39, "learning_rate": 0.0013797262751117554, "loss": 2.4225, "step": 14689 }, { "epoch": 0.39, "learning_rate": 0.0013796457538121207, "loss": 2.5732, "step": 14690 }, { "epoch": 0.39, "learning_rate": 0.0013795652296363578, "loss": 2.579, "step": 14691 }, { "epoch": 0.39, "learning_rate": 0.001379484702585077, "loss": 2.4858, "step": 14692 }, { "epoch": 0.39, "learning_rate": 0.0013794041726588877, "loss": 2.7363, "step": 14693 }, { "epoch": 0.39, "learning_rate": 0.0013793236398584002, "loss": 2.511, "step": 14694 }, { "epoch": 0.39, "learning_rate": 0.0013792431041842244, "loss": 2.4557, "step": 14695 }, { "epoch": 0.39, "learning_rate": 0.001379162565636971, "loss": 2.666, "step": 14696 }, { "epoch": 0.39, "learning_rate": 0.0013790820242172495, "loss": 2.5112, "step": 14697 }, { "epoch": 0.39, "learning_rate": 0.0013790014799256707, "loss": 2.8556, "step": 14698 }, { "epoch": 0.4, "learning_rate": 0.001378920932762844, "loss": 3.0972, "step": 14699 }, { "epoch": 0.4, "learning_rate": 0.0013788403827293804, "loss": 2.893, "step": 14700 }, { "epoch": 0.4, "learning_rate": 0.0013787598298258897, "loss": 2.648, "step": 14701 }, { "epoch": 0.4, "learning_rate": 0.0013786792740529822, "loss": 2.6163, "step": 14702 }, { "epoch": 0.4, "learning_rate": 0.0013785987154112682, "loss": 2.3246, "step": 14703 }, { "epoch": 0.4, "learning_rate": 0.001378518153901358, "loss": 2.3894, "step": 14704 }, { "epoch": 0.4, "learning_rate": 0.0013784375895238622, "loss": 2.3863, "step": 14705 }, { "epoch": 0.4, "learning_rate": 0.0013783570222793905, "loss": 2.5188, "step": 14706 }, { "epoch": 0.4, "learning_rate": 0.0013782764521685538, "loss": 2.898, "step": 14707 }, { "epoch": 0.4, "learning_rate": 0.0013781958791919625, "loss": 2.6833, "step": 14708 }, { "epoch": 0.4, "learning_rate": 0.0013781153033502267, "loss": 2.5294, "step": 14709 }, { "epoch": 0.4, "learning_rate": 0.0013780347246439568, "loss": 2.7771, "step": 14710 }, { "epoch": 0.4, "learning_rate": 0.0013779541430737636, "loss": 2.5948, "step": 14711 }, { "epoch": 0.4, "learning_rate": 0.0013778735586402575, "loss": 2.1812, "step": 14712 }, { "epoch": 0.4, "learning_rate": 0.001377792971344049, "loss": 2.3809, "step": 14713 }, { "epoch": 0.4, "learning_rate": 0.0013777123811857478, "loss": 2.5351, "step": 14714 }, { "epoch": 0.4, "learning_rate": 0.0013776317881659657, "loss": 2.3538, "step": 14715 }, { "epoch": 0.4, "learning_rate": 0.0013775511922853125, "loss": 1.9366, "step": 14716 }, { "epoch": 0.4, "learning_rate": 0.001377470593544399, "loss": 2.2325, "step": 14717 }, { "epoch": 0.4, "learning_rate": 0.0013773899919438358, "loss": 2.3383, "step": 14718 }, { "epoch": 0.4, "learning_rate": 0.0013773093874842335, "loss": 2.5379, "step": 14719 }, { "epoch": 0.4, "learning_rate": 0.0013772287801662026, "loss": 2.6965, "step": 14720 }, { "epoch": 0.4, "learning_rate": 0.0013771481699903542, "loss": 2.628, "step": 14721 }, { "epoch": 0.4, "learning_rate": 0.0013770675569572983, "loss": 2.7877, "step": 14722 }, { "epoch": 0.4, "learning_rate": 0.0013769869410676463, "loss": 2.6993, "step": 14723 }, { "epoch": 0.4, "learning_rate": 0.0013769063223220085, "loss": 2.5079, "step": 14724 }, { "epoch": 0.4, "learning_rate": 0.001376825700720996, "loss": 2.721, "step": 14725 }, { "epoch": 0.4, "learning_rate": 0.001376745076265219, "loss": 2.6379, "step": 14726 }, { "epoch": 0.4, "learning_rate": 0.0013766644489552888, "loss": 2.6828, "step": 14727 }, { "epoch": 0.4, "learning_rate": 0.0013765838187918163, "loss": 2.969, "step": 14728 }, { "epoch": 0.4, "learning_rate": 0.001376503185775412, "loss": 2.5459, "step": 14729 }, { "epoch": 0.4, "learning_rate": 0.0013764225499066868, "loss": 2.0982, "step": 14730 }, { "epoch": 0.4, "learning_rate": 0.0013763419111862513, "loss": 2.8002, "step": 14731 }, { "epoch": 0.4, "learning_rate": 0.0013762612696147174, "loss": 2.8753, "step": 14732 }, { "epoch": 0.4, "learning_rate": 0.001376180625192695, "loss": 2.7145, "step": 14733 }, { "epoch": 0.4, "learning_rate": 0.0013760999779207955, "loss": 2.6066, "step": 14734 }, { "epoch": 0.4, "learning_rate": 0.00137601932779963, "loss": 2.2727, "step": 14735 }, { "epoch": 0.4, "learning_rate": 0.0013759386748298094, "loss": 2.5735, "step": 14736 }, { "epoch": 0.4, "learning_rate": 0.001375858019011944, "loss": 2.4772, "step": 14737 }, { "epoch": 0.4, "learning_rate": 0.0013757773603466459, "loss": 2.6107, "step": 14738 }, { "epoch": 0.4, "learning_rate": 0.0013756966988345257, "loss": 2.7423, "step": 14739 }, { "epoch": 0.4, "learning_rate": 0.0013756160344761943, "loss": 2.2596, "step": 14740 }, { "epoch": 0.4, "learning_rate": 0.001375535367272263, "loss": 2.5918, "step": 14741 }, { "epoch": 0.4, "learning_rate": 0.001375454697223343, "loss": 2.4719, "step": 14742 }, { "epoch": 0.4, "learning_rate": 0.0013753740243300455, "loss": 2.3325, "step": 14743 }, { "epoch": 0.4, "learning_rate": 0.0013752933485929812, "loss": 2.55, "step": 14744 }, { "epoch": 0.4, "learning_rate": 0.0013752126700127616, "loss": 2.5772, "step": 14745 }, { "epoch": 0.4, "learning_rate": 0.0013751319885899982, "loss": 2.5423, "step": 14746 }, { "epoch": 0.4, "learning_rate": 0.0013750513043253015, "loss": 2.4894, "step": 14747 }, { "epoch": 0.4, "learning_rate": 0.0013749706172192836, "loss": 2.4236, "step": 14748 }, { "epoch": 0.4, "learning_rate": 0.001374889927272555, "loss": 2.6521, "step": 14749 }, { "epoch": 0.4, "learning_rate": 0.0013748092344857275, "loss": 2.7073, "step": 14750 }, { "epoch": 0.4, "learning_rate": 0.0013747285388594121, "loss": 2.7989, "step": 14751 }, { "epoch": 0.4, "learning_rate": 0.0013746478403942207, "loss": 2.675, "step": 14752 }, { "epoch": 0.4, "learning_rate": 0.0013745671390907638, "loss": 2.7107, "step": 14753 }, { "epoch": 0.4, "learning_rate": 0.0013744864349496534, "loss": 2.9888, "step": 14754 }, { "epoch": 0.4, "learning_rate": 0.0013744057279715008, "loss": 3.093, "step": 14755 }, { "epoch": 0.4, "learning_rate": 0.0013743250181569172, "loss": 2.7587, "step": 14756 }, { "epoch": 0.4, "learning_rate": 0.001374244305506514, "loss": 2.4917, "step": 14757 }, { "epoch": 0.4, "learning_rate": 0.001374163590020903, "loss": 2.4216, "step": 14758 }, { "epoch": 0.4, "learning_rate": 0.001374082871700696, "loss": 2.5779, "step": 14759 }, { "epoch": 0.4, "learning_rate": 0.0013740021505465035, "loss": 2.1794, "step": 14760 }, { "epoch": 0.4, "learning_rate": 0.0013739214265589374, "loss": 2.8238, "step": 14761 }, { "epoch": 0.4, "learning_rate": 0.00137384069973861, "loss": 2.5469, "step": 14762 }, { "epoch": 0.4, "learning_rate": 0.0013737599700861319, "loss": 3.0287, "step": 14763 }, { "epoch": 0.4, "learning_rate": 0.0013736792376021155, "loss": 2.2006, "step": 14764 }, { "epoch": 0.4, "learning_rate": 0.0013735985022871715, "loss": 2.7428, "step": 14765 }, { "epoch": 0.4, "learning_rate": 0.0013735177641419124, "loss": 2.8034, "step": 14766 }, { "epoch": 0.4, "learning_rate": 0.0013734370231669494, "loss": 2.3074, "step": 14767 }, { "epoch": 0.4, "learning_rate": 0.0013733562793628942, "loss": 2.557, "step": 14768 }, { "epoch": 0.4, "learning_rate": 0.0013732755327303585, "loss": 2.5388, "step": 14769 }, { "epoch": 0.4, "learning_rate": 0.001373194783269954, "loss": 2.1107, "step": 14770 }, { "epoch": 0.4, "learning_rate": 0.0013731140309822928, "loss": 2.4784, "step": 14771 }, { "epoch": 0.4, "learning_rate": 0.0013730332758679867, "loss": 2.2226, "step": 14772 }, { "epoch": 0.4, "learning_rate": 0.0013729525179276465, "loss": 2.5845, "step": 14773 }, { "epoch": 0.4, "learning_rate": 0.0013728717571618852, "loss": 2.4803, "step": 14774 }, { "epoch": 0.4, "learning_rate": 0.0013727909935713142, "loss": 2.5545, "step": 14775 }, { "epoch": 0.4, "learning_rate": 0.001372710227156545, "loss": 2.8243, "step": 14776 }, { "epoch": 0.4, "learning_rate": 0.0013726294579181897, "loss": 2.8419, "step": 14777 }, { "epoch": 0.4, "learning_rate": 0.0013725486858568606, "loss": 2.9185, "step": 14778 }, { "epoch": 0.4, "learning_rate": 0.0013724679109731691, "loss": 2.4332, "step": 14779 }, { "epoch": 0.4, "learning_rate": 0.0013723871332677268, "loss": 2.7733, "step": 14780 }, { "epoch": 0.4, "learning_rate": 0.0013723063527411468, "loss": 2.6288, "step": 14781 }, { "epoch": 0.4, "learning_rate": 0.0013722255693940405, "loss": 2.4319, "step": 14782 }, { "epoch": 0.4, "learning_rate": 0.0013721447832270193, "loss": 2.5765, "step": 14783 }, { "epoch": 0.4, "learning_rate": 0.0013720639942406958, "loss": 3.0749, "step": 14784 }, { "epoch": 0.4, "learning_rate": 0.0013719832024356824, "loss": 2.7389, "step": 14785 }, { "epoch": 0.4, "learning_rate": 0.0013719024078125905, "loss": 2.5349, "step": 14786 }, { "epoch": 0.4, "learning_rate": 0.0013718216103720327, "loss": 2.5327, "step": 14787 }, { "epoch": 0.4, "learning_rate": 0.0013717408101146208, "loss": 2.4495, "step": 14788 }, { "epoch": 0.4, "learning_rate": 0.0013716600070409668, "loss": 2.6291, "step": 14789 }, { "epoch": 0.4, "learning_rate": 0.001371579201151683, "loss": 2.6655, "step": 14790 }, { "epoch": 0.4, "learning_rate": 0.0013714983924473817, "loss": 2.6245, "step": 14791 }, { "epoch": 0.4, "learning_rate": 0.0013714175809286752, "loss": 2.1325, "step": 14792 }, { "epoch": 0.4, "learning_rate": 0.001371336766596175, "loss": 2.4541, "step": 14793 }, { "epoch": 0.4, "learning_rate": 0.0013712559494504944, "loss": 2.3699, "step": 14794 }, { "epoch": 0.4, "learning_rate": 0.0013711751294922447, "loss": 2.5013, "step": 14795 }, { "epoch": 0.4, "learning_rate": 0.0013710943067220386, "loss": 2.536, "step": 14796 }, { "epoch": 0.4, "learning_rate": 0.0013710134811404887, "loss": 2.6842, "step": 14797 }, { "epoch": 0.4, "learning_rate": 0.0013709326527482069, "loss": 2.6395, "step": 14798 }, { "epoch": 0.4, "learning_rate": 0.0013708518215458053, "loss": 2.4774, "step": 14799 }, { "epoch": 0.4, "learning_rate": 0.0013707709875338968, "loss": 2.0006, "step": 14800 }, { "epoch": 0.4, "learning_rate": 0.0013706901507130938, "loss": 2.695, "step": 14801 }, { "epoch": 0.4, "learning_rate": 0.0013706093110840082, "loss": 2.9665, "step": 14802 }, { "epoch": 0.4, "learning_rate": 0.001370528468647253, "loss": 2.8141, "step": 14803 }, { "epoch": 0.4, "learning_rate": 0.0013704476234034399, "loss": 3.0124, "step": 14804 }, { "epoch": 0.4, "learning_rate": 0.0013703667753531823, "loss": 2.5423, "step": 14805 }, { "epoch": 0.4, "learning_rate": 0.0013702859244970921, "loss": 2.9538, "step": 14806 }, { "epoch": 0.4, "learning_rate": 0.0013702050708357821, "loss": 1.9931, "step": 14807 }, { "epoch": 0.4, "learning_rate": 0.0013701242143698642, "loss": 2.2074, "step": 14808 }, { "epoch": 0.4, "learning_rate": 0.001370043355099952, "loss": 2.4855, "step": 14809 }, { "epoch": 0.4, "learning_rate": 0.001369962493026657, "loss": 2.3962, "step": 14810 }, { "epoch": 0.4, "learning_rate": 0.0013698816281505924, "loss": 2.8591, "step": 14811 }, { "epoch": 0.4, "learning_rate": 0.001369800760472371, "loss": 2.7181, "step": 14812 }, { "epoch": 0.4, "learning_rate": 0.001369719889992605, "loss": 2.6096, "step": 14813 }, { "epoch": 0.4, "learning_rate": 0.0013696390167119072, "loss": 2.5569, "step": 14814 }, { "epoch": 0.4, "learning_rate": 0.00136955814063089, "loss": 2.6541, "step": 14815 }, { "epoch": 0.4, "learning_rate": 0.0013694772617501667, "loss": 2.1876, "step": 14816 }, { "epoch": 0.4, "learning_rate": 0.00136939638007035, "loss": 2.9033, "step": 14817 }, { "epoch": 0.4, "learning_rate": 0.0013693154955920518, "loss": 2.5783, "step": 14818 }, { "epoch": 0.4, "learning_rate": 0.0013692346083158857, "loss": 2.6666, "step": 14819 }, { "epoch": 0.4, "learning_rate": 0.0013691537182424643, "loss": 2.595, "step": 14820 }, { "epoch": 0.4, "learning_rate": 0.0013690728253724002, "loss": 2.5816, "step": 14821 }, { "epoch": 0.4, "learning_rate": 0.0013689919297063065, "loss": 2.5213, "step": 14822 }, { "epoch": 0.4, "learning_rate": 0.0013689110312447956, "loss": 2.7531, "step": 14823 }, { "epoch": 0.4, "learning_rate": 0.0013688301299884808, "loss": 2.2574, "step": 14824 }, { "epoch": 0.4, "learning_rate": 0.0013687492259379752, "loss": 2.6195, "step": 14825 }, { "epoch": 0.4, "learning_rate": 0.001368668319093891, "loss": 2.5435, "step": 14826 }, { "epoch": 0.4, "learning_rate": 0.0013685874094568418, "loss": 2.5697, "step": 14827 }, { "epoch": 0.4, "learning_rate": 0.00136850649702744, "loss": 2.7142, "step": 14828 }, { "epoch": 0.4, "learning_rate": 0.0013684255818062993, "loss": 2.7077, "step": 14829 }, { "epoch": 0.4, "learning_rate": 0.001368344663794032, "loss": 2.4695, "step": 14830 }, { "epoch": 0.4, "learning_rate": 0.0013682637429912512, "loss": 2.1633, "step": 14831 }, { "epoch": 0.4, "learning_rate": 0.0013681828193985704, "loss": 2.5646, "step": 14832 }, { "epoch": 0.4, "learning_rate": 0.0013681018930166023, "loss": 2.7299, "step": 14833 }, { "epoch": 0.4, "learning_rate": 0.00136802096384596, "loss": 2.3315, "step": 14834 }, { "epoch": 0.4, "learning_rate": 0.0013679400318872567, "loss": 2.5062, "step": 14835 }, { "epoch": 0.4, "learning_rate": 0.0013678590971411056, "loss": 2.5514, "step": 14836 }, { "epoch": 0.4, "learning_rate": 0.0013677781596081195, "loss": 2.7397, "step": 14837 }, { "epoch": 0.4, "learning_rate": 0.001367697219288912, "loss": 2.7807, "step": 14838 }, { "epoch": 0.4, "learning_rate": 0.001367616276184096, "loss": 2.5954, "step": 14839 }, { "epoch": 0.4, "learning_rate": 0.001367535330294285, "loss": 2.3412, "step": 14840 }, { "epoch": 0.4, "learning_rate": 0.001367454381620092, "loss": 2.7136, "step": 14841 }, { "epoch": 0.4, "learning_rate": 0.0013673734301621302, "loss": 2.4771, "step": 14842 }, { "epoch": 0.4, "learning_rate": 0.001367292475921013, "loss": 2.8231, "step": 14843 }, { "epoch": 0.4, "learning_rate": 0.0013672115188973538, "loss": 2.4613, "step": 14844 }, { "epoch": 0.4, "learning_rate": 0.0013671305590917658, "loss": 2.7452, "step": 14845 }, { "epoch": 0.4, "learning_rate": 0.0013670495965048622, "loss": 2.7659, "step": 14846 }, { "epoch": 0.4, "learning_rate": 0.0013669686311372563, "loss": 2.4819, "step": 14847 }, { "epoch": 0.4, "learning_rate": 0.001366887662989562, "loss": 2.7116, "step": 14848 }, { "epoch": 0.4, "learning_rate": 0.0013668066920623921, "loss": 2.5187, "step": 14849 }, { "epoch": 0.4, "learning_rate": 0.0013667257183563601, "loss": 2.5644, "step": 14850 }, { "epoch": 0.4, "learning_rate": 0.0013666447418720802, "loss": 2.4061, "step": 14851 }, { "epoch": 0.4, "learning_rate": 0.0013665637626101648, "loss": 2.68, "step": 14852 }, { "epoch": 0.4, "learning_rate": 0.0013664827805712281, "loss": 2.5311, "step": 14853 }, { "epoch": 0.4, "learning_rate": 0.0013664017957558832, "loss": 2.5955, "step": 14854 }, { "epoch": 0.4, "learning_rate": 0.001366320808164744, "loss": 2.5987, "step": 14855 }, { "epoch": 0.4, "learning_rate": 0.0013662398177984238, "loss": 2.6774, "step": 14856 }, { "epoch": 0.4, "learning_rate": 0.0013661588246575362, "loss": 2.2953, "step": 14857 }, { "epoch": 0.4, "learning_rate": 0.0013660778287426947, "loss": 2.3654, "step": 14858 }, { "epoch": 0.4, "learning_rate": 0.0013659968300545132, "loss": 2.2835, "step": 14859 }, { "epoch": 0.4, "learning_rate": 0.001365915828593605, "loss": 2.2362, "step": 14860 }, { "epoch": 0.4, "learning_rate": 0.0013658348243605844, "loss": 2.7269, "step": 14861 }, { "epoch": 0.4, "learning_rate": 0.001365753817356064, "loss": 2.5355, "step": 14862 }, { "epoch": 0.4, "learning_rate": 0.001365672807580658, "loss": 2.3993, "step": 14863 }, { "epoch": 0.4, "learning_rate": 0.0013655917950349805, "loss": 2.2858, "step": 14864 }, { "epoch": 0.4, "learning_rate": 0.0013655107797196447, "loss": 2.0147, "step": 14865 }, { "epoch": 0.4, "learning_rate": 0.0013654297616352647, "loss": 2.34, "step": 14866 }, { "epoch": 0.4, "learning_rate": 0.0013653487407824542, "loss": 2.376, "step": 14867 }, { "epoch": 0.4, "learning_rate": 0.001365267717161827, "loss": 2.6759, "step": 14868 }, { "epoch": 0.4, "learning_rate": 0.0013651866907739966, "loss": 2.7483, "step": 14869 }, { "epoch": 0.4, "learning_rate": 0.0013651056616195774, "loss": 2.4425, "step": 14870 }, { "epoch": 0.4, "learning_rate": 0.001365024629699183, "loss": 2.2351, "step": 14871 }, { "epoch": 0.4, "learning_rate": 0.001364943595013427, "loss": 2.5833, "step": 14872 }, { "epoch": 0.4, "learning_rate": 0.0013648625575629239, "loss": 2.7628, "step": 14873 }, { "epoch": 0.4, "learning_rate": 0.001364781517348287, "loss": 2.3527, "step": 14874 }, { "epoch": 0.4, "learning_rate": 0.0013647004743701308, "loss": 2.373, "step": 14875 }, { "epoch": 0.4, "learning_rate": 0.001364619428629069, "loss": 2.68, "step": 14876 }, { "epoch": 0.4, "learning_rate": 0.0013645383801257154, "loss": 2.503, "step": 14877 }, { "epoch": 0.4, "learning_rate": 0.0013644573288606843, "loss": 2.5709, "step": 14878 }, { "epoch": 0.4, "learning_rate": 0.0013643762748345894, "loss": 2.2849, "step": 14879 }, { "epoch": 0.4, "learning_rate": 0.0013642952180480455, "loss": 2.3795, "step": 14880 }, { "epoch": 0.4, "learning_rate": 0.0013642141585016659, "loss": 2.9003, "step": 14881 }, { "epoch": 0.4, "learning_rate": 0.0013641330961960648, "loss": 2.3215, "step": 14882 }, { "epoch": 0.4, "learning_rate": 0.0013640520311318566, "loss": 2.3389, "step": 14883 }, { "epoch": 0.4, "learning_rate": 0.0013639709633096553, "loss": 2.7185, "step": 14884 }, { "epoch": 0.4, "learning_rate": 0.0013638898927300748, "loss": 2.9725, "step": 14885 }, { "epoch": 0.4, "learning_rate": 0.00136380881939373, "loss": 2.6894, "step": 14886 }, { "epoch": 0.4, "learning_rate": 0.0013637277433012343, "loss": 2.6185, "step": 14887 }, { "epoch": 0.4, "learning_rate": 0.0013636466644532024, "loss": 2.5265, "step": 14888 }, { "epoch": 0.4, "learning_rate": 0.001363565582850248, "loss": 2.6597, "step": 14889 }, { "epoch": 0.4, "learning_rate": 0.0013634844984929861, "loss": 2.5586, "step": 14890 }, { "epoch": 0.4, "learning_rate": 0.0013634034113820309, "loss": 2.2603, "step": 14891 }, { "epoch": 0.4, "learning_rate": 0.001363322321517996, "loss": 2.5571, "step": 14892 }, { "epoch": 0.4, "learning_rate": 0.0013632412289014961, "loss": 2.7226, "step": 14893 }, { "epoch": 0.4, "learning_rate": 0.001363160133533146, "loss": 2.2517, "step": 14894 }, { "epoch": 0.4, "learning_rate": 0.0013630790354135591, "loss": 2.6331, "step": 14895 }, { "epoch": 0.4, "learning_rate": 0.001362997934543351, "loss": 2.769, "step": 14896 }, { "epoch": 0.4, "learning_rate": 0.001362916830923135, "loss": 2.3224, "step": 14897 }, { "epoch": 0.4, "learning_rate": 0.001362835724553526, "loss": 2.5541, "step": 14898 }, { "epoch": 0.4, "learning_rate": 0.0013627546154351385, "loss": 2.6118, "step": 14899 }, { "epoch": 0.4, "learning_rate": 0.0013626735035685868, "loss": 2.5241, "step": 14900 }, { "epoch": 0.4, "learning_rate": 0.0013625923889544855, "loss": 2.8411, "step": 14901 }, { "epoch": 0.4, "learning_rate": 0.0013625112715934492, "loss": 2.6372, "step": 14902 }, { "epoch": 0.4, "learning_rate": 0.0013624301514860923, "loss": 2.2988, "step": 14903 }, { "epoch": 0.4, "learning_rate": 0.0013623490286330294, "loss": 2.7155, "step": 14904 }, { "epoch": 0.4, "learning_rate": 0.0013622679030348749, "loss": 2.3558, "step": 14905 }, { "epoch": 0.4, "learning_rate": 0.0013621867746922436, "loss": 2.627, "step": 14906 }, { "epoch": 0.4, "learning_rate": 0.0013621056436057502, "loss": 2.4441, "step": 14907 }, { "epoch": 0.4, "learning_rate": 0.0013620245097760088, "loss": 2.5607, "step": 14908 }, { "epoch": 0.4, "learning_rate": 0.0013619433732036347, "loss": 2.1896, "step": 14909 }, { "epoch": 0.4, "learning_rate": 0.0013618622338892423, "loss": 2.4575, "step": 14910 }, { "epoch": 0.4, "learning_rate": 0.0013617810918334463, "loss": 2.7724, "step": 14911 }, { "epoch": 0.4, "learning_rate": 0.0013616999470368613, "loss": 2.7624, "step": 14912 }, { "epoch": 0.4, "learning_rate": 0.0013616187995001024, "loss": 2.4582, "step": 14913 }, { "epoch": 0.4, "learning_rate": 0.001361537649223784, "loss": 2.5509, "step": 14914 }, { "epoch": 0.4, "learning_rate": 0.001361456496208521, "loss": 2.3815, "step": 14915 }, { "epoch": 0.4, "learning_rate": 0.0013613753404549283, "loss": 2.5286, "step": 14916 }, { "epoch": 0.4, "learning_rate": 0.0013612941819636205, "loss": 2.3232, "step": 14917 }, { "epoch": 0.4, "learning_rate": 0.0013612130207352124, "loss": 2.4447, "step": 14918 }, { "epoch": 0.4, "learning_rate": 0.0013611318567703194, "loss": 2.652, "step": 14919 }, { "epoch": 0.4, "learning_rate": 0.0013610506900695561, "loss": 2.4446, "step": 14920 }, { "epoch": 0.4, "learning_rate": 0.001360969520633537, "loss": 2.9968, "step": 14921 }, { "epoch": 0.4, "learning_rate": 0.0013608883484628772, "loss": 2.1391, "step": 14922 }, { "epoch": 0.4, "learning_rate": 0.0013608071735581925, "loss": 2.8291, "step": 14923 }, { "epoch": 0.4, "learning_rate": 0.0013607259959200963, "loss": 2.5077, "step": 14924 }, { "epoch": 0.4, "learning_rate": 0.0013606448155492048, "loss": 2.5745, "step": 14925 }, { "epoch": 0.4, "learning_rate": 0.0013605636324461328, "loss": 2.8181, "step": 14926 }, { "epoch": 0.4, "learning_rate": 0.0013604824466114953, "loss": 2.2486, "step": 14927 }, { "epoch": 0.4, "learning_rate": 0.001360401258045907, "loss": 3.0674, "step": 14928 }, { "epoch": 0.4, "learning_rate": 0.001360320066749983, "loss": 2.692, "step": 14929 }, { "epoch": 0.4, "learning_rate": 0.001360238872724339, "loss": 2.4293, "step": 14930 }, { "epoch": 0.4, "learning_rate": 0.0013601576759695892, "loss": 2.6245, "step": 14931 }, { "epoch": 0.4, "learning_rate": 0.0013600764764863497, "loss": 2.6024, "step": 14932 }, { "epoch": 0.4, "learning_rate": 0.001359995274275235, "loss": 2.5662, "step": 14933 }, { "epoch": 0.4, "learning_rate": 0.0013599140693368607, "loss": 2.4216, "step": 14934 }, { "epoch": 0.4, "learning_rate": 0.0013598328616718414, "loss": 2.719, "step": 14935 }, { "epoch": 0.4, "learning_rate": 0.0013597516512807927, "loss": 2.7392, "step": 14936 }, { "epoch": 0.4, "learning_rate": 0.00135967043816433, "loss": 2.7129, "step": 14937 }, { "epoch": 0.4, "learning_rate": 0.0013595892223230684, "loss": 2.3621, "step": 14938 }, { "epoch": 0.4, "learning_rate": 0.001359508003757623, "loss": 2.4804, "step": 14939 }, { "epoch": 0.4, "learning_rate": 0.0013594267824686096, "loss": 2.4011, "step": 14940 }, { "epoch": 0.4, "learning_rate": 0.0013593455584566428, "loss": 2.4902, "step": 14941 }, { "epoch": 0.4, "learning_rate": 0.0013592643317223382, "loss": 2.6581, "step": 14942 }, { "epoch": 0.4, "learning_rate": 0.0013591831022663114, "loss": 2.5641, "step": 14943 }, { "epoch": 0.4, "learning_rate": 0.0013591018700891775, "loss": 2.4533, "step": 14944 }, { "epoch": 0.4, "learning_rate": 0.0013590206351915522, "loss": 2.1509, "step": 14945 }, { "epoch": 0.4, "learning_rate": 0.001358939397574051, "loss": 2.9588, "step": 14946 }, { "epoch": 0.4, "learning_rate": 0.0013588581572372886, "loss": 2.3612, "step": 14947 }, { "epoch": 0.4, "learning_rate": 0.0013587769141818811, "loss": 2.3149, "step": 14948 }, { "epoch": 0.4, "learning_rate": 0.0013586956684084439, "loss": 2.2265, "step": 14949 }, { "epoch": 0.4, "learning_rate": 0.0013586144199175924, "loss": 2.2841, "step": 14950 }, { "epoch": 0.4, "learning_rate": 0.0013585331687099422, "loss": 2.5342, "step": 14951 }, { "epoch": 0.4, "learning_rate": 0.0013584519147861087, "loss": 2.365, "step": 14952 }, { "epoch": 0.4, "learning_rate": 0.001358370658146708, "loss": 2.6009, "step": 14953 }, { "epoch": 0.4, "learning_rate": 0.001358289398792355, "loss": 2.7044, "step": 14954 }, { "epoch": 0.4, "learning_rate": 0.0013582081367236657, "loss": 2.6623, "step": 14955 }, { "epoch": 0.4, "learning_rate": 0.0013581268719412552, "loss": 2.866, "step": 14956 }, { "epoch": 0.4, "learning_rate": 0.00135804560444574, "loss": 2.801, "step": 14957 }, { "epoch": 0.4, "learning_rate": 0.0013579643342377348, "loss": 2.6407, "step": 14958 }, { "epoch": 0.4, "learning_rate": 0.0013578830613178562, "loss": 2.3696, "step": 14959 }, { "epoch": 0.4, "learning_rate": 0.0013578017856867195, "loss": 2.3864, "step": 14960 }, { "epoch": 0.4, "learning_rate": 0.0013577205073449403, "loss": 2.4907, "step": 14961 }, { "epoch": 0.4, "learning_rate": 0.0013576392262931345, "loss": 2.4416, "step": 14962 }, { "epoch": 0.4, "learning_rate": 0.0013575579425319179, "loss": 2.4008, "step": 14963 }, { "epoch": 0.4, "learning_rate": 0.0013574766560619062, "loss": 2.4551, "step": 14964 }, { "epoch": 0.4, "learning_rate": 0.0013573953668837154, "loss": 2.2565, "step": 14965 }, { "epoch": 0.4, "learning_rate": 0.0013573140749979613, "loss": 2.6899, "step": 14966 }, { "epoch": 0.4, "learning_rate": 0.0013572327804052594, "loss": 2.1736, "step": 14967 }, { "epoch": 0.4, "learning_rate": 0.0013571514831062256, "loss": 2.3431, "step": 14968 }, { "epoch": 0.4, "learning_rate": 0.0013570701831014764, "loss": 2.6279, "step": 14969 }, { "epoch": 0.4, "learning_rate": 0.0013569888803916274, "loss": 2.6367, "step": 14970 }, { "epoch": 0.4, "learning_rate": 0.0013569075749772944, "loss": 2.6453, "step": 14971 }, { "epoch": 0.4, "learning_rate": 0.0013568262668590932, "loss": 2.5376, "step": 14972 }, { "epoch": 0.4, "learning_rate": 0.0013567449560376401, "loss": 2.3453, "step": 14973 }, { "epoch": 0.4, "learning_rate": 0.001356663642513551, "loss": 2.4334, "step": 14974 }, { "epoch": 0.4, "learning_rate": 0.001356582326287442, "loss": 2.1006, "step": 14975 }, { "epoch": 0.4, "learning_rate": 0.0013565010073599288, "loss": 2.2413, "step": 14976 }, { "epoch": 0.4, "learning_rate": 0.0013564196857316281, "loss": 2.0071, "step": 14977 }, { "epoch": 0.4, "learning_rate": 0.0013563383614031556, "loss": 2.2091, "step": 14978 }, { "epoch": 0.4, "learning_rate": 0.001356257034375127, "loss": 2.4129, "step": 14979 }, { "epoch": 0.4, "learning_rate": 0.0013561757046481589, "loss": 2.4748, "step": 14980 }, { "epoch": 0.4, "learning_rate": 0.0013560943722228673, "loss": 2.2953, "step": 14981 }, { "epoch": 0.4, "learning_rate": 0.0013560130370998684, "loss": 2.9288, "step": 14982 }, { "epoch": 0.4, "learning_rate": 0.0013559316992797785, "loss": 2.4612, "step": 14983 }, { "epoch": 0.4, "learning_rate": 0.0013558503587632138, "loss": 2.5725, "step": 14984 }, { "epoch": 0.4, "learning_rate": 0.00135576901555079, "loss": 2.8606, "step": 14985 }, { "epoch": 0.4, "learning_rate": 0.001355687669643124, "loss": 2.783, "step": 14986 }, { "epoch": 0.4, "learning_rate": 0.001355606321040832, "loss": 2.9031, "step": 14987 }, { "epoch": 0.4, "learning_rate": 0.0013555249697445298, "loss": 2.5319, "step": 14988 }, { "epoch": 0.4, "learning_rate": 0.0013554436157548343, "loss": 2.6389, "step": 14989 }, { "epoch": 0.4, "learning_rate": 0.0013553622590723614, "loss": 2.448, "step": 14990 }, { "epoch": 0.4, "learning_rate": 0.001355280899697727, "loss": 2.779, "step": 14991 }, { "epoch": 0.4, "learning_rate": 0.0013551995376315487, "loss": 2.5782, "step": 14992 }, { "epoch": 0.4, "learning_rate": 0.001355118172874442, "loss": 2.7712, "step": 14993 }, { "epoch": 0.4, "learning_rate": 0.0013550368054270235, "loss": 2.5541, "step": 14994 }, { "epoch": 0.4, "learning_rate": 0.0013549554352899093, "loss": 2.5562, "step": 14995 }, { "epoch": 0.4, "learning_rate": 0.0013548740624637168, "loss": 2.4977, "step": 14996 }, { "epoch": 0.4, "learning_rate": 0.0013547926869490615, "loss": 2.2931, "step": 14997 }, { "epoch": 0.4, "learning_rate": 0.0013547113087465602, "loss": 2.8955, "step": 14998 }, { "epoch": 0.4, "learning_rate": 0.0013546299278568298, "loss": 2.4769, "step": 14999 }, { "epoch": 0.4, "learning_rate": 0.001354548544280486, "loss": 2.498, "step": 15000 }, { "epoch": 0.4, "learning_rate": 0.001354467158018146, "loss": 2.2355, "step": 15001 }, { "epoch": 0.4, "learning_rate": 0.0013543857690704263, "loss": 2.087, "step": 15002 }, { "epoch": 0.4, "learning_rate": 0.001354304377437943, "loss": 2.6106, "step": 15003 }, { "epoch": 0.4, "learning_rate": 0.0013542229831213135, "loss": 2.8992, "step": 15004 }, { "epoch": 0.4, "learning_rate": 0.001354141586121154, "loss": 2.6873, "step": 15005 }, { "epoch": 0.4, "learning_rate": 0.0013540601864380807, "loss": 2.7311, "step": 15006 }, { "epoch": 0.4, "learning_rate": 0.0013539787840727113, "loss": 2.263, "step": 15007 }, { "epoch": 0.4, "learning_rate": 0.0013538973790256617, "loss": 2.2682, "step": 15008 }, { "epoch": 0.4, "learning_rate": 0.0013538159712975489, "loss": 2.4627, "step": 15009 }, { "epoch": 0.4, "learning_rate": 0.0013537345608889892, "loss": 2.575, "step": 15010 }, { "epoch": 0.4, "learning_rate": 0.0013536531478006, "loss": 2.4392, "step": 15011 }, { "epoch": 0.4, "learning_rate": 0.0013535717320329978, "loss": 3.0943, "step": 15012 }, { "epoch": 0.4, "learning_rate": 0.0013534903135867995, "loss": 2.3045, "step": 15013 }, { "epoch": 0.4, "learning_rate": 0.0013534088924626211, "loss": 2.6443, "step": 15014 }, { "epoch": 0.4, "learning_rate": 0.0013533274686610807, "loss": 2.598, "step": 15015 }, { "epoch": 0.4, "learning_rate": 0.0013532460421827948, "loss": 2.5445, "step": 15016 }, { "epoch": 0.4, "learning_rate": 0.0013531646130283796, "loss": 2.7767, "step": 15017 }, { "epoch": 0.4, "learning_rate": 0.0013530831811984524, "loss": 2.7386, "step": 15018 }, { "epoch": 0.4, "learning_rate": 0.0013530017466936305, "loss": 2.7539, "step": 15019 }, { "epoch": 0.4, "learning_rate": 0.0013529203095145304, "loss": 2.7627, "step": 15020 }, { "epoch": 0.4, "learning_rate": 0.001352838869661769, "loss": 2.6486, "step": 15021 }, { "epoch": 0.4, "learning_rate": 0.001352757427135963, "loss": 2.7873, "step": 15022 }, { "epoch": 0.4, "learning_rate": 0.0013526759819377304, "loss": 2.2208, "step": 15023 }, { "epoch": 0.4, "learning_rate": 0.0013525945340676874, "loss": 2.5963, "step": 15024 }, { "epoch": 0.4, "learning_rate": 0.0013525130835264514, "loss": 2.4797, "step": 15025 }, { "epoch": 0.4, "learning_rate": 0.0013524316303146389, "loss": 2.569, "step": 15026 }, { "epoch": 0.4, "learning_rate": 0.0013523501744328677, "loss": 2.7048, "step": 15027 }, { "epoch": 0.4, "learning_rate": 0.0013522687158817547, "loss": 2.4812, "step": 15028 }, { "epoch": 0.4, "learning_rate": 0.0013521872546619167, "loss": 2.8336, "step": 15029 }, { "epoch": 0.4, "learning_rate": 0.001352105790773971, "loss": 2.9007, "step": 15030 }, { "epoch": 0.4, "learning_rate": 0.0013520243242185347, "loss": 2.7756, "step": 15031 }, { "epoch": 0.4, "learning_rate": 0.0013519428549962252, "loss": 2.3608, "step": 15032 }, { "epoch": 0.4, "learning_rate": 0.0013518613831076597, "loss": 2.3384, "step": 15033 }, { "epoch": 0.4, "learning_rate": 0.0013517799085534547, "loss": 2.5044, "step": 15034 }, { "epoch": 0.4, "learning_rate": 0.0013516984313342287, "loss": 2.4225, "step": 15035 }, { "epoch": 0.4, "learning_rate": 0.001351616951450598, "loss": 2.8001, "step": 15036 }, { "epoch": 0.4, "learning_rate": 0.00135153546890318, "loss": 2.1456, "step": 15037 }, { "epoch": 0.4, "learning_rate": 0.001351453983692592, "loss": 2.3046, "step": 15038 }, { "epoch": 0.4, "learning_rate": 0.0013513724958194517, "loss": 2.847, "step": 15039 }, { "epoch": 0.4, "learning_rate": 0.0013512910052843764, "loss": 2.8221, "step": 15040 }, { "epoch": 0.4, "learning_rate": 0.0013512095120879828, "loss": 2.2891, "step": 15041 }, { "epoch": 0.4, "learning_rate": 0.001351128016230889, "loss": 2.0143, "step": 15042 }, { "epoch": 0.4, "learning_rate": 0.001351046517713712, "loss": 2.6583, "step": 15043 }, { "epoch": 0.4, "learning_rate": 0.0013509650165370694, "loss": 2.6169, "step": 15044 }, { "epoch": 0.4, "learning_rate": 0.0013508835127015787, "loss": 2.4097, "step": 15045 }, { "epoch": 0.4, "learning_rate": 0.0013508020062078573, "loss": 2.331, "step": 15046 }, { "epoch": 0.4, "learning_rate": 0.0013507204970565224, "loss": 3.0481, "step": 15047 }, { "epoch": 0.4, "learning_rate": 0.0013506389852481918, "loss": 2.6503, "step": 15048 }, { "epoch": 0.4, "learning_rate": 0.0013505574707834826, "loss": 2.7592, "step": 15049 }, { "epoch": 0.4, "learning_rate": 0.0013504759536630134, "loss": 2.612, "step": 15050 }, { "epoch": 0.4, "learning_rate": 0.0013503944338874004, "loss": 2.6497, "step": 15051 }, { "epoch": 0.4, "learning_rate": 0.001350312911457262, "loss": 2.6098, "step": 15052 }, { "epoch": 0.4, "learning_rate": 0.0013502313863732157, "loss": 2.2947, "step": 15053 }, { "epoch": 0.4, "learning_rate": 0.001350149858635879, "loss": 2.3681, "step": 15054 }, { "epoch": 0.4, "learning_rate": 0.0013500683282458693, "loss": 2.7831, "step": 15055 }, { "epoch": 0.4, "learning_rate": 0.0013499867952038052, "loss": 2.5657, "step": 15056 }, { "epoch": 0.4, "learning_rate": 0.001349905259510303, "loss": 2.5334, "step": 15057 }, { "epoch": 0.4, "learning_rate": 0.0013498237211659813, "loss": 2.4781, "step": 15058 }, { "epoch": 0.4, "learning_rate": 0.001349742180171458, "loss": 2.9203, "step": 15059 }, { "epoch": 0.4, "learning_rate": 0.00134966063652735, "loss": 2.8446, "step": 15060 }, { "epoch": 0.4, "learning_rate": 0.0013495790902342756, "loss": 2.5433, "step": 15061 }, { "epoch": 0.4, "learning_rate": 0.001349497541292853, "loss": 2.5527, "step": 15062 }, { "epoch": 0.4, "learning_rate": 0.0013494159897036993, "loss": 2.1055, "step": 15063 }, { "epoch": 0.4, "learning_rate": 0.001349334435467432, "loss": 2.6535, "step": 15064 }, { "epoch": 0.4, "learning_rate": 0.00134925287858467, "loss": 2.8835, "step": 15065 }, { "epoch": 0.4, "learning_rate": 0.0013491713190560306, "loss": 2.4373, "step": 15066 }, { "epoch": 0.4, "learning_rate": 0.0013490897568821313, "loss": 2.8448, "step": 15067 }, { "epoch": 0.4, "learning_rate": 0.001349008192063591, "loss": 2.5975, "step": 15068 }, { "epoch": 0.4, "learning_rate": 0.0013489266246010268, "loss": 2.6927, "step": 15069 }, { "epoch": 0.4, "learning_rate": 0.0013488450544950565, "loss": 2.3639, "step": 15070 }, { "epoch": 0.41, "learning_rate": 0.001348763481746299, "loss": 2.6771, "step": 15071 }, { "epoch": 0.41, "learning_rate": 0.0013486819063553714, "loss": 2.6905, "step": 15072 }, { "epoch": 0.41, "learning_rate": 0.0013486003283228922, "loss": 2.8002, "step": 15073 }, { "epoch": 0.41, "learning_rate": 0.0013485187476494792, "loss": 2.7871, "step": 15074 }, { "epoch": 0.41, "learning_rate": 0.0013484371643357504, "loss": 2.756, "step": 15075 }, { "epoch": 0.41, "learning_rate": 0.0013483555783823239, "loss": 2.3836, "step": 15076 }, { "epoch": 0.41, "learning_rate": 0.0013482739897898177, "loss": 2.969, "step": 15077 }, { "epoch": 0.41, "learning_rate": 0.0013481923985588502, "loss": 2.4732, "step": 15078 }, { "epoch": 0.41, "learning_rate": 0.0013481108046900397, "loss": 2.0087, "step": 15079 }, { "epoch": 0.41, "learning_rate": 0.0013480292081840032, "loss": 2.9417, "step": 15080 }, { "epoch": 0.41, "learning_rate": 0.00134794760904136, "loss": 2.2256, "step": 15081 }, { "epoch": 0.41, "learning_rate": 0.0013478660072627283, "loss": 2.6345, "step": 15082 }, { "epoch": 0.41, "learning_rate": 0.0013477844028487254, "loss": 2.7607, "step": 15083 }, { "epoch": 0.41, "learning_rate": 0.00134770279579997, "loss": 1.958, "step": 15084 }, { "epoch": 0.41, "learning_rate": 0.0013476211861170808, "loss": 2.5617, "step": 15085 }, { "epoch": 0.41, "learning_rate": 0.0013475395738006756, "loss": 2.4721, "step": 15086 }, { "epoch": 0.41, "learning_rate": 0.0013474579588513725, "loss": 2.3665, "step": 15087 }, { "epoch": 0.41, "learning_rate": 0.00134737634126979, "loss": 2.3957, "step": 15088 }, { "epoch": 0.41, "learning_rate": 0.0013472947210565467, "loss": 2.5502, "step": 15089 }, { "epoch": 0.41, "learning_rate": 0.0013472130982122603, "loss": 2.2766, "step": 15090 }, { "epoch": 0.41, "learning_rate": 0.0013471314727375502, "loss": 2.4454, "step": 15091 }, { "epoch": 0.41, "learning_rate": 0.0013470498446330336, "loss": 2.637, "step": 15092 }, { "epoch": 0.41, "learning_rate": 0.0013469682138993293, "loss": 3.3094, "step": 15093 }, { "epoch": 0.41, "learning_rate": 0.001346886580537056, "loss": 2.3271, "step": 15094 }, { "epoch": 0.41, "learning_rate": 0.0013468049445468323, "loss": 2.4048, "step": 15095 }, { "epoch": 0.41, "learning_rate": 0.001346723305929276, "loss": 2.9039, "step": 15096 }, { "epoch": 0.41, "learning_rate": 0.001346641664685006, "loss": 2.598, "step": 15097 }, { "epoch": 0.41, "learning_rate": 0.0013465600208146407, "loss": 2.4413, "step": 15098 }, { "epoch": 0.41, "learning_rate": 0.001346478374318799, "loss": 3.0039, "step": 15099 }, { "epoch": 0.41, "learning_rate": 0.001346396725198098, "loss": 2.5007, "step": 15100 }, { "epoch": 0.41, "learning_rate": 0.0013463150734531583, "loss": 2.8549, "step": 15101 }, { "epoch": 0.41, "learning_rate": 0.0013462334190845976, "loss": 2.6155, "step": 15102 }, { "epoch": 0.41, "learning_rate": 0.001346151762093034, "loss": 2.3959, "step": 15103 }, { "epoch": 0.41, "learning_rate": 0.0013460701024790866, "loss": 2.2839, "step": 15104 }, { "epoch": 0.41, "learning_rate": 0.001345988440243374, "loss": 2.2567, "step": 15105 }, { "epoch": 0.41, "learning_rate": 0.0013459067753865148, "loss": 2.4991, "step": 15106 }, { "epoch": 0.41, "learning_rate": 0.0013458251079091282, "loss": 2.7448, "step": 15107 }, { "epoch": 0.41, "learning_rate": 0.0013457434378118319, "loss": 2.4189, "step": 15108 }, { "epoch": 0.41, "learning_rate": 0.0013456617650952451, "loss": 2.2354, "step": 15109 }, { "epoch": 0.41, "learning_rate": 0.0013455800897599869, "loss": 2.7518, "step": 15110 }, { "epoch": 0.41, "learning_rate": 0.0013454984118066752, "loss": 2.673, "step": 15111 }, { "epoch": 0.41, "learning_rate": 0.0013454167312359298, "loss": 2.25, "step": 15112 }, { "epoch": 0.41, "learning_rate": 0.001345335048048369, "loss": 2.4129, "step": 15113 }, { "epoch": 0.41, "learning_rate": 0.0013452533622446113, "loss": 2.7848, "step": 15114 }, { "epoch": 0.41, "learning_rate": 0.001345171673825276, "loss": 2.3639, "step": 15115 }, { "epoch": 0.41, "learning_rate": 0.0013450899827909817, "loss": 2.3041, "step": 15116 }, { "epoch": 0.41, "learning_rate": 0.0013450082891423474, "loss": 2.3425, "step": 15117 }, { "epoch": 0.41, "learning_rate": 0.0013449265928799923, "loss": 2.6257, "step": 15118 }, { "epoch": 0.41, "learning_rate": 0.0013448448940045347, "loss": 2.5441, "step": 15119 }, { "epoch": 0.41, "learning_rate": 0.0013447631925165937, "loss": 2.5289, "step": 15120 }, { "epoch": 0.41, "learning_rate": 0.001344681488416789, "loss": 2.4521, "step": 15121 }, { "epoch": 0.41, "learning_rate": 0.0013445997817057385, "loss": 2.5834, "step": 15122 }, { "epoch": 0.41, "learning_rate": 0.0013445180723840613, "loss": 2.2067, "step": 15123 }, { "epoch": 0.41, "learning_rate": 0.0013444363604523772, "loss": 2.865, "step": 15124 }, { "epoch": 0.41, "learning_rate": 0.001344354645911305, "loss": 2.447, "step": 15125 }, { "epoch": 0.41, "learning_rate": 0.0013442729287614634, "loss": 2.8931, "step": 15126 }, { "epoch": 0.41, "learning_rate": 0.0013441912090034717, "loss": 2.2147, "step": 15127 }, { "epoch": 0.41, "learning_rate": 0.001344109486637949, "loss": 2.4487, "step": 15128 }, { "epoch": 0.41, "learning_rate": 0.001344027761665514, "loss": 2.3918, "step": 15129 }, { "epoch": 0.41, "learning_rate": 0.0013439460340867863, "loss": 2.547, "step": 15130 }, { "epoch": 0.41, "learning_rate": 0.001343864303902385, "loss": 2.5302, "step": 15131 }, { "epoch": 0.41, "learning_rate": 0.0013437825711129295, "loss": 2.6271, "step": 15132 }, { "epoch": 0.41, "learning_rate": 0.0013437008357190384, "loss": 2.8312, "step": 15133 }, { "epoch": 0.41, "learning_rate": 0.0013436190977213311, "loss": 2.975, "step": 15134 }, { "epoch": 0.41, "learning_rate": 0.0013435373571204273, "loss": 2.4024, "step": 15135 }, { "epoch": 0.41, "learning_rate": 0.0013434556139169454, "loss": 2.2746, "step": 15136 }, { "epoch": 0.41, "learning_rate": 0.0013433738681115058, "loss": 2.4771, "step": 15137 }, { "epoch": 0.41, "learning_rate": 0.0013432921197047269, "loss": 2.8453, "step": 15138 }, { "epoch": 0.41, "learning_rate": 0.0013432103686972282, "loss": 3.0968, "step": 15139 }, { "epoch": 0.41, "learning_rate": 0.0013431286150896288, "loss": 2.065, "step": 15140 }, { "epoch": 0.41, "learning_rate": 0.001343046858882549, "loss": 2.5956, "step": 15141 }, { "epoch": 0.41, "learning_rate": 0.0013429651000766072, "loss": 2.4791, "step": 15142 }, { "epoch": 0.41, "learning_rate": 0.0013428833386724228, "loss": 2.5205, "step": 15143 }, { "epoch": 0.41, "learning_rate": 0.0013428015746706162, "loss": 2.7905, "step": 15144 }, { "epoch": 0.41, "learning_rate": 0.0013427198080718057, "loss": 2.2554, "step": 15145 }, { "epoch": 0.41, "learning_rate": 0.0013426380388766113, "loss": 2.2708, "step": 15146 }, { "epoch": 0.41, "learning_rate": 0.0013425562670856524, "loss": 3.0145, "step": 15147 }, { "epoch": 0.41, "learning_rate": 0.0013424744926995484, "loss": 2.4825, "step": 15148 }, { "epoch": 0.41, "learning_rate": 0.001342392715718919, "loss": 2.0903, "step": 15149 }, { "epoch": 0.41, "learning_rate": 0.0013423109361443836, "loss": 2.3567, "step": 15150 }, { "epoch": 0.41, "learning_rate": 0.0013422291539765617, "loss": 2.4453, "step": 15151 }, { "epoch": 0.41, "learning_rate": 0.001342147369216073, "loss": 2.6436, "step": 15152 }, { "epoch": 0.41, "learning_rate": 0.0013420655818635369, "loss": 2.7077, "step": 15153 }, { "epoch": 0.41, "learning_rate": 0.001341983791919573, "loss": 2.724, "step": 15154 }, { "epoch": 0.41, "learning_rate": 0.0013419019993848012, "loss": 2.8652, "step": 15155 }, { "epoch": 0.41, "learning_rate": 0.0013418202042598409, "loss": 2.9952, "step": 15156 }, { "epoch": 0.41, "learning_rate": 0.001341738406545312, "loss": 2.2051, "step": 15157 }, { "epoch": 0.41, "learning_rate": 0.0013416566062418335, "loss": 2.5541, "step": 15158 }, { "epoch": 0.41, "learning_rate": 0.0013415748033500262, "loss": 2.2446, "step": 15159 }, { "epoch": 0.41, "learning_rate": 0.001341492997870509, "loss": 2.5029, "step": 15160 }, { "epoch": 0.41, "learning_rate": 0.0013414111898039022, "loss": 2.6167, "step": 15161 }, { "epoch": 0.41, "learning_rate": 0.001341329379150825, "loss": 2.7319, "step": 15162 }, { "epoch": 0.41, "learning_rate": 0.0013412475659118975, "loss": 2.5053, "step": 15163 }, { "epoch": 0.41, "learning_rate": 0.0013411657500877394, "loss": 2.1504, "step": 15164 }, { "epoch": 0.41, "learning_rate": 0.0013410839316789706, "loss": 2.6273, "step": 15165 }, { "epoch": 0.41, "learning_rate": 0.0013410021106862108, "loss": 2.6681, "step": 15166 }, { "epoch": 0.41, "learning_rate": 0.0013409202871100803, "loss": 2.7125, "step": 15167 }, { "epoch": 0.41, "learning_rate": 0.0013408384609511984, "loss": 2.5852, "step": 15168 }, { "epoch": 0.41, "learning_rate": 0.0013407566322101855, "loss": 2.5755, "step": 15169 }, { "epoch": 0.41, "learning_rate": 0.0013406748008876611, "loss": 2.3357, "step": 15170 }, { "epoch": 0.41, "learning_rate": 0.001340592966984245, "loss": 2.6396, "step": 15171 }, { "epoch": 0.41, "learning_rate": 0.001340511130500558, "loss": 2.655, "step": 15172 }, { "epoch": 0.41, "learning_rate": 0.0013404292914372194, "loss": 2.6639, "step": 15173 }, { "epoch": 0.41, "learning_rate": 0.0013403474497948491, "loss": 2.8682, "step": 15174 }, { "epoch": 0.41, "learning_rate": 0.0013402656055740679, "loss": 2.4763, "step": 15175 }, { "epoch": 0.41, "learning_rate": 0.001340183758775495, "loss": 2.9848, "step": 15176 }, { "epoch": 0.41, "learning_rate": 0.0013401019093997506, "loss": 2.8395, "step": 15177 }, { "epoch": 0.41, "learning_rate": 0.0013400200574474551, "loss": 2.5052, "step": 15178 }, { "epoch": 0.41, "learning_rate": 0.0013399382029192282, "loss": 2.6276, "step": 15179 }, { "epoch": 0.41, "learning_rate": 0.0013398563458156905, "loss": 2.6407, "step": 15180 }, { "epoch": 0.41, "learning_rate": 0.001339774486137462, "loss": 3.0331, "step": 15181 }, { "epoch": 0.41, "learning_rate": 0.0013396926238851625, "loss": 2.7509, "step": 15182 }, { "epoch": 0.41, "learning_rate": 0.0013396107590594125, "loss": 2.3063, "step": 15183 }, { "epoch": 0.41, "learning_rate": 0.0013395288916608322, "loss": 2.5296, "step": 15184 }, { "epoch": 0.41, "learning_rate": 0.0013394470216900414, "loss": 2.658, "step": 15185 }, { "epoch": 0.41, "learning_rate": 0.001339365149147661, "loss": 2.2514, "step": 15186 }, { "epoch": 0.41, "learning_rate": 0.0013392832740343106, "loss": 3.2527, "step": 15187 }, { "epoch": 0.41, "learning_rate": 0.0013392013963506111, "loss": 2.0961, "step": 15188 }, { "epoch": 0.41, "learning_rate": 0.001339119516097182, "loss": 2.9581, "step": 15189 }, { "epoch": 0.41, "learning_rate": 0.0013390376332746445, "loss": 2.4605, "step": 15190 }, { "epoch": 0.41, "learning_rate": 0.0013389557478836185, "loss": 2.7108, "step": 15191 }, { "epoch": 0.41, "learning_rate": 0.0013388738599247243, "loss": 2.6154, "step": 15192 }, { "epoch": 0.41, "learning_rate": 0.001338791969398582, "loss": 2.9222, "step": 15193 }, { "epoch": 0.41, "learning_rate": 0.0013387100763058127, "loss": 2.54, "step": 15194 }, { "epoch": 0.41, "learning_rate": 0.0013386281806470363, "loss": 2.6429, "step": 15195 }, { "epoch": 0.41, "learning_rate": 0.0013385462824228734, "loss": 2.7233, "step": 15196 }, { "epoch": 0.41, "learning_rate": 0.0013384643816339442, "loss": 2.7898, "step": 15197 }, { "epoch": 0.41, "learning_rate": 0.0013383824782808697, "loss": 2.5472, "step": 15198 }, { "epoch": 0.41, "learning_rate": 0.0013383005723642696, "loss": 2.5809, "step": 15199 }, { "epoch": 0.41, "learning_rate": 0.0013382186638847653, "loss": 2.5585, "step": 15200 }, { "epoch": 0.41, "learning_rate": 0.0013381367528429765, "loss": 2.3355, "step": 15201 }, { "epoch": 0.41, "learning_rate": 0.0013380548392395242, "loss": 2.8896, "step": 15202 }, { "epoch": 0.41, "learning_rate": 0.001337972923075029, "loss": 2.471, "step": 15203 }, { "epoch": 0.41, "learning_rate": 0.0013378910043501113, "loss": 2.4058, "step": 15204 }, { "epoch": 0.41, "learning_rate": 0.0013378090830653917, "loss": 2.2841, "step": 15205 }, { "epoch": 0.41, "learning_rate": 0.001337727159221491, "loss": 2.6309, "step": 15206 }, { "epoch": 0.41, "learning_rate": 0.0013376452328190296, "loss": 2.5005, "step": 15207 }, { "epoch": 0.41, "learning_rate": 0.0013375633038586285, "loss": 2.7293, "step": 15208 }, { "epoch": 0.41, "learning_rate": 0.0013374813723409078, "loss": 2.5813, "step": 15209 }, { "epoch": 0.41, "learning_rate": 0.0013373994382664888, "loss": 2.1947, "step": 15210 }, { "epoch": 0.41, "learning_rate": 0.001337317501635992, "loss": 2.8663, "step": 15211 }, { "epoch": 0.41, "learning_rate": 0.0013372355624500381, "loss": 2.3062, "step": 15212 }, { "epoch": 0.41, "learning_rate": 0.0013371536207092477, "loss": 2.2823, "step": 15213 }, { "epoch": 0.41, "learning_rate": 0.001337071676414242, "loss": 2.6552, "step": 15214 }, { "epoch": 0.41, "learning_rate": 0.0013369897295656412, "loss": 2.3926, "step": 15215 }, { "epoch": 0.41, "learning_rate": 0.0013369077801640668, "loss": 2.9695, "step": 15216 }, { "epoch": 0.41, "learning_rate": 0.0013368258282101392, "loss": 2.4152, "step": 15217 }, { "epoch": 0.41, "learning_rate": 0.0013367438737044793, "loss": 2.5748, "step": 15218 }, { "epoch": 0.41, "learning_rate": 0.0013366619166477079, "loss": 2.5151, "step": 15219 }, { "epoch": 0.41, "learning_rate": 0.001336579957040446, "loss": 2.5423, "step": 15220 }, { "epoch": 0.41, "learning_rate": 0.001336497994883315, "loss": 2.9203, "step": 15221 }, { "epoch": 0.41, "learning_rate": 0.0013364160301769347, "loss": 2.5208, "step": 15222 }, { "epoch": 0.41, "learning_rate": 0.0013363340629219272, "loss": 2.7154, "step": 15223 }, { "epoch": 0.41, "learning_rate": 0.0013362520931189126, "loss": 2.9618, "step": 15224 }, { "epoch": 0.41, "learning_rate": 0.0013361701207685126, "loss": 2.8266, "step": 15225 }, { "epoch": 0.41, "learning_rate": 0.0013360881458713476, "loss": 2.6134, "step": 15226 }, { "epoch": 0.41, "learning_rate": 0.0013360061684280391, "loss": 2.3802, "step": 15227 }, { "epoch": 0.41, "learning_rate": 0.0013359241884392076, "loss": 2.5465, "step": 15228 }, { "epoch": 0.41, "learning_rate": 0.0013358422059054746, "loss": 2.4665, "step": 15229 }, { "epoch": 0.41, "learning_rate": 0.0013357602208274614, "loss": 2.6339, "step": 15230 }, { "epoch": 0.41, "learning_rate": 0.0013356782332057887, "loss": 2.3005, "step": 15231 }, { "epoch": 0.41, "learning_rate": 0.0013355962430410776, "loss": 2.4405, "step": 15232 }, { "epoch": 0.41, "learning_rate": 0.0013355142503339494, "loss": 2.3565, "step": 15233 }, { "epoch": 0.41, "learning_rate": 0.0013354322550850253, "loss": 2.3693, "step": 15234 }, { "epoch": 0.41, "learning_rate": 0.0013353502572949264, "loss": 2.8412, "step": 15235 }, { "epoch": 0.41, "learning_rate": 0.0013352682569642736, "loss": 2.7787, "step": 15236 }, { "epoch": 0.41, "learning_rate": 0.0013351862540936887, "loss": 2.9692, "step": 15237 }, { "epoch": 0.41, "learning_rate": 0.0013351042486837925, "loss": 2.1621, "step": 15238 }, { "epoch": 0.41, "learning_rate": 0.0013350222407352069, "loss": 2.715, "step": 15239 }, { "epoch": 0.41, "learning_rate": 0.001334940230248552, "loss": 2.4142, "step": 15240 }, { "epoch": 0.41, "learning_rate": 0.0013348582172244504, "loss": 2.9039, "step": 15241 }, { "epoch": 0.41, "learning_rate": 0.0013347762016635224, "loss": 2.1452, "step": 15242 }, { "epoch": 0.41, "learning_rate": 0.00133469418356639, "loss": 2.936, "step": 15243 }, { "epoch": 0.41, "learning_rate": 0.0013346121629336741, "loss": 2.3987, "step": 15244 }, { "epoch": 0.41, "learning_rate": 0.0013345301397659963, "loss": 2.3462, "step": 15245 }, { "epoch": 0.41, "learning_rate": 0.0013344481140639783, "loss": 2.1858, "step": 15246 }, { "epoch": 0.41, "learning_rate": 0.001334366085828241, "loss": 2.8112, "step": 15247 }, { "epoch": 0.41, "learning_rate": 0.0013342840550594059, "loss": 2.5714, "step": 15248 }, { "epoch": 0.41, "learning_rate": 0.0013342020217580943, "loss": 2.4224, "step": 15249 }, { "epoch": 0.41, "learning_rate": 0.0013341199859249287, "loss": 2.6895, "step": 15250 }, { "epoch": 0.41, "learning_rate": 0.0013340379475605291, "loss": 2.453, "step": 15251 }, { "epoch": 0.41, "learning_rate": 0.0013339559066655178, "loss": 2.6372, "step": 15252 }, { "epoch": 0.41, "learning_rate": 0.0013338738632405168, "loss": 2.7123, "step": 15253 }, { "epoch": 0.41, "learning_rate": 0.0013337918172861467, "loss": 2.7255, "step": 15254 }, { "epoch": 0.41, "learning_rate": 0.0013337097688030295, "loss": 2.562, "step": 15255 }, { "epoch": 0.41, "learning_rate": 0.0013336277177917867, "loss": 3.0097, "step": 15256 }, { "epoch": 0.41, "learning_rate": 0.0013335456642530402, "loss": 2.4365, "step": 15257 }, { "epoch": 0.41, "learning_rate": 0.0013334636081874112, "loss": 2.7183, "step": 15258 }, { "epoch": 0.41, "learning_rate": 0.0013333815495955212, "loss": 2.3128, "step": 15259 }, { "epoch": 0.41, "learning_rate": 0.0013332994884779927, "loss": 2.4223, "step": 15260 }, { "epoch": 0.41, "learning_rate": 0.0013332174248354468, "loss": 2.5961, "step": 15261 }, { "epoch": 0.41, "learning_rate": 0.001333135358668505, "loss": 2.4939, "step": 15262 }, { "epoch": 0.41, "learning_rate": 0.0013330532899777895, "loss": 2.2798, "step": 15263 }, { "epoch": 0.41, "learning_rate": 0.0013329712187639218, "loss": 2.4229, "step": 15264 }, { "epoch": 0.41, "learning_rate": 0.0013328891450275235, "loss": 2.1323, "step": 15265 }, { "epoch": 0.41, "learning_rate": 0.001332807068769217, "loss": 2.401, "step": 15266 }, { "epoch": 0.41, "learning_rate": 0.001332724989989623, "loss": 2.3159, "step": 15267 }, { "epoch": 0.41, "learning_rate": 0.0013326429086893644, "loss": 2.1415, "step": 15268 }, { "epoch": 0.41, "learning_rate": 0.0013325608248690624, "loss": 2.6562, "step": 15269 }, { "epoch": 0.41, "learning_rate": 0.0013324787385293393, "loss": 2.5384, "step": 15270 }, { "epoch": 0.41, "learning_rate": 0.0013323966496708165, "loss": 2.8384, "step": 15271 }, { "epoch": 0.41, "learning_rate": 0.001332314558294116, "loss": 2.4686, "step": 15272 }, { "epoch": 0.41, "learning_rate": 0.0013322324643998602, "loss": 2.7134, "step": 15273 }, { "epoch": 0.41, "learning_rate": 0.0013321503679886706, "loss": 2.5215, "step": 15274 }, { "epoch": 0.41, "learning_rate": 0.0013320682690611686, "loss": 2.5922, "step": 15275 }, { "epoch": 0.41, "learning_rate": 0.0013319861676179775, "loss": 2.3268, "step": 15276 }, { "epoch": 0.41, "learning_rate": 0.0013319040636597182, "loss": 2.3739, "step": 15277 }, { "epoch": 0.41, "learning_rate": 0.001331821957187013, "loss": 2.4874, "step": 15278 }, { "epoch": 0.41, "learning_rate": 0.0013317398482004838, "loss": 2.5786, "step": 15279 }, { "epoch": 0.41, "learning_rate": 0.0013316577367007531, "loss": 2.5377, "step": 15280 }, { "epoch": 0.41, "learning_rate": 0.0013315756226884427, "loss": 2.518, "step": 15281 }, { "epoch": 0.41, "learning_rate": 0.0013314935061641748, "loss": 2.5519, "step": 15282 }, { "epoch": 0.41, "learning_rate": 0.0013314113871285712, "loss": 2.6793, "step": 15283 }, { "epoch": 0.41, "learning_rate": 0.0013313292655822541, "loss": 2.6441, "step": 15284 }, { "epoch": 0.41, "learning_rate": 0.0013312471415258458, "loss": 2.3182, "step": 15285 }, { "epoch": 0.41, "learning_rate": 0.0013311650149599684, "loss": 2.5411, "step": 15286 }, { "epoch": 0.41, "learning_rate": 0.001331082885885244, "loss": 2.5402, "step": 15287 }, { "epoch": 0.41, "learning_rate": 0.0013310007543022948, "loss": 2.4282, "step": 15288 }, { "epoch": 0.41, "learning_rate": 0.0013309186202117432, "loss": 2.5145, "step": 15289 }, { "epoch": 0.41, "learning_rate": 0.0013308364836142113, "loss": 2.5351, "step": 15290 }, { "epoch": 0.41, "learning_rate": 0.0013307543445103213, "loss": 2.36, "step": 15291 }, { "epoch": 0.41, "learning_rate": 0.0013306722029006951, "loss": 2.491, "step": 15292 }, { "epoch": 0.41, "learning_rate": 0.0013305900587859561, "loss": 2.5307, "step": 15293 }, { "epoch": 0.41, "learning_rate": 0.0013305079121667257, "loss": 2.6524, "step": 15294 }, { "epoch": 0.41, "learning_rate": 0.001330425763043626, "loss": 2.4134, "step": 15295 }, { "epoch": 0.41, "learning_rate": 0.0013303436114172804, "loss": 2.3923, "step": 15296 }, { "epoch": 0.41, "learning_rate": 0.0013302614572883104, "loss": 2.3617, "step": 15297 }, { "epoch": 0.41, "learning_rate": 0.0013301793006573383, "loss": 2.8124, "step": 15298 }, { "epoch": 0.41, "learning_rate": 0.0013300971415249876, "loss": 2.3662, "step": 15299 }, { "epoch": 0.41, "learning_rate": 0.0013300149798918797, "loss": 2.6722, "step": 15300 }, { "epoch": 0.41, "learning_rate": 0.001329932815758637, "loss": 2.7552, "step": 15301 }, { "epoch": 0.41, "learning_rate": 0.0013298506491258824, "loss": 3.1034, "step": 15302 }, { "epoch": 0.41, "learning_rate": 0.0013297684799942384, "loss": 2.6233, "step": 15303 }, { "epoch": 0.41, "learning_rate": 0.0013296863083643276, "loss": 2.7747, "step": 15304 }, { "epoch": 0.41, "learning_rate": 0.0013296041342367717, "loss": 2.4703, "step": 15305 }, { "epoch": 0.41, "learning_rate": 0.001329521957612194, "loss": 2.5928, "step": 15306 }, { "epoch": 0.41, "learning_rate": 0.0013294397784912172, "loss": 2.6457, "step": 15307 }, { "epoch": 0.41, "learning_rate": 0.0013293575968744628, "loss": 2.457, "step": 15308 }, { "epoch": 0.41, "learning_rate": 0.0013292754127625548, "loss": 2.3739, "step": 15309 }, { "epoch": 0.41, "learning_rate": 0.0013291932261561149, "loss": 2.6158, "step": 15310 }, { "epoch": 0.41, "learning_rate": 0.001329111037055766, "loss": 2.6556, "step": 15311 }, { "epoch": 0.41, "learning_rate": 0.0013290288454621308, "loss": 2.4554, "step": 15312 }, { "epoch": 0.41, "learning_rate": 0.0013289466513758319, "loss": 2.7616, "step": 15313 }, { "epoch": 0.41, "learning_rate": 0.0013288644547974917, "loss": 2.5222, "step": 15314 }, { "epoch": 0.41, "learning_rate": 0.0013287822557277334, "loss": 2.2477, "step": 15315 }, { "epoch": 0.41, "learning_rate": 0.0013287000541671796, "loss": 2.5936, "step": 15316 }, { "epoch": 0.41, "learning_rate": 0.001328617850116453, "loss": 2.6127, "step": 15317 }, { "epoch": 0.41, "learning_rate": 0.0013285356435761757, "loss": 2.7772, "step": 15318 }, { "epoch": 0.41, "learning_rate": 0.0013284534345469718, "loss": 2.9564, "step": 15319 }, { "epoch": 0.41, "learning_rate": 0.0013283712230294632, "loss": 2.698, "step": 15320 }, { "epoch": 0.41, "learning_rate": 0.0013282890090242727, "loss": 2.77, "step": 15321 }, { "epoch": 0.41, "learning_rate": 0.0013282067925320237, "loss": 2.3328, "step": 15322 }, { "epoch": 0.41, "learning_rate": 0.0013281245735533385, "loss": 2.7069, "step": 15323 }, { "epoch": 0.41, "learning_rate": 0.0013280423520888403, "loss": 3.0071, "step": 15324 }, { "epoch": 0.41, "learning_rate": 0.001327960128139152, "loss": 2.8382, "step": 15325 }, { "epoch": 0.41, "learning_rate": 0.0013278779017048962, "loss": 2.1484, "step": 15326 }, { "epoch": 0.41, "learning_rate": 0.0013277956727866962, "loss": 2.4927, "step": 15327 }, { "epoch": 0.41, "learning_rate": 0.0013277134413851744, "loss": 2.7528, "step": 15328 }, { "epoch": 0.41, "learning_rate": 0.0013276312075009547, "loss": 2.4666, "step": 15329 }, { "epoch": 0.41, "learning_rate": 0.001327548971134659, "loss": 2.6945, "step": 15330 }, { "epoch": 0.41, "learning_rate": 0.0013274667322869112, "loss": 2.5699, "step": 15331 }, { "epoch": 0.41, "learning_rate": 0.001327384490958334, "loss": 2.6137, "step": 15332 }, { "epoch": 0.41, "learning_rate": 0.0013273022471495502, "loss": 2.501, "step": 15333 }, { "epoch": 0.41, "learning_rate": 0.0013272200008611831, "loss": 2.6692, "step": 15334 }, { "epoch": 0.41, "learning_rate": 0.001327137752093856, "loss": 2.7939, "step": 15335 }, { "epoch": 0.41, "learning_rate": 0.0013270555008481919, "loss": 2.2718, "step": 15336 }, { "epoch": 0.41, "learning_rate": 0.0013269732471248134, "loss": 2.5879, "step": 15337 }, { "epoch": 0.41, "learning_rate": 0.0013268909909243444, "loss": 2.6491, "step": 15338 }, { "epoch": 0.41, "learning_rate": 0.0013268087322474073, "loss": 2.8756, "step": 15339 }, { "epoch": 0.41, "learning_rate": 0.0013267264710946263, "loss": 2.677, "step": 15340 }, { "epoch": 0.41, "learning_rate": 0.0013266442074666232, "loss": 2.7062, "step": 15341 }, { "epoch": 0.41, "learning_rate": 0.0013265619413640225, "loss": 2.6009, "step": 15342 }, { "epoch": 0.41, "learning_rate": 0.0013264796727874468, "loss": 2.3516, "step": 15343 }, { "epoch": 0.41, "learning_rate": 0.0013263974017375193, "loss": 2.6138, "step": 15344 }, { "epoch": 0.41, "learning_rate": 0.0013263151282148636, "loss": 2.7894, "step": 15345 }, { "epoch": 0.41, "learning_rate": 0.0013262328522201028, "loss": 2.5269, "step": 15346 }, { "epoch": 0.41, "learning_rate": 0.00132615057375386, "loss": 2.475, "step": 15347 }, { "epoch": 0.41, "learning_rate": 0.001326068292816759, "loss": 2.355, "step": 15348 }, { "epoch": 0.41, "learning_rate": 0.001325986009409423, "loss": 2.5938, "step": 15349 }, { "epoch": 0.41, "learning_rate": 0.0013259037235324753, "loss": 3.1248, "step": 15350 }, { "epoch": 0.41, "learning_rate": 0.0013258214351865392, "loss": 2.63, "step": 15351 }, { "epoch": 0.41, "learning_rate": 0.0013257391443722382, "loss": 2.8186, "step": 15352 }, { "epoch": 0.41, "learning_rate": 0.0013256568510901954, "loss": 2.4538, "step": 15353 }, { "epoch": 0.41, "learning_rate": 0.0013255745553410346, "loss": 2.7755, "step": 15354 }, { "epoch": 0.41, "learning_rate": 0.0013254922571253793, "loss": 2.5693, "step": 15355 }, { "epoch": 0.41, "learning_rate": 0.001325409956443853, "loss": 2.472, "step": 15356 }, { "epoch": 0.41, "learning_rate": 0.0013253276532970788, "loss": 2.6949, "step": 15357 }, { "epoch": 0.41, "learning_rate": 0.0013252453476856804, "loss": 2.5869, "step": 15358 }, { "epoch": 0.41, "learning_rate": 0.0013251630396102817, "loss": 2.5989, "step": 15359 }, { "epoch": 0.41, "learning_rate": 0.0013250807290715056, "loss": 3.2207, "step": 15360 }, { "epoch": 0.41, "learning_rate": 0.0013249984160699762, "loss": 2.7145, "step": 15361 }, { "epoch": 0.41, "learning_rate": 0.0013249161006063169, "loss": 2.8025, "step": 15362 }, { "epoch": 0.41, "learning_rate": 0.0013248337826811513, "loss": 2.4326, "step": 15363 }, { "epoch": 0.41, "learning_rate": 0.0013247514622951031, "loss": 2.3466, "step": 15364 }, { "epoch": 0.41, "learning_rate": 0.0013246691394487957, "loss": 2.5549, "step": 15365 }, { "epoch": 0.41, "learning_rate": 0.0013245868141428532, "loss": 2.8261, "step": 15366 }, { "epoch": 0.41, "learning_rate": 0.0013245044863778987, "loss": 2.9174, "step": 15367 }, { "epoch": 0.41, "learning_rate": 0.0013244221561545565, "loss": 2.971, "step": 15368 }, { "epoch": 0.41, "learning_rate": 0.0013243398234734501, "loss": 2.8051, "step": 15369 }, { "epoch": 0.41, "learning_rate": 0.001324257488335203, "loss": 2.5826, "step": 15370 }, { "epoch": 0.41, "learning_rate": 0.0013241751507404391, "loss": 2.3416, "step": 15371 }, { "epoch": 0.41, "learning_rate": 0.0013240928106897823, "loss": 2.3385, "step": 15372 }, { "epoch": 0.41, "learning_rate": 0.0013240104681838563, "loss": 2.186, "step": 15373 }, { "epoch": 0.41, "learning_rate": 0.001323928123223285, "loss": 2.382, "step": 15374 }, { "epoch": 0.41, "learning_rate": 0.0013238457758086922, "loss": 2.4348, "step": 15375 }, { "epoch": 0.41, "learning_rate": 0.0013237634259407015, "loss": 2.3566, "step": 15376 }, { "epoch": 0.41, "learning_rate": 0.001323681073619937, "loss": 3.0278, "step": 15377 }, { "epoch": 0.41, "learning_rate": 0.0013235987188470225, "loss": 2.7496, "step": 15378 }, { "epoch": 0.41, "learning_rate": 0.0013235163616225822, "loss": 2.4186, "step": 15379 }, { "epoch": 0.41, "learning_rate": 0.0013234340019472395, "loss": 2.4479, "step": 15380 }, { "epoch": 0.41, "learning_rate": 0.0013233516398216188, "loss": 2.4344, "step": 15381 }, { "epoch": 0.41, "learning_rate": 0.001323269275246344, "loss": 3.1245, "step": 15382 }, { "epoch": 0.41, "learning_rate": 0.0013231869082220389, "loss": 2.5759, "step": 15383 }, { "epoch": 0.41, "learning_rate": 0.0013231045387493271, "loss": 2.3464, "step": 15384 }, { "epoch": 0.41, "learning_rate": 0.0013230221668288336, "loss": 2.4836, "step": 15385 }, { "epoch": 0.41, "learning_rate": 0.001322939792461182, "loss": 2.0889, "step": 15386 }, { "epoch": 0.41, "learning_rate": 0.001322857415646996, "loss": 2.6846, "step": 15387 }, { "epoch": 0.41, "learning_rate": 0.0013227750363868998, "loss": 2.5012, "step": 15388 }, { "epoch": 0.41, "learning_rate": 0.0013226926546815179, "loss": 2.7878, "step": 15389 }, { "epoch": 0.41, "learning_rate": 0.001322610270531474, "loss": 2.9652, "step": 15390 }, { "epoch": 0.41, "learning_rate": 0.0013225278839373927, "loss": 2.4081, "step": 15391 }, { "epoch": 0.41, "learning_rate": 0.0013224454948998973, "loss": 2.4775, "step": 15392 }, { "epoch": 0.41, "learning_rate": 0.001322363103419613, "loss": 2.1716, "step": 15393 }, { "epoch": 0.41, "learning_rate": 0.001322280709497163, "loss": 2.6028, "step": 15394 }, { "epoch": 0.41, "learning_rate": 0.0013221983131331723, "loss": 2.2179, "step": 15395 }, { "epoch": 0.41, "learning_rate": 0.0013221159143282644, "loss": 2.3583, "step": 15396 }, { "epoch": 0.41, "learning_rate": 0.0013220335130830643, "loss": 2.8258, "step": 15397 }, { "epoch": 0.41, "learning_rate": 0.0013219511093981958, "loss": 2.7051, "step": 15398 }, { "epoch": 0.41, "learning_rate": 0.0013218687032742831, "loss": 2.5306, "step": 15399 }, { "epoch": 0.41, "learning_rate": 0.0013217862947119507, "loss": 2.6466, "step": 15400 }, { "epoch": 0.41, "learning_rate": 0.001321703883711823, "loss": 2.5559, "step": 15401 }, { "epoch": 0.41, "learning_rate": 0.0013216214702745242, "loss": 2.6291, "step": 15402 }, { "epoch": 0.41, "learning_rate": 0.0013215390544006782, "loss": 2.383, "step": 15403 }, { "epoch": 0.41, "learning_rate": 0.0013214566360909101, "loss": 2.7328, "step": 15404 }, { "epoch": 0.41, "learning_rate": 0.0013213742153458444, "loss": 2.7473, "step": 15405 }, { "epoch": 0.41, "learning_rate": 0.0013212917921661047, "loss": 2.6532, "step": 15406 }, { "epoch": 0.41, "learning_rate": 0.0013212093665523155, "loss": 2.3203, "step": 15407 }, { "epoch": 0.41, "learning_rate": 0.0013211269385051021, "loss": 2.2625, "step": 15408 }, { "epoch": 0.41, "learning_rate": 0.0013210445080250883, "loss": 2.4492, "step": 15409 }, { "epoch": 0.41, "learning_rate": 0.0013209620751128987, "loss": 2.5876, "step": 15410 }, { "epoch": 0.41, "learning_rate": 0.0013208796397691576, "loss": 2.5746, "step": 15411 }, { "epoch": 0.41, "learning_rate": 0.00132079720199449, "loss": 2.6374, "step": 15412 }, { "epoch": 0.41, "learning_rate": 0.00132071476178952, "loss": 2.5886, "step": 15413 }, { "epoch": 0.41, "learning_rate": 0.0013206323191548724, "loss": 1.828, "step": 15414 }, { "epoch": 0.41, "learning_rate": 0.0013205498740911717, "loss": 2.4514, "step": 15415 }, { "epoch": 0.41, "learning_rate": 0.0013204674265990424, "loss": 2.7229, "step": 15416 }, { "epoch": 0.41, "learning_rate": 0.0013203849766791089, "loss": 2.3003, "step": 15417 }, { "epoch": 0.41, "learning_rate": 0.0013203025243319966, "loss": 2.7014, "step": 15418 }, { "epoch": 0.41, "learning_rate": 0.0013202200695583294, "loss": 2.2926, "step": 15419 }, { "epoch": 0.41, "learning_rate": 0.001320137612358732, "loss": 2.7723, "step": 15420 }, { "epoch": 0.41, "learning_rate": 0.0013200551527338296, "loss": 2.514, "step": 15421 }, { "epoch": 0.41, "learning_rate": 0.0013199726906842463, "loss": 2.6804, "step": 15422 }, { "epoch": 0.41, "learning_rate": 0.001319890226210607, "loss": 2.3596, "step": 15423 }, { "epoch": 0.41, "learning_rate": 0.0013198077593135368, "loss": 2.5867, "step": 15424 }, { "epoch": 0.41, "learning_rate": 0.0013197252899936605, "loss": 2.6676, "step": 15425 }, { "epoch": 0.41, "learning_rate": 0.001319642818251602, "loss": 2.5505, "step": 15426 }, { "epoch": 0.41, "learning_rate": 0.001319560344087987, "loss": 2.7911, "step": 15427 }, { "epoch": 0.41, "learning_rate": 0.00131947786750344, "loss": 2.4195, "step": 15428 }, { "epoch": 0.41, "learning_rate": 0.0013193953884985856, "loss": 2.8729, "step": 15429 }, { "epoch": 0.41, "learning_rate": 0.001319312907074049, "loss": 2.4874, "step": 15430 }, { "epoch": 0.41, "learning_rate": 0.0013192304232304546, "loss": 2.2196, "step": 15431 }, { "epoch": 0.41, "learning_rate": 0.0013191479369684279, "loss": 2.5129, "step": 15432 }, { "epoch": 0.41, "learning_rate": 0.0013190654482885932, "loss": 2.6861, "step": 15433 }, { "epoch": 0.41, "learning_rate": 0.0013189829571915762, "loss": 2.397, "step": 15434 }, { "epoch": 0.41, "learning_rate": 0.001318900463678001, "loss": 2.8104, "step": 15435 }, { "epoch": 0.41, "learning_rate": 0.0013188179677484928, "loss": 2.7609, "step": 15436 }, { "epoch": 0.41, "learning_rate": 0.0013187354694036769, "loss": 2.5102, "step": 15437 }, { "epoch": 0.41, "learning_rate": 0.001318652968644178, "loss": 2.5637, "step": 15438 }, { "epoch": 0.41, "learning_rate": 0.001318570465470621, "loss": 2.5596, "step": 15439 }, { "epoch": 0.41, "learning_rate": 0.0013184879598836313, "loss": 2.9092, "step": 15440 }, { "epoch": 0.41, "learning_rate": 0.0013184054518838337, "loss": 2.953, "step": 15441 }, { "epoch": 0.41, "learning_rate": 0.0013183229414718536, "loss": 2.5571, "step": 15442 }, { "epoch": 0.42, "learning_rate": 0.0013182404286483152, "loss": 2.4126, "step": 15443 }, { "epoch": 0.42, "learning_rate": 0.0013181579134138447, "loss": 2.5202, "step": 15444 }, { "epoch": 0.42, "learning_rate": 0.0013180753957690665, "loss": 2.7561, "step": 15445 }, { "epoch": 0.42, "learning_rate": 0.0013179928757146061, "loss": 2.5391, "step": 15446 }, { "epoch": 0.42, "learning_rate": 0.0013179103532510884, "loss": 2.3072, "step": 15447 }, { "epoch": 0.42, "learning_rate": 0.0013178278283791389, "loss": 2.5119, "step": 15448 }, { "epoch": 0.42, "learning_rate": 0.0013177453010993826, "loss": 2.4196, "step": 15449 }, { "epoch": 0.42, "learning_rate": 0.0013176627714124444, "loss": 2.6828, "step": 15450 }, { "epoch": 0.42, "learning_rate": 0.00131758023931895, "loss": 2.7423, "step": 15451 }, { "epoch": 0.42, "learning_rate": 0.0013174977048195245, "loss": 2.3552, "step": 15452 }, { "epoch": 0.42, "learning_rate": 0.0013174151679147931, "loss": 2.8844, "step": 15453 }, { "epoch": 0.42, "learning_rate": 0.0013173326286053811, "loss": 2.6849, "step": 15454 }, { "epoch": 0.42, "learning_rate": 0.001317250086891914, "loss": 2.383, "step": 15455 }, { "epoch": 0.42, "learning_rate": 0.001317167542775017, "loss": 2.0529, "step": 15456 }, { "epoch": 0.42, "learning_rate": 0.0013170849962553153, "loss": 2.4451, "step": 15457 }, { "epoch": 0.42, "learning_rate": 0.0013170024473334342, "loss": 2.1326, "step": 15458 }, { "epoch": 0.42, "learning_rate": 0.0013169198960099994, "loss": 2.8523, "step": 15459 }, { "epoch": 0.42, "learning_rate": 0.0013168373422856362, "loss": 2.5843, "step": 15460 }, { "epoch": 0.42, "learning_rate": 0.00131675478616097, "loss": 2.5543, "step": 15461 }, { "epoch": 0.42, "learning_rate": 0.0013166722276366258, "loss": 2.7419, "step": 15462 }, { "epoch": 0.42, "learning_rate": 0.0013165896667132295, "loss": 2.4241, "step": 15463 }, { "epoch": 0.42, "learning_rate": 0.0013165071033914067, "loss": 2.9242, "step": 15464 }, { "epoch": 0.42, "learning_rate": 0.0013164245376717828, "loss": 2.9873, "step": 15465 }, { "epoch": 0.42, "learning_rate": 0.001316341969554983, "loss": 2.5284, "step": 15466 }, { "epoch": 0.42, "learning_rate": 0.0013162593990416328, "loss": 2.6187, "step": 15467 }, { "epoch": 0.42, "learning_rate": 0.0013161768261323581, "loss": 2.9949, "step": 15468 }, { "epoch": 0.42, "learning_rate": 0.0013160942508277842, "loss": 2.6175, "step": 15469 }, { "epoch": 0.42, "learning_rate": 0.0013160116731285368, "loss": 2.4814, "step": 15470 }, { "epoch": 0.42, "learning_rate": 0.0013159290930352416, "loss": 2.7648, "step": 15471 }, { "epoch": 0.42, "learning_rate": 0.0013158465105485243, "loss": 2.5625, "step": 15472 }, { "epoch": 0.42, "learning_rate": 0.0013157639256690097, "loss": 2.8646, "step": 15473 }, { "epoch": 0.42, "learning_rate": 0.0013156813383973242, "loss": 2.3996, "step": 15474 }, { "epoch": 0.42, "learning_rate": 0.0013155987487340937, "loss": 2.3547, "step": 15475 }, { "epoch": 0.42, "learning_rate": 0.0013155161566799432, "loss": 3.0264, "step": 15476 }, { "epoch": 0.42, "learning_rate": 0.001315433562235499, "loss": 2.8606, "step": 15477 }, { "epoch": 0.42, "learning_rate": 0.001315350965401386, "loss": 2.9148, "step": 15478 }, { "epoch": 0.42, "learning_rate": 0.001315268366178231, "loss": 2.6654, "step": 15479 }, { "epoch": 0.42, "learning_rate": 0.0013151857645666589, "loss": 2.9175, "step": 15480 }, { "epoch": 0.42, "learning_rate": 0.0013151031605672958, "loss": 2.6519, "step": 15481 }, { "epoch": 0.42, "learning_rate": 0.0013150205541807675, "loss": 2.329, "step": 15482 }, { "epoch": 0.42, "learning_rate": 0.0013149379454077, "loss": 2.7084, "step": 15483 }, { "epoch": 0.42, "learning_rate": 0.001314855334248719, "loss": 2.5591, "step": 15484 }, { "epoch": 0.42, "learning_rate": 0.00131477272070445, "loss": 2.4795, "step": 15485 }, { "epoch": 0.42, "learning_rate": 0.001314690104775519, "loss": 2.5491, "step": 15486 }, { "epoch": 0.42, "learning_rate": 0.0013146074864625525, "loss": 2.6653, "step": 15487 }, { "epoch": 0.42, "learning_rate": 0.0013145248657661756, "loss": 2.2237, "step": 15488 }, { "epoch": 0.42, "learning_rate": 0.0013144422426870147, "loss": 2.637, "step": 15489 }, { "epoch": 0.42, "learning_rate": 0.0013143596172256954, "loss": 2.5664, "step": 15490 }, { "epoch": 0.42, "learning_rate": 0.0013142769893828442, "loss": 2.5352, "step": 15491 }, { "epoch": 0.42, "learning_rate": 0.0013141943591590865, "loss": 2.4668, "step": 15492 }, { "epoch": 0.42, "learning_rate": 0.001314111726555048, "loss": 2.6565, "step": 15493 }, { "epoch": 0.42, "learning_rate": 0.001314029091571356, "loss": 2.3555, "step": 15494 }, { "epoch": 0.42, "learning_rate": 0.0013139464542086356, "loss": 3.061, "step": 15495 }, { "epoch": 0.42, "learning_rate": 0.0013138638144675127, "loss": 2.369, "step": 15496 }, { "epoch": 0.42, "learning_rate": 0.0013137811723486137, "loss": 2.785, "step": 15497 }, { "epoch": 0.42, "learning_rate": 0.0013136985278525651, "loss": 2.6159, "step": 15498 }, { "epoch": 0.42, "learning_rate": 0.001313615880979992, "loss": 2.4527, "step": 15499 }, { "epoch": 0.42, "learning_rate": 0.001313533231731521, "loss": 2.1032, "step": 15500 }, { "epoch": 0.42, "learning_rate": 0.0013134505801077787, "loss": 2.4825, "step": 15501 }, { "epoch": 0.42, "learning_rate": 0.001313367926109391, "loss": 2.6015, "step": 15502 }, { "epoch": 0.42, "learning_rate": 0.0013132852697369832, "loss": 2.6107, "step": 15503 }, { "epoch": 0.42, "learning_rate": 0.0013132026109911829, "loss": 2.5118, "step": 15504 }, { "epoch": 0.42, "learning_rate": 0.0013131199498726152, "loss": 2.7373, "step": 15505 }, { "epoch": 0.42, "learning_rate": 0.0013130372863819067, "loss": 2.7069, "step": 15506 }, { "epoch": 0.42, "learning_rate": 0.001312954620519684, "loss": 2.1683, "step": 15507 }, { "epoch": 0.42, "learning_rate": 0.0013128719522865731, "loss": 2.6751, "step": 15508 }, { "epoch": 0.42, "learning_rate": 0.0013127892816831995, "loss": 2.4293, "step": 15509 }, { "epoch": 0.42, "learning_rate": 0.0013127066087101908, "loss": 2.441, "step": 15510 }, { "epoch": 0.42, "learning_rate": 0.0013126239333681729, "loss": 2.561, "step": 15511 }, { "epoch": 0.42, "learning_rate": 0.0013125412556577716, "loss": 2.3784, "step": 15512 }, { "epoch": 0.42, "learning_rate": 0.0013124585755796138, "loss": 2.4734, "step": 15513 }, { "epoch": 0.42, "learning_rate": 0.0013123758931343258, "loss": 2.4881, "step": 15514 }, { "epoch": 0.42, "learning_rate": 0.0013122932083225339, "loss": 2.3869, "step": 15515 }, { "epoch": 0.42, "learning_rate": 0.001312210521144864, "loss": 2.9003, "step": 15516 }, { "epoch": 0.42, "learning_rate": 0.001312127831601943, "loss": 2.6331, "step": 15517 }, { "epoch": 0.42, "learning_rate": 0.0013120451396943982, "loss": 2.5622, "step": 15518 }, { "epoch": 0.42, "learning_rate": 0.0013119624454228545, "loss": 2.3902, "step": 15519 }, { "epoch": 0.42, "learning_rate": 0.0013118797487879392, "loss": 2.2242, "step": 15520 }, { "epoch": 0.42, "learning_rate": 0.0013117970497902789, "loss": 2.729, "step": 15521 }, { "epoch": 0.42, "learning_rate": 0.0013117143484304996, "loss": 2.2659, "step": 15522 }, { "epoch": 0.42, "learning_rate": 0.0013116316447092284, "loss": 2.8607, "step": 15523 }, { "epoch": 0.42, "learning_rate": 0.0013115489386270913, "loss": 2.7528, "step": 15524 }, { "epoch": 0.42, "learning_rate": 0.0013114662301847155, "loss": 2.7951, "step": 15525 }, { "epoch": 0.42, "learning_rate": 0.0013113835193827269, "loss": 1.9584, "step": 15526 }, { "epoch": 0.42, "learning_rate": 0.0013113008062217526, "loss": 2.72, "step": 15527 }, { "epoch": 0.42, "learning_rate": 0.0013112180907024192, "loss": 2.0807, "step": 15528 }, { "epoch": 0.42, "learning_rate": 0.0013111353728253528, "loss": 2.617, "step": 15529 }, { "epoch": 0.42, "learning_rate": 0.0013110526525911808, "loss": 2.3944, "step": 15530 }, { "epoch": 0.42, "learning_rate": 0.0013109699300005294, "loss": 2.8609, "step": 15531 }, { "epoch": 0.42, "learning_rate": 0.0013108872050540254, "loss": 2.6604, "step": 15532 }, { "epoch": 0.42, "learning_rate": 0.0013108044777522952, "loss": 2.7405, "step": 15533 }, { "epoch": 0.42, "learning_rate": 0.0013107217480959662, "loss": 2.9035, "step": 15534 }, { "epoch": 0.42, "learning_rate": 0.0013106390160856644, "loss": 2.7201, "step": 15535 }, { "epoch": 0.42, "learning_rate": 0.0013105562817220173, "loss": 2.4709, "step": 15536 }, { "epoch": 0.42, "learning_rate": 0.0013104735450056512, "loss": 2.6165, "step": 15537 }, { "epoch": 0.42, "learning_rate": 0.0013103908059371933, "loss": 2.4709, "step": 15538 }, { "epoch": 0.42, "learning_rate": 0.00131030806451727, "loss": 2.6003, "step": 15539 }, { "epoch": 0.42, "learning_rate": 0.0013102253207465083, "loss": 2.2457, "step": 15540 }, { "epoch": 0.42, "learning_rate": 0.001310142574625535, "loss": 3.0841, "step": 15541 }, { "epoch": 0.42, "learning_rate": 0.0013100598261549768, "loss": 2.3857, "step": 15542 }, { "epoch": 0.42, "learning_rate": 0.001309977075335461, "loss": 2.6994, "step": 15543 }, { "epoch": 0.42, "learning_rate": 0.0013098943221676142, "loss": 2.5387, "step": 15544 }, { "epoch": 0.42, "learning_rate": 0.0013098115666520637, "loss": 2.7245, "step": 15545 }, { "epoch": 0.42, "learning_rate": 0.0013097288087894358, "loss": 2.588, "step": 15546 }, { "epoch": 0.42, "learning_rate": 0.001309646048580358, "loss": 2.5945, "step": 15547 }, { "epoch": 0.42, "learning_rate": 0.001309563286025457, "loss": 2.5586, "step": 15548 }, { "epoch": 0.42, "learning_rate": 0.00130948052112536, "loss": 2.1236, "step": 15549 }, { "epoch": 0.42, "learning_rate": 0.0013093977538806939, "loss": 2.7295, "step": 15550 }, { "epoch": 0.42, "learning_rate": 0.0013093149842920858, "loss": 2.4631, "step": 15551 }, { "epoch": 0.42, "learning_rate": 0.001309232212360162, "loss": 2.08, "step": 15552 }, { "epoch": 0.42, "learning_rate": 0.001309149438085551, "loss": 2.5197, "step": 15553 }, { "epoch": 0.42, "learning_rate": 0.0013090666614688792, "loss": 2.6045, "step": 15554 }, { "epoch": 0.42, "learning_rate": 0.0013089838825107733, "loss": 2.1893, "step": 15555 }, { "epoch": 0.42, "learning_rate": 0.0013089011012118608, "loss": 2.5123, "step": 15556 }, { "epoch": 0.42, "learning_rate": 0.0013088183175727689, "loss": 2.451, "step": 15557 }, { "epoch": 0.42, "learning_rate": 0.0013087355315941245, "loss": 2.7042, "step": 15558 }, { "epoch": 0.42, "learning_rate": 0.0013086527432765547, "loss": 2.2634, "step": 15559 }, { "epoch": 0.42, "learning_rate": 0.001308569952620687, "loss": 2.4382, "step": 15560 }, { "epoch": 0.42, "learning_rate": 0.0013084871596271488, "loss": 2.1492, "step": 15561 }, { "epoch": 0.42, "learning_rate": 0.001308404364296567, "loss": 2.6793, "step": 15562 }, { "epoch": 0.42, "learning_rate": 0.0013083215666295684, "loss": 2.2261, "step": 15563 }, { "epoch": 0.42, "learning_rate": 0.0013082387666267813, "loss": 3.1125, "step": 15564 }, { "epoch": 0.42, "learning_rate": 0.001308155964288832, "loss": 2.396, "step": 15565 }, { "epoch": 0.42, "learning_rate": 0.0013080731596163487, "loss": 2.3216, "step": 15566 }, { "epoch": 0.42, "learning_rate": 0.001307990352609958, "loss": 1.9102, "step": 15567 }, { "epoch": 0.42, "learning_rate": 0.0013079075432702873, "loss": 2.5202, "step": 15568 }, { "epoch": 0.42, "learning_rate": 0.001307824731597964, "loss": 2.4839, "step": 15569 }, { "epoch": 0.42, "learning_rate": 0.0013077419175936157, "loss": 2.5337, "step": 15570 }, { "epoch": 0.42, "learning_rate": 0.0013076591012578698, "loss": 2.3061, "step": 15571 }, { "epoch": 0.42, "learning_rate": 0.0013075762825913535, "loss": 1.9205, "step": 15572 }, { "epoch": 0.42, "learning_rate": 0.0013074934615946944, "loss": 2.5615, "step": 15573 }, { "epoch": 0.42, "learning_rate": 0.0013074106382685196, "loss": 2.936, "step": 15574 }, { "epoch": 0.42, "learning_rate": 0.0013073278126134564, "loss": 2.5395, "step": 15575 }, { "epoch": 0.42, "learning_rate": 0.0013072449846301332, "loss": 2.761, "step": 15576 }, { "epoch": 0.42, "learning_rate": 0.001307162154319177, "loss": 2.6878, "step": 15577 }, { "epoch": 0.42, "learning_rate": 0.001307079321681215, "loss": 2.9957, "step": 15578 }, { "epoch": 0.42, "learning_rate": 0.0013069964867168746, "loss": 2.4408, "step": 15579 }, { "epoch": 0.42, "learning_rate": 0.001306913649426784, "loss": 2.9062, "step": 15580 }, { "epoch": 0.42, "learning_rate": 0.0013068308098115708, "loss": 2.8523, "step": 15581 }, { "epoch": 0.42, "learning_rate": 0.001306747967871862, "loss": 2.8402, "step": 15582 }, { "epoch": 0.42, "learning_rate": 0.001306665123608285, "loss": 2.32, "step": 15583 }, { "epoch": 0.42, "learning_rate": 0.0013065822770214686, "loss": 2.1848, "step": 15584 }, { "epoch": 0.42, "learning_rate": 0.0013064994281120393, "loss": 2.4875, "step": 15585 }, { "epoch": 0.42, "learning_rate": 0.001306416576880625, "loss": 2.302, "step": 15586 }, { "epoch": 0.42, "learning_rate": 0.0013063337233278536, "loss": 2.9153, "step": 15587 }, { "epoch": 0.42, "learning_rate": 0.0013062508674543528, "loss": 2.9258, "step": 15588 }, { "epoch": 0.42, "learning_rate": 0.0013061680092607503, "loss": 2.4958, "step": 15589 }, { "epoch": 0.42, "learning_rate": 0.0013060851487476735, "loss": 2.608, "step": 15590 }, { "epoch": 0.42, "learning_rate": 0.0013060022859157504, "loss": 2.9659, "step": 15591 }, { "epoch": 0.42, "learning_rate": 0.0013059194207656083, "loss": 2.3657, "step": 15592 }, { "epoch": 0.42, "learning_rate": 0.0013058365532978757, "loss": 2.787, "step": 15593 }, { "epoch": 0.42, "learning_rate": 0.00130575368351318, "loss": 2.4687, "step": 15594 }, { "epoch": 0.42, "learning_rate": 0.0013056708114121492, "loss": 1.9955, "step": 15595 }, { "epoch": 0.42, "learning_rate": 0.001305587936995411, "loss": 2.2199, "step": 15596 }, { "epoch": 0.42, "learning_rate": 0.0013055050602635932, "loss": 2.9064, "step": 15597 }, { "epoch": 0.42, "learning_rate": 0.0013054221812173236, "loss": 2.3983, "step": 15598 }, { "epoch": 0.42, "learning_rate": 0.00130533929985723, "loss": 2.6026, "step": 15599 }, { "epoch": 0.42, "learning_rate": 0.0013052564161839407, "loss": 3.0061, "step": 15600 }, { "epoch": 0.42, "learning_rate": 0.001305173530198083, "loss": 2.7564, "step": 15601 }, { "epoch": 0.42, "learning_rate": 0.0013050906419002854, "loss": 2.4875, "step": 15602 }, { "epoch": 0.42, "learning_rate": 0.001305007751291176, "loss": 3.1828, "step": 15603 }, { "epoch": 0.42, "learning_rate": 0.0013049248583713823, "loss": 2.436, "step": 15604 }, { "epoch": 0.42, "learning_rate": 0.001304841963141532, "loss": 2.8402, "step": 15605 }, { "epoch": 0.42, "learning_rate": 0.0013047590656022536, "loss": 2.7287, "step": 15606 }, { "epoch": 0.42, "learning_rate": 0.0013046761657541752, "loss": 2.674, "step": 15607 }, { "epoch": 0.42, "learning_rate": 0.0013045932635979245, "loss": 2.4242, "step": 15608 }, { "epoch": 0.42, "learning_rate": 0.0013045103591341296, "loss": 2.3912, "step": 15609 }, { "epoch": 0.42, "learning_rate": 0.0013044274523634188, "loss": 2.2098, "step": 15610 }, { "epoch": 0.42, "learning_rate": 0.0013043445432864202, "loss": 2.2455, "step": 15611 }, { "epoch": 0.42, "learning_rate": 0.0013042616319037614, "loss": 2.5784, "step": 15612 }, { "epoch": 0.42, "learning_rate": 0.0013041787182160713, "loss": 2.6893, "step": 15613 }, { "epoch": 0.42, "learning_rate": 0.0013040958022239773, "loss": 2.9406, "step": 15614 }, { "epoch": 0.42, "learning_rate": 0.0013040128839281078, "loss": 2.7381, "step": 15615 }, { "epoch": 0.42, "learning_rate": 0.0013039299633290913, "loss": 2.545, "step": 15616 }, { "epoch": 0.42, "learning_rate": 0.0013038470404275557, "loss": 2.3106, "step": 15617 }, { "epoch": 0.42, "learning_rate": 0.0013037641152241289, "loss": 2.3273, "step": 15618 }, { "epoch": 0.42, "learning_rate": 0.00130368118771944, "loss": 2.6972, "step": 15619 }, { "epoch": 0.42, "learning_rate": 0.0013035982579141163, "loss": 2.6339, "step": 15620 }, { "epoch": 0.42, "learning_rate": 0.0013035153258087865, "loss": 2.5346, "step": 15621 }, { "epoch": 0.42, "learning_rate": 0.001303432391404079, "loss": 2.6048, "step": 15622 }, { "epoch": 0.42, "learning_rate": 0.001303349454700622, "loss": 2.6745, "step": 15623 }, { "epoch": 0.42, "learning_rate": 0.001303266515699044, "loss": 2.69, "step": 15624 }, { "epoch": 0.42, "learning_rate": 0.0013031835743999728, "loss": 2.1417, "step": 15625 }, { "epoch": 0.42, "learning_rate": 0.0013031006308040368, "loss": 2.4438, "step": 15626 }, { "epoch": 0.42, "learning_rate": 0.001303017684911865, "loss": 2.2157, "step": 15627 }, { "epoch": 0.42, "learning_rate": 0.0013029347367240851, "loss": 3.019, "step": 15628 }, { "epoch": 0.42, "learning_rate": 0.001302851786241326, "loss": 2.4348, "step": 15629 }, { "epoch": 0.42, "learning_rate": 0.0013027688334642158, "loss": 2.6522, "step": 15630 }, { "epoch": 0.42, "learning_rate": 0.001302685878393383, "loss": 2.3059, "step": 15631 }, { "epoch": 0.42, "learning_rate": 0.0013026029210294564, "loss": 2.7138, "step": 15632 }, { "epoch": 0.42, "learning_rate": 0.0013025199613730639, "loss": 2.6683, "step": 15633 }, { "epoch": 0.42, "learning_rate": 0.0013024369994248345, "loss": 2.3931, "step": 15634 }, { "epoch": 0.42, "learning_rate": 0.001302354035185396, "loss": 2.0512, "step": 15635 }, { "epoch": 0.42, "learning_rate": 0.0013022710686553779, "loss": 2.3717, "step": 15636 }, { "epoch": 0.42, "learning_rate": 0.0013021880998354079, "loss": 2.6835, "step": 15637 }, { "epoch": 0.42, "learning_rate": 0.0013021051287261149, "loss": 2.4415, "step": 15638 }, { "epoch": 0.42, "learning_rate": 0.0013020221553281274, "loss": 2.6515, "step": 15639 }, { "epoch": 0.42, "learning_rate": 0.0013019391796420744, "loss": 3.0035, "step": 15640 }, { "epoch": 0.42, "learning_rate": 0.001301856201668584, "loss": 2.5081, "step": 15641 }, { "epoch": 0.42, "learning_rate": 0.0013017732214082847, "loss": 2.4199, "step": 15642 }, { "epoch": 0.42, "learning_rate": 0.0013016902388618056, "loss": 2.7616, "step": 15643 }, { "epoch": 0.42, "learning_rate": 0.0013016072540297755, "loss": 2.7086, "step": 15644 }, { "epoch": 0.42, "learning_rate": 0.0013015242669128222, "loss": 2.2139, "step": 15645 }, { "epoch": 0.42, "learning_rate": 0.0013014412775115753, "loss": 2.8163, "step": 15646 }, { "epoch": 0.42, "learning_rate": 0.0013013582858266634, "loss": 2.6799, "step": 15647 }, { "epoch": 0.42, "learning_rate": 0.0013012752918587147, "loss": 2.7108, "step": 15648 }, { "epoch": 0.42, "learning_rate": 0.0013011922956083582, "loss": 2.5089, "step": 15649 }, { "epoch": 0.42, "learning_rate": 0.0013011092970762227, "loss": 2.6021, "step": 15650 }, { "epoch": 0.42, "learning_rate": 0.0013010262962629372, "loss": 2.3008, "step": 15651 }, { "epoch": 0.42, "learning_rate": 0.0013009432931691304, "loss": 2.8457, "step": 15652 }, { "epoch": 0.42, "learning_rate": 0.0013008602877954308, "loss": 2.6574, "step": 15653 }, { "epoch": 0.42, "learning_rate": 0.0013007772801424675, "loss": 2.7343, "step": 15654 }, { "epoch": 0.42, "learning_rate": 0.0013006942702108693, "loss": 2.3839, "step": 15655 }, { "epoch": 0.42, "learning_rate": 0.001300611258001265, "loss": 2.829, "step": 15656 }, { "epoch": 0.42, "learning_rate": 0.0013005282435142836, "loss": 2.8907, "step": 15657 }, { "epoch": 0.42, "learning_rate": 0.0013004452267505538, "loss": 2.7161, "step": 15658 }, { "epoch": 0.42, "learning_rate": 0.001300362207710705, "loss": 2.5826, "step": 15659 }, { "epoch": 0.42, "learning_rate": 0.0013002791863953656, "loss": 2.8053, "step": 15660 }, { "epoch": 0.42, "learning_rate": 0.0013001961628051645, "loss": 2.6432, "step": 15661 }, { "epoch": 0.42, "learning_rate": 0.0013001131369407312, "loss": 2.2947, "step": 15662 }, { "epoch": 0.42, "learning_rate": 0.001300030108802695, "loss": 3.103, "step": 15663 }, { "epoch": 0.42, "learning_rate": 0.0012999470783916836, "loss": 2.4722, "step": 15664 }, { "epoch": 0.42, "learning_rate": 0.0012998640457083268, "loss": 2.1447, "step": 15665 }, { "epoch": 0.42, "learning_rate": 0.001299781010753254, "loss": 2.389, "step": 15666 }, { "epoch": 0.42, "learning_rate": 0.0012996979735270934, "loss": 2.7044, "step": 15667 }, { "epoch": 0.42, "learning_rate": 0.0012996149340304749, "loss": 2.2921, "step": 15668 }, { "epoch": 0.42, "learning_rate": 0.001299531892264027, "loss": 2.37, "step": 15669 }, { "epoch": 0.42, "learning_rate": 0.0012994488482283794, "loss": 2.2295, "step": 15670 }, { "epoch": 0.42, "learning_rate": 0.0012993658019241603, "loss": 2.6398, "step": 15671 }, { "epoch": 0.42, "learning_rate": 0.0012992827533519998, "loss": 2.5109, "step": 15672 }, { "epoch": 0.42, "learning_rate": 0.0012991997025125267, "loss": 2.6648, "step": 15673 }, { "epoch": 0.42, "learning_rate": 0.0012991166494063697, "loss": 2.7647, "step": 15674 }, { "epoch": 0.42, "learning_rate": 0.0012990335940341589, "loss": 2.6605, "step": 15675 }, { "epoch": 0.42, "learning_rate": 0.0012989505363965228, "loss": 2.3102, "step": 15676 }, { "epoch": 0.42, "learning_rate": 0.0012988674764940914, "loss": 2.7123, "step": 15677 }, { "epoch": 0.42, "learning_rate": 0.0012987844143274928, "loss": 2.5415, "step": 15678 }, { "epoch": 0.42, "learning_rate": 0.0012987013498973572, "loss": 2.526, "step": 15679 }, { "epoch": 0.42, "learning_rate": 0.0012986182832043134, "loss": 1.8139, "step": 15680 }, { "epoch": 0.42, "learning_rate": 0.0012985352142489907, "loss": 2.8421, "step": 15681 }, { "epoch": 0.42, "learning_rate": 0.001298452143032019, "loss": 2.4732, "step": 15682 }, { "epoch": 0.42, "learning_rate": 0.0012983690695540274, "loss": 2.4952, "step": 15683 }, { "epoch": 0.42, "learning_rate": 0.0012982859938156443, "loss": 2.54, "step": 15684 }, { "epoch": 0.42, "learning_rate": 0.0012982029158175004, "loss": 2.7054, "step": 15685 }, { "epoch": 0.42, "learning_rate": 0.0012981198355602247, "loss": 2.4662, "step": 15686 }, { "epoch": 0.42, "learning_rate": 0.0012980367530444458, "loss": 2.5383, "step": 15687 }, { "epoch": 0.42, "learning_rate": 0.0012979536682707943, "loss": 2.3243, "step": 15688 }, { "epoch": 0.42, "learning_rate": 0.0012978705812398987, "loss": 2.8696, "step": 15689 }, { "epoch": 0.42, "learning_rate": 0.001297787491952389, "loss": 2.4191, "step": 15690 }, { "epoch": 0.42, "learning_rate": 0.0012977044004088944, "loss": 2.6111, "step": 15691 }, { "epoch": 0.42, "learning_rate": 0.0012976213066100445, "loss": 2.3955, "step": 15692 }, { "epoch": 0.42, "learning_rate": 0.0012975382105564692, "loss": 2.7402, "step": 15693 }, { "epoch": 0.42, "learning_rate": 0.0012974551122487972, "loss": 2.7795, "step": 15694 }, { "epoch": 0.42, "learning_rate": 0.0012973720116876586, "loss": 2.2352, "step": 15695 }, { "epoch": 0.42, "learning_rate": 0.0012972889088736827, "loss": 2.3063, "step": 15696 }, { "epoch": 0.42, "learning_rate": 0.0012972058038074991, "loss": 2.4672, "step": 15697 }, { "epoch": 0.42, "learning_rate": 0.0012971226964897378, "loss": 2.5117, "step": 15698 }, { "epoch": 0.42, "learning_rate": 0.0012970395869210279, "loss": 2.4122, "step": 15699 }, { "epoch": 0.42, "learning_rate": 0.001296956475101999, "loss": 2.3733, "step": 15700 }, { "epoch": 0.42, "learning_rate": 0.001296873361033281, "loss": 2.6016, "step": 15701 }, { "epoch": 0.42, "learning_rate": 0.0012967902447155036, "loss": 2.445, "step": 15702 }, { "epoch": 0.42, "learning_rate": 0.0012967071261492963, "loss": 2.4442, "step": 15703 }, { "epoch": 0.42, "learning_rate": 0.0012966240053352888, "loss": 2.4483, "step": 15704 }, { "epoch": 0.42, "learning_rate": 0.001296540882274111, "loss": 2.5847, "step": 15705 }, { "epoch": 0.42, "learning_rate": 0.0012964577569663928, "loss": 2.3919, "step": 15706 }, { "epoch": 0.42, "learning_rate": 0.0012963746294127629, "loss": 2.3271, "step": 15707 }, { "epoch": 0.42, "learning_rate": 0.0012962914996138522, "loss": 2.7647, "step": 15708 }, { "epoch": 0.42, "learning_rate": 0.0012962083675702903, "loss": 2.4603, "step": 15709 }, { "epoch": 0.42, "learning_rate": 0.0012961252332827065, "loss": 2.8734, "step": 15710 }, { "epoch": 0.42, "learning_rate": 0.0012960420967517306, "loss": 2.2676, "step": 15711 }, { "epoch": 0.42, "learning_rate": 0.0012959589579779932, "loss": 2.8425, "step": 15712 }, { "epoch": 0.42, "learning_rate": 0.0012958758169621233, "loss": 2.5021, "step": 15713 }, { "epoch": 0.42, "learning_rate": 0.0012957926737047513, "loss": 2.6639, "step": 15714 }, { "epoch": 0.42, "learning_rate": 0.0012957095282065069, "loss": 3.2799, "step": 15715 }, { "epoch": 0.42, "learning_rate": 0.00129562638046802, "loss": 2.711, "step": 15716 }, { "epoch": 0.42, "learning_rate": 0.0012955432304899205, "loss": 2.608, "step": 15717 }, { "epoch": 0.42, "learning_rate": 0.0012954600782728383, "loss": 2.4843, "step": 15718 }, { "epoch": 0.42, "learning_rate": 0.0012953769238174032, "loss": 2.288, "step": 15719 }, { "epoch": 0.42, "learning_rate": 0.0012952937671242455, "loss": 2.0611, "step": 15720 }, { "epoch": 0.42, "learning_rate": 0.0012952106081939947, "loss": 2.6709, "step": 15721 }, { "epoch": 0.42, "learning_rate": 0.0012951274470272816, "loss": 2.406, "step": 15722 }, { "epoch": 0.42, "learning_rate": 0.0012950442836247354, "loss": 2.2146, "step": 15723 }, { "epoch": 0.42, "learning_rate": 0.0012949611179869864, "loss": 2.612, "step": 15724 }, { "epoch": 0.42, "learning_rate": 0.001294877950114665, "loss": 2.5206, "step": 15725 }, { "epoch": 0.42, "learning_rate": 0.001294794780008401, "loss": 2.0885, "step": 15726 }, { "epoch": 0.42, "learning_rate": 0.001294711607668824, "loss": 2.5347, "step": 15727 }, { "epoch": 0.42, "learning_rate": 0.001294628433096565, "loss": 2.6065, "step": 15728 }, { "epoch": 0.42, "learning_rate": 0.0012945452562922535, "loss": 2.8097, "step": 15729 }, { "epoch": 0.42, "learning_rate": 0.0012944620772565197, "loss": 2.8097, "step": 15730 }, { "epoch": 0.42, "learning_rate": 0.001294378895989994, "loss": 2.3921, "step": 15731 }, { "epoch": 0.42, "learning_rate": 0.0012942957124933063, "loss": 2.6827, "step": 15732 }, { "epoch": 0.42, "learning_rate": 0.001294212526767087, "loss": 2.7431, "step": 15733 }, { "epoch": 0.42, "learning_rate": 0.001294129338811966, "loss": 2.553, "step": 15734 }, { "epoch": 0.42, "learning_rate": 0.001294046148628574, "loss": 2.406, "step": 15735 }, { "epoch": 0.42, "learning_rate": 0.0012939629562175408, "loss": 2.607, "step": 15736 }, { "epoch": 0.42, "learning_rate": 0.001293879761579497, "loss": 2.9733, "step": 15737 }, { "epoch": 0.42, "learning_rate": 0.0012937965647150725, "loss": 2.7878, "step": 15738 }, { "epoch": 0.42, "learning_rate": 0.0012937133656248975, "loss": 2.5759, "step": 15739 }, { "epoch": 0.42, "learning_rate": 0.0012936301643096026, "loss": 2.617, "step": 15740 }, { "epoch": 0.42, "learning_rate": 0.0012935469607698185, "loss": 2.7525, "step": 15741 }, { "epoch": 0.42, "learning_rate": 0.0012934637550061747, "loss": 2.5512, "step": 15742 }, { "epoch": 0.42, "learning_rate": 0.0012933805470193023, "loss": 2.2165, "step": 15743 }, { "epoch": 0.42, "learning_rate": 0.001293297336809831, "loss": 2.13, "step": 15744 }, { "epoch": 0.42, "learning_rate": 0.0012932141243783917, "loss": 2.7042, "step": 15745 }, { "epoch": 0.42, "learning_rate": 0.0012931309097256145, "loss": 2.6404, "step": 15746 }, { "epoch": 0.42, "learning_rate": 0.00129304769285213, "loss": 2.5517, "step": 15747 }, { "epoch": 0.42, "learning_rate": 0.0012929644737585686, "loss": 2.4164, "step": 15748 }, { "epoch": 0.42, "learning_rate": 0.0012928812524455608, "loss": 2.2946, "step": 15749 }, { "epoch": 0.42, "learning_rate": 0.0012927980289137366, "loss": 2.5985, "step": 15750 }, { "epoch": 0.42, "learning_rate": 0.0012927148031637273, "loss": 2.2941, "step": 15751 }, { "epoch": 0.42, "learning_rate": 0.001292631575196163, "loss": 2.8916, "step": 15752 }, { "epoch": 0.42, "learning_rate": 0.0012925483450116739, "loss": 2.4715, "step": 15753 }, { "epoch": 0.42, "learning_rate": 0.0012924651126108911, "loss": 2.3585, "step": 15754 }, { "epoch": 0.42, "learning_rate": 0.001292381877994445, "loss": 2.5088, "step": 15755 }, { "epoch": 0.42, "learning_rate": 0.0012922986411629657, "loss": 2.7305, "step": 15756 }, { "epoch": 0.42, "learning_rate": 0.0012922154021170842, "loss": 2.7602, "step": 15757 }, { "epoch": 0.42, "learning_rate": 0.0012921321608574312, "loss": 2.7263, "step": 15758 }, { "epoch": 0.42, "learning_rate": 0.0012920489173846373, "loss": 2.914, "step": 15759 }, { "epoch": 0.42, "learning_rate": 0.0012919656716993328, "loss": 2.5865, "step": 15760 }, { "epoch": 0.42, "learning_rate": 0.0012918824238021488, "loss": 2.5383, "step": 15761 }, { "epoch": 0.42, "learning_rate": 0.0012917991736937154, "loss": 2.4096, "step": 15762 }, { "epoch": 0.42, "learning_rate": 0.0012917159213746636, "loss": 2.4356, "step": 15763 }, { "epoch": 0.42, "learning_rate": 0.0012916326668456245, "loss": 2.3187, "step": 15764 }, { "epoch": 0.42, "learning_rate": 0.0012915494101072285, "loss": 2.7032, "step": 15765 }, { "epoch": 0.42, "learning_rate": 0.001291466151160106, "loss": 2.4383, "step": 15766 }, { "epoch": 0.42, "learning_rate": 0.0012913828900048881, "loss": 2.653, "step": 15767 }, { "epoch": 0.42, "learning_rate": 0.0012912996266422057, "loss": 2.6205, "step": 15768 }, { "epoch": 0.42, "learning_rate": 0.0012912163610726893, "loss": 2.6636, "step": 15769 }, { "epoch": 0.42, "learning_rate": 0.0012911330932969694, "loss": 2.7174, "step": 15770 }, { "epoch": 0.42, "learning_rate": 0.0012910498233156778, "loss": 2.6859, "step": 15771 }, { "epoch": 0.42, "learning_rate": 0.0012909665511294445, "loss": 2.0855, "step": 15772 }, { "epoch": 0.42, "learning_rate": 0.0012908832767389007, "loss": 2.5687, "step": 15773 }, { "epoch": 0.42, "learning_rate": 0.0012908000001446772, "loss": 2.7286, "step": 15774 }, { "epoch": 0.42, "learning_rate": 0.0012907167213474051, "loss": 2.8639, "step": 15775 }, { "epoch": 0.42, "learning_rate": 0.0012906334403477147, "loss": 2.6985, "step": 15776 }, { "epoch": 0.42, "learning_rate": 0.0012905501571462378, "loss": 2.5961, "step": 15777 }, { "epoch": 0.42, "learning_rate": 0.0012904668717436043, "loss": 2.4651, "step": 15778 }, { "epoch": 0.42, "learning_rate": 0.001290383584140446, "loss": 2.792, "step": 15779 }, { "epoch": 0.42, "learning_rate": 0.0012903002943373935, "loss": 2.2333, "step": 15780 }, { "epoch": 0.42, "learning_rate": 0.001290217002335078, "loss": 2.5659, "step": 15781 }, { "epoch": 0.42, "learning_rate": 0.0012901337081341305, "loss": 2.7264, "step": 15782 }, { "epoch": 0.42, "learning_rate": 0.0012900504117351814, "loss": 2.1367, "step": 15783 }, { "epoch": 0.42, "learning_rate": 0.0012899671131388628, "loss": 2.7969, "step": 15784 }, { "epoch": 0.42, "learning_rate": 0.0012898838123458047, "loss": 2.663, "step": 15785 }, { "epoch": 0.42, "learning_rate": 0.0012898005093566391, "loss": 2.6352, "step": 15786 }, { "epoch": 0.42, "learning_rate": 0.0012897172041719965, "loss": 2.1072, "step": 15787 }, { "epoch": 0.42, "learning_rate": 0.0012896338967925082, "loss": 3.0244, "step": 15788 }, { "epoch": 0.42, "learning_rate": 0.0012895505872188048, "loss": 2.3287, "step": 15789 }, { "epoch": 0.42, "learning_rate": 0.0012894672754515185, "loss": 2.8216, "step": 15790 }, { "epoch": 0.42, "learning_rate": 0.0012893839614912797, "loss": 2.4343, "step": 15791 }, { "epoch": 0.42, "learning_rate": 0.00128930064533872, "loss": 2.5588, "step": 15792 }, { "epoch": 0.42, "learning_rate": 0.0012892173269944695, "loss": 2.6075, "step": 15793 }, { "epoch": 0.42, "learning_rate": 0.001289134006459161, "loss": 2.481, "step": 15794 }, { "epoch": 0.42, "learning_rate": 0.001289050683733425, "loss": 2.3942, "step": 15795 }, { "epoch": 0.42, "learning_rate": 0.0012889673588178923, "loss": 2.6926, "step": 15796 }, { "epoch": 0.42, "learning_rate": 0.0012888840317131947, "loss": 2.7337, "step": 15797 }, { "epoch": 0.42, "learning_rate": 0.0012888007024199632, "loss": 2.6997, "step": 15798 }, { "epoch": 0.42, "learning_rate": 0.0012887173709388296, "loss": 2.5542, "step": 15799 }, { "epoch": 0.42, "learning_rate": 0.0012886340372704247, "loss": 2.6289, "step": 15800 }, { "epoch": 0.42, "learning_rate": 0.0012885507014153794, "loss": 2.6169, "step": 15801 }, { "epoch": 0.42, "learning_rate": 0.001288467363374326, "loss": 2.5856, "step": 15802 }, { "epoch": 0.42, "learning_rate": 0.0012883840231478953, "loss": 2.377, "step": 15803 }, { "epoch": 0.42, "learning_rate": 0.0012883006807367192, "loss": 2.4095, "step": 15804 }, { "epoch": 0.42, "learning_rate": 0.0012882173361414282, "loss": 2.8986, "step": 15805 }, { "epoch": 0.42, "learning_rate": 0.0012881339893626542, "loss": 2.4763, "step": 15806 }, { "epoch": 0.42, "learning_rate": 0.001288050640401029, "loss": 2.3592, "step": 15807 }, { "epoch": 0.42, "learning_rate": 0.0012879672892571836, "loss": 2.6081, "step": 15808 }, { "epoch": 0.42, "learning_rate": 0.001287883935931749, "loss": 2.3631, "step": 15809 }, { "epoch": 0.42, "learning_rate": 0.0012878005804253577, "loss": 2.3288, "step": 15810 }, { "epoch": 0.42, "learning_rate": 0.0012877172227386405, "loss": 2.3219, "step": 15811 }, { "epoch": 0.42, "learning_rate": 0.001287633862872229, "loss": 3.0691, "step": 15812 }, { "epoch": 0.42, "learning_rate": 0.0012875505008267548, "loss": 2.4648, "step": 15813 }, { "epoch": 0.42, "learning_rate": 0.0012874671366028495, "loss": 2.6394, "step": 15814 }, { "epoch": 0.43, "learning_rate": 0.0012873837702011444, "loss": 2.9234, "step": 15815 }, { "epoch": 0.43, "learning_rate": 0.0012873004016222711, "loss": 2.984, "step": 15816 }, { "epoch": 0.43, "learning_rate": 0.0012872170308668616, "loss": 2.3208, "step": 15817 }, { "epoch": 0.43, "learning_rate": 0.0012871336579355472, "loss": 2.3524, "step": 15818 }, { "epoch": 0.43, "learning_rate": 0.0012870502828289593, "loss": 2.6378, "step": 15819 }, { "epoch": 0.43, "learning_rate": 0.00128696690554773, "loss": 2.5959, "step": 15820 }, { "epoch": 0.43, "learning_rate": 0.001286883526092491, "loss": 2.5359, "step": 15821 }, { "epoch": 0.43, "learning_rate": 0.0012868001444638732, "loss": 2.2052, "step": 15822 }, { "epoch": 0.43, "learning_rate": 0.0012867167606625091, "loss": 2.417, "step": 15823 }, { "epoch": 0.43, "learning_rate": 0.0012866333746890297, "loss": 2.7283, "step": 15824 }, { "epoch": 0.43, "learning_rate": 0.0012865499865440677, "loss": 2.7092, "step": 15825 }, { "epoch": 0.43, "learning_rate": 0.0012864665962282538, "loss": 2.5669, "step": 15826 }, { "epoch": 0.43, "learning_rate": 0.0012863832037422202, "loss": 2.6871, "step": 15827 }, { "epoch": 0.43, "learning_rate": 0.0012862998090865988, "loss": 2.5131, "step": 15828 }, { "epoch": 0.43, "learning_rate": 0.001286216412262021, "loss": 2.171, "step": 15829 }, { "epoch": 0.43, "learning_rate": 0.0012861330132691192, "loss": 2.5762, "step": 15830 }, { "epoch": 0.43, "learning_rate": 0.0012860496121085245, "loss": 2.6549, "step": 15831 }, { "epoch": 0.43, "learning_rate": 0.0012859662087808693, "loss": 2.7139, "step": 15832 }, { "epoch": 0.43, "learning_rate": 0.001285882803286785, "loss": 2.6023, "step": 15833 }, { "epoch": 0.43, "learning_rate": 0.001285799395626904, "loss": 2.72, "step": 15834 }, { "epoch": 0.43, "learning_rate": 0.0012857159858018579, "loss": 2.7495, "step": 15835 }, { "epoch": 0.43, "learning_rate": 0.001285632573812278, "loss": 2.7602, "step": 15836 }, { "epoch": 0.43, "learning_rate": 0.0012855491596587974, "loss": 2.4046, "step": 15837 }, { "epoch": 0.43, "learning_rate": 0.0012854657433420472, "loss": 2.6636, "step": 15838 }, { "epoch": 0.43, "learning_rate": 0.0012853823248626594, "loss": 2.5679, "step": 15839 }, { "epoch": 0.43, "learning_rate": 0.0012852989042212665, "loss": 2.281, "step": 15840 }, { "epoch": 0.43, "learning_rate": 0.0012852154814184998, "loss": 2.75, "step": 15841 }, { "epoch": 0.43, "learning_rate": 0.0012851320564549915, "loss": 2.8454, "step": 15842 }, { "epoch": 0.43, "learning_rate": 0.0012850486293313741, "loss": 2.592, "step": 15843 }, { "epoch": 0.43, "learning_rate": 0.001284965200048279, "loss": 2.6438, "step": 15844 }, { "epoch": 0.43, "learning_rate": 0.0012848817686063386, "loss": 2.6499, "step": 15845 }, { "epoch": 0.43, "learning_rate": 0.0012847983350061847, "loss": 2.8347, "step": 15846 }, { "epoch": 0.43, "learning_rate": 0.00128471489924845, "loss": 2.6214, "step": 15847 }, { "epoch": 0.43, "learning_rate": 0.0012846314613337655, "loss": 2.7298, "step": 15848 }, { "epoch": 0.43, "learning_rate": 0.001284548021262764, "loss": 2.3669, "step": 15849 }, { "epoch": 0.43, "learning_rate": 0.0012844645790360781, "loss": 2.9545, "step": 15850 }, { "epoch": 0.43, "learning_rate": 0.0012843811346543391, "loss": 2.5571, "step": 15851 }, { "epoch": 0.43, "learning_rate": 0.0012842976881181794, "loss": 2.3061, "step": 15852 }, { "epoch": 0.43, "learning_rate": 0.001284214239428231, "loss": 3.1289, "step": 15853 }, { "epoch": 0.43, "learning_rate": 0.0012841307885851267, "loss": 2.5582, "step": 15854 }, { "epoch": 0.43, "learning_rate": 0.0012840473355894982, "loss": 2.555, "step": 15855 }, { "epoch": 0.43, "learning_rate": 0.001283963880441978, "loss": 2.338, "step": 15856 }, { "epoch": 0.43, "learning_rate": 0.0012838804231431983, "loss": 2.5133, "step": 15857 }, { "epoch": 0.43, "learning_rate": 0.0012837969636937912, "loss": 3.0983, "step": 15858 }, { "epoch": 0.43, "learning_rate": 0.0012837135020943883, "loss": 2.4874, "step": 15859 }, { "epoch": 0.43, "learning_rate": 0.0012836300383456236, "loss": 2.9158, "step": 15860 }, { "epoch": 0.43, "learning_rate": 0.0012835465724481284, "loss": 2.6708, "step": 15861 }, { "epoch": 0.43, "learning_rate": 0.0012834631044025345, "loss": 2.6566, "step": 15862 }, { "epoch": 0.43, "learning_rate": 0.001283379634209475, "loss": 2.4915, "step": 15863 }, { "epoch": 0.43, "learning_rate": 0.0012832961618695822, "loss": 2.5287, "step": 15864 }, { "epoch": 0.43, "learning_rate": 0.0012832126873834884, "loss": 2.8001, "step": 15865 }, { "epoch": 0.43, "learning_rate": 0.0012831292107518255, "loss": 2.5671, "step": 15866 }, { "epoch": 0.43, "learning_rate": 0.0012830457319752268, "loss": 2.8083, "step": 15867 }, { "epoch": 0.43, "learning_rate": 0.001282962251054324, "loss": 2.2516, "step": 15868 }, { "epoch": 0.43, "learning_rate": 0.0012828787679897498, "loss": 2.2659, "step": 15869 }, { "epoch": 0.43, "learning_rate": 0.0012827952827821365, "loss": 2.2983, "step": 15870 }, { "epoch": 0.43, "learning_rate": 0.0012827117954321168, "loss": 2.5425, "step": 15871 }, { "epoch": 0.43, "learning_rate": 0.001282628305940323, "loss": 3.0403, "step": 15872 }, { "epoch": 0.43, "learning_rate": 0.0012825448143073878, "loss": 2.3396, "step": 15873 }, { "epoch": 0.43, "learning_rate": 0.001282461320533944, "loss": 2.6136, "step": 15874 }, { "epoch": 0.43, "learning_rate": 0.001282377824620623, "loss": 2.8506, "step": 15875 }, { "epoch": 0.43, "learning_rate": 0.0012822943265680584, "loss": 2.5805, "step": 15876 }, { "epoch": 0.43, "learning_rate": 0.0012822108263768825, "loss": 2.4759, "step": 15877 }, { "epoch": 0.43, "learning_rate": 0.001282127324047728, "loss": 2.406, "step": 15878 }, { "epoch": 0.43, "learning_rate": 0.0012820438195812267, "loss": 2.5264, "step": 15879 }, { "epoch": 0.43, "learning_rate": 0.0012819603129780126, "loss": 2.9895, "step": 15880 }, { "epoch": 0.43, "learning_rate": 0.0012818768042387172, "loss": 2.2108, "step": 15881 }, { "epoch": 0.43, "learning_rate": 0.0012817932933639736, "loss": 2.3054, "step": 15882 }, { "epoch": 0.43, "learning_rate": 0.0012817097803544141, "loss": 2.648, "step": 15883 }, { "epoch": 0.43, "learning_rate": 0.0012816262652106723, "loss": 2.261, "step": 15884 }, { "epoch": 0.43, "learning_rate": 0.0012815427479333796, "loss": 2.042, "step": 15885 }, { "epoch": 0.43, "learning_rate": 0.0012814592285231698, "loss": 2.6662, "step": 15886 }, { "epoch": 0.43, "learning_rate": 0.0012813757069806751, "loss": 2.729, "step": 15887 }, { "epoch": 0.43, "learning_rate": 0.0012812921833065282, "loss": 2.7179, "step": 15888 }, { "epoch": 0.43, "learning_rate": 0.0012812086575013622, "loss": 2.4033, "step": 15889 }, { "epoch": 0.43, "learning_rate": 0.0012811251295658096, "loss": 2.9371, "step": 15890 }, { "epoch": 0.43, "learning_rate": 0.0012810415995005034, "loss": 2.732, "step": 15891 }, { "epoch": 0.43, "learning_rate": 0.001280958067306076, "loss": 2.6933, "step": 15892 }, { "epoch": 0.43, "learning_rate": 0.001280874532983161, "loss": 2.1481, "step": 15893 }, { "epoch": 0.43, "learning_rate": 0.0012807909965323902, "loss": 1.8072, "step": 15894 }, { "epoch": 0.43, "learning_rate": 0.0012807074579543976, "loss": 1.9104, "step": 15895 }, { "epoch": 0.43, "learning_rate": 0.001280623917249815, "loss": 2.8493, "step": 15896 }, { "epoch": 0.43, "learning_rate": 0.0012805403744192761, "loss": 2.3097, "step": 15897 }, { "epoch": 0.43, "learning_rate": 0.0012804568294634132, "loss": 2.3721, "step": 15898 }, { "epoch": 0.43, "learning_rate": 0.0012803732823828593, "loss": 2.6095, "step": 15899 }, { "epoch": 0.43, "learning_rate": 0.0012802897331782481, "loss": 2.2678, "step": 15900 }, { "epoch": 0.43, "learning_rate": 0.001280206181850212, "loss": 2.5387, "step": 15901 }, { "epoch": 0.43, "learning_rate": 0.0012801226283993832, "loss": 2.3128, "step": 15902 }, { "epoch": 0.43, "learning_rate": 0.0012800390728263961, "loss": 2.648, "step": 15903 }, { "epoch": 0.43, "learning_rate": 0.001279955515131883, "loss": 2.286, "step": 15904 }, { "epoch": 0.43, "learning_rate": 0.0012798719553164769, "loss": 2.1457, "step": 15905 }, { "epoch": 0.43, "learning_rate": 0.0012797883933808108, "loss": 2.2756, "step": 15906 }, { "epoch": 0.43, "learning_rate": 0.001279704829325518, "loss": 2.4912, "step": 15907 }, { "epoch": 0.43, "learning_rate": 0.0012796212631512312, "loss": 2.0987, "step": 15908 }, { "epoch": 0.43, "learning_rate": 0.001279537694858584, "loss": 2.7144, "step": 15909 }, { "epoch": 0.43, "learning_rate": 0.0012794541244482089, "loss": 2.5594, "step": 15910 }, { "epoch": 0.43, "learning_rate": 0.0012793705519207397, "loss": 2.5406, "step": 15911 }, { "epoch": 0.43, "learning_rate": 0.0012792869772768087, "loss": 2.65, "step": 15912 }, { "epoch": 0.43, "learning_rate": 0.0012792034005170499, "loss": 2.5562, "step": 15913 }, { "epoch": 0.43, "learning_rate": 0.001279119821642096, "loss": 2.3073, "step": 15914 }, { "epoch": 0.43, "learning_rate": 0.0012790362406525798, "loss": 2.4017, "step": 15915 }, { "epoch": 0.43, "learning_rate": 0.0012789526575491352, "loss": 2.2779, "step": 15916 }, { "epoch": 0.43, "learning_rate": 0.0012788690723323955, "loss": 2.263, "step": 15917 }, { "epoch": 0.43, "learning_rate": 0.001278785485002993, "loss": 2.4903, "step": 15918 }, { "epoch": 0.43, "learning_rate": 0.0012787018955615617, "loss": 2.4782, "step": 15919 }, { "epoch": 0.43, "learning_rate": 0.0012786183040087347, "loss": 2.8327, "step": 15920 }, { "epoch": 0.43, "learning_rate": 0.0012785347103451453, "loss": 2.3304, "step": 15921 }, { "epoch": 0.43, "learning_rate": 0.0012784511145714265, "loss": 2.2728, "step": 15922 }, { "epoch": 0.43, "learning_rate": 0.001278367516688212, "loss": 2.6394, "step": 15923 }, { "epoch": 0.43, "learning_rate": 0.001278283916696135, "loss": 2.8776, "step": 15924 }, { "epoch": 0.43, "learning_rate": 0.0012782003145958287, "loss": 2.7089, "step": 15925 }, { "epoch": 0.43, "learning_rate": 0.0012781167103879266, "loss": 2.5267, "step": 15926 }, { "epoch": 0.43, "learning_rate": 0.0012780331040730623, "loss": 2.3341, "step": 15927 }, { "epoch": 0.43, "learning_rate": 0.0012779494956518685, "loss": 2.7221, "step": 15928 }, { "epoch": 0.43, "learning_rate": 0.001277865885124979, "loss": 2.564, "step": 15929 }, { "epoch": 0.43, "learning_rate": 0.0012777822724930274, "loss": 2.5791, "step": 15930 }, { "epoch": 0.43, "learning_rate": 0.0012776986577566472, "loss": 2.2909, "step": 15931 }, { "epoch": 0.43, "learning_rate": 0.0012776150409164713, "loss": 1.9765, "step": 15932 }, { "epoch": 0.43, "learning_rate": 0.0012775314219731335, "loss": 2.7036, "step": 15933 }, { "epoch": 0.43, "learning_rate": 0.0012774478009272673, "loss": 2.8789, "step": 15934 }, { "epoch": 0.43, "learning_rate": 0.0012773641777795062, "loss": 2.5539, "step": 15935 }, { "epoch": 0.43, "learning_rate": 0.0012772805525304838, "loss": 2.4265, "step": 15936 }, { "epoch": 0.43, "learning_rate": 0.0012771969251808334, "loss": 2.9431, "step": 15937 }, { "epoch": 0.43, "learning_rate": 0.0012771132957311883, "loss": 2.7323, "step": 15938 }, { "epoch": 0.43, "learning_rate": 0.001277029664182183, "loss": 2.6893, "step": 15939 }, { "epoch": 0.43, "learning_rate": 0.0012769460305344506, "loss": 3.1514, "step": 15940 }, { "epoch": 0.43, "learning_rate": 0.001276862394788624, "loss": 2.6989, "step": 15941 }, { "epoch": 0.43, "learning_rate": 0.0012767787569453375, "loss": 2.7604, "step": 15942 }, { "epoch": 0.43, "learning_rate": 0.0012766951170052247, "loss": 2.3958, "step": 15943 }, { "epoch": 0.43, "learning_rate": 0.0012766114749689194, "loss": 2.535, "step": 15944 }, { "epoch": 0.43, "learning_rate": 0.0012765278308370545, "loss": 2.5931, "step": 15945 }, { "epoch": 0.43, "learning_rate": 0.0012764441846102649, "loss": 2.2465, "step": 15946 }, { "epoch": 0.43, "learning_rate": 0.0012763605362891832, "loss": 2.4814, "step": 15947 }, { "epoch": 0.43, "learning_rate": 0.0012762768858744433, "loss": 2.4318, "step": 15948 }, { "epoch": 0.43, "learning_rate": 0.0012761932333666792, "loss": 2.3836, "step": 15949 }, { "epoch": 0.43, "learning_rate": 0.0012761095787665248, "loss": 2.0593, "step": 15950 }, { "epoch": 0.43, "learning_rate": 0.0012760259220746134, "loss": 2.5671, "step": 15951 }, { "epoch": 0.43, "learning_rate": 0.0012759422632915788, "loss": 2.3238, "step": 15952 }, { "epoch": 0.43, "learning_rate": 0.0012758586024180555, "loss": 2.536, "step": 15953 }, { "epoch": 0.43, "learning_rate": 0.0012757749394546763, "loss": 2.5607, "step": 15954 }, { "epoch": 0.43, "learning_rate": 0.0012756912744020755, "loss": 2.1774, "step": 15955 }, { "epoch": 0.43, "learning_rate": 0.001275607607260887, "loss": 2.715, "step": 15956 }, { "epoch": 0.43, "learning_rate": 0.0012755239380317445, "loss": 2.4115, "step": 15957 }, { "epoch": 0.43, "learning_rate": 0.0012754402667152817, "loss": 2.3443, "step": 15958 }, { "epoch": 0.43, "learning_rate": 0.001275356593312133, "loss": 2.8029, "step": 15959 }, { "epoch": 0.43, "learning_rate": 0.0012752729178229318, "loss": 2.6212, "step": 15960 }, { "epoch": 0.43, "learning_rate": 0.0012751892402483123, "loss": 2.1423, "step": 15961 }, { "epoch": 0.43, "learning_rate": 0.001275105560588908, "loss": 2.3519, "step": 15962 }, { "epoch": 0.43, "learning_rate": 0.0012750218788453536, "loss": 2.7221, "step": 15963 }, { "epoch": 0.43, "learning_rate": 0.0012749381950182823, "loss": 2.611, "step": 15964 }, { "epoch": 0.43, "learning_rate": 0.0012748545091083286, "loss": 2.3431, "step": 15965 }, { "epoch": 0.43, "learning_rate": 0.0012747708211161262, "loss": 2.3927, "step": 15966 }, { "epoch": 0.43, "learning_rate": 0.0012746871310423094, "loss": 2.6299, "step": 15967 }, { "epoch": 0.43, "learning_rate": 0.0012746034388875114, "loss": 2.7247, "step": 15968 }, { "epoch": 0.43, "learning_rate": 0.0012745197446523673, "loss": 2.8302, "step": 15969 }, { "epoch": 0.43, "learning_rate": 0.0012744360483375107, "loss": 2.6905, "step": 15970 }, { "epoch": 0.43, "learning_rate": 0.0012743523499435757, "loss": 2.6434, "step": 15971 }, { "epoch": 0.43, "learning_rate": 0.001274268649471196, "loss": 2.3985, "step": 15972 }, { "epoch": 0.43, "learning_rate": 0.0012741849469210065, "loss": 2.5264, "step": 15973 }, { "epoch": 0.43, "learning_rate": 0.0012741012422936406, "loss": 2.6443, "step": 15974 }, { "epoch": 0.43, "learning_rate": 0.0012740175355897328, "loss": 2.5664, "step": 15975 }, { "epoch": 0.43, "learning_rate": 0.001273933826809917, "loss": 2.3471, "step": 15976 }, { "epoch": 0.43, "learning_rate": 0.0012738501159548275, "loss": 2.3618, "step": 15977 }, { "epoch": 0.43, "learning_rate": 0.0012737664030250983, "loss": 2.7988, "step": 15978 }, { "epoch": 0.43, "learning_rate": 0.0012736826880213644, "loss": 2.7532, "step": 15979 }, { "epoch": 0.43, "learning_rate": 0.0012735989709442587, "loss": 3.0609, "step": 15980 }, { "epoch": 0.43, "learning_rate": 0.0012735152517944167, "loss": 2.3057, "step": 15981 }, { "epoch": 0.43, "learning_rate": 0.0012734315305724718, "loss": 2.6734, "step": 15982 }, { "epoch": 0.43, "learning_rate": 0.0012733478072790585, "loss": 2.5634, "step": 15983 }, { "epoch": 0.43, "learning_rate": 0.001273264081914811, "loss": 2.3569, "step": 15984 }, { "epoch": 0.43, "learning_rate": 0.0012731803544803637, "loss": 2.7512, "step": 15985 }, { "epoch": 0.43, "learning_rate": 0.0012730966249763509, "loss": 2.6742, "step": 15986 }, { "epoch": 0.43, "learning_rate": 0.001273012893403407, "loss": 2.5368, "step": 15987 }, { "epoch": 0.43, "learning_rate": 0.0012729291597621659, "loss": 2.6619, "step": 15988 }, { "epoch": 0.43, "learning_rate": 0.0012728454240532624, "loss": 2.7586, "step": 15989 }, { "epoch": 0.43, "learning_rate": 0.0012727616862773313, "loss": 2.6494, "step": 15990 }, { "epoch": 0.43, "learning_rate": 0.0012726779464350057, "loss": 2.016, "step": 15991 }, { "epoch": 0.43, "learning_rate": 0.001272594204526921, "loss": 2.2938, "step": 15992 }, { "epoch": 0.43, "learning_rate": 0.0012725104605537116, "loss": 2.6469, "step": 15993 }, { "epoch": 0.43, "learning_rate": 0.0012724267145160114, "loss": 2.0798, "step": 15994 }, { "epoch": 0.43, "learning_rate": 0.0012723429664144553, "loss": 2.4032, "step": 15995 }, { "epoch": 0.43, "learning_rate": 0.0012722592162496772, "loss": 2.7, "step": 15996 }, { "epoch": 0.43, "learning_rate": 0.0012721754640223123, "loss": 2.5283, "step": 15997 }, { "epoch": 0.43, "learning_rate": 0.0012720917097329945, "loss": 2.1959, "step": 15998 }, { "epoch": 0.43, "learning_rate": 0.0012720079533823586, "loss": 2.6888, "step": 15999 }, { "epoch": 0.43, "learning_rate": 0.0012719241949710391, "loss": 2.4829, "step": 16000 }, { "epoch": 0.43, "learning_rate": 0.0012718404344996706, "loss": 2.3613, "step": 16001 }, { "epoch": 0.43, "learning_rate": 0.0012717566719688878, "loss": 2.7292, "step": 16002 }, { "epoch": 0.43, "learning_rate": 0.0012716729073793244, "loss": 2.1233, "step": 16003 }, { "epoch": 0.43, "learning_rate": 0.001271589140731616, "loss": 2.4187, "step": 16004 }, { "epoch": 0.43, "learning_rate": 0.0012715053720263971, "loss": 2.4219, "step": 16005 }, { "epoch": 0.43, "learning_rate": 0.0012714216012643018, "loss": 2.3677, "step": 16006 }, { "epoch": 0.43, "learning_rate": 0.0012713378284459648, "loss": 2.6027, "step": 16007 }, { "epoch": 0.43, "learning_rate": 0.001271254053572021, "loss": 2.8829, "step": 16008 }, { "epoch": 0.43, "learning_rate": 0.0012711702766431052, "loss": 2.7188, "step": 16009 }, { "epoch": 0.43, "learning_rate": 0.001271086497659852, "loss": 3.0102, "step": 16010 }, { "epoch": 0.43, "learning_rate": 0.0012710027166228952, "loss": 2.9574, "step": 16011 }, { "epoch": 0.43, "learning_rate": 0.0012709189335328708, "loss": 2.6033, "step": 16012 }, { "epoch": 0.43, "learning_rate": 0.0012708351483904133, "loss": 2.5364, "step": 16013 }, { "epoch": 0.43, "learning_rate": 0.0012707513611961566, "loss": 2.668, "step": 16014 }, { "epoch": 0.43, "learning_rate": 0.0012706675719507362, "loss": 2.6517, "step": 16015 }, { "epoch": 0.43, "learning_rate": 0.0012705837806547865, "loss": 2.4544, "step": 16016 }, { "epoch": 0.43, "learning_rate": 0.0012704999873089427, "loss": 2.3447, "step": 16017 }, { "epoch": 0.43, "learning_rate": 0.0012704161919138393, "loss": 2.4187, "step": 16018 }, { "epoch": 0.43, "learning_rate": 0.001270332394470111, "loss": 2.0453, "step": 16019 }, { "epoch": 0.43, "learning_rate": 0.001270248594978393, "loss": 2.4195, "step": 16020 }, { "epoch": 0.43, "learning_rate": 0.00127016479343932, "loss": 2.3663, "step": 16021 }, { "epoch": 0.43, "learning_rate": 0.0012700809898535267, "loss": 2.7958, "step": 16022 }, { "epoch": 0.43, "learning_rate": 0.001269997184221648, "loss": 2.6208, "step": 16023 }, { "epoch": 0.43, "learning_rate": 0.0012699133765443188, "loss": 2.5121, "step": 16024 }, { "epoch": 0.43, "learning_rate": 0.0012698295668221746, "loss": 2.8285, "step": 16025 }, { "epoch": 0.43, "learning_rate": 0.0012697457550558497, "loss": 2.679, "step": 16026 }, { "epoch": 0.43, "learning_rate": 0.001269661941245979, "loss": 2.2853, "step": 16027 }, { "epoch": 0.43, "learning_rate": 0.0012695781253931975, "loss": 2.6493, "step": 16028 }, { "epoch": 0.43, "learning_rate": 0.0012694943074981406, "loss": 2.7565, "step": 16029 }, { "epoch": 0.43, "learning_rate": 0.001269410487561443, "loss": 2.389, "step": 16030 }, { "epoch": 0.43, "learning_rate": 0.0012693266655837397, "loss": 2.5876, "step": 16031 }, { "epoch": 0.43, "learning_rate": 0.0012692428415656655, "loss": 2.7817, "step": 16032 }, { "epoch": 0.43, "learning_rate": 0.001269159015507856, "loss": 2.7835, "step": 16033 }, { "epoch": 0.43, "learning_rate": 0.0012690751874109459, "loss": 2.648, "step": 16034 }, { "epoch": 0.43, "learning_rate": 0.00126899135727557, "loss": 2.4195, "step": 16035 }, { "epoch": 0.43, "learning_rate": 0.0012689075251023638, "loss": 2.6265, "step": 16036 }, { "epoch": 0.43, "learning_rate": 0.0012688236908919624, "loss": 2.2867, "step": 16037 }, { "epoch": 0.43, "learning_rate": 0.0012687398546450007, "loss": 2.2696, "step": 16038 }, { "epoch": 0.43, "learning_rate": 0.0012686560163621139, "loss": 2.7442, "step": 16039 }, { "epoch": 0.43, "learning_rate": 0.001268572176043937, "loss": 2.4162, "step": 16040 }, { "epoch": 0.43, "learning_rate": 0.0012684883336911055, "loss": 2.3744, "step": 16041 }, { "epoch": 0.43, "learning_rate": 0.0012684044893042543, "loss": 2.6371, "step": 16042 }, { "epoch": 0.43, "learning_rate": 0.0012683206428840189, "loss": 2.168, "step": 16043 }, { "epoch": 0.43, "learning_rate": 0.0012682367944310338, "loss": 2.5494, "step": 16044 }, { "epoch": 0.43, "learning_rate": 0.0012681529439459351, "loss": 2.2182, "step": 16045 }, { "epoch": 0.43, "learning_rate": 0.0012680690914293575, "loss": 2.9852, "step": 16046 }, { "epoch": 0.43, "learning_rate": 0.0012679852368819363, "loss": 3.1512, "step": 16047 }, { "epoch": 0.43, "learning_rate": 0.001267901380304307, "loss": 2.8291, "step": 16048 }, { "epoch": 0.43, "learning_rate": 0.001267817521697105, "loss": 2.7342, "step": 16049 }, { "epoch": 0.43, "learning_rate": 0.001267733661060965, "loss": 2.3124, "step": 16050 }, { "epoch": 0.43, "learning_rate": 0.0012676497983965225, "loss": 2.5883, "step": 16051 }, { "epoch": 0.43, "learning_rate": 0.0012675659337044133, "loss": 2.6549, "step": 16052 }, { "epoch": 0.43, "learning_rate": 0.0012674820669852725, "loss": 2.6307, "step": 16053 }, { "epoch": 0.43, "learning_rate": 0.0012673981982397348, "loss": 2.2339, "step": 16054 }, { "epoch": 0.43, "learning_rate": 0.0012673143274684368, "loss": 2.2105, "step": 16055 }, { "epoch": 0.43, "learning_rate": 0.001267230454672013, "loss": 2.5819, "step": 16056 }, { "epoch": 0.43, "learning_rate": 0.0012671465798510988, "loss": 2.7906, "step": 16057 }, { "epoch": 0.43, "learning_rate": 0.0012670627030063302, "loss": 2.4441, "step": 16058 }, { "epoch": 0.43, "learning_rate": 0.0012669788241383422, "loss": 2.6244, "step": 16059 }, { "epoch": 0.43, "learning_rate": 0.0012668949432477702, "loss": 2.046, "step": 16060 }, { "epoch": 0.43, "learning_rate": 0.0012668110603352503, "loss": 2.8161, "step": 16061 }, { "epoch": 0.43, "learning_rate": 0.001266727175401417, "loss": 2.6688, "step": 16062 }, { "epoch": 0.43, "learning_rate": 0.0012666432884469066, "loss": 2.3618, "step": 16063 }, { "epoch": 0.43, "learning_rate": 0.0012665593994723543, "loss": 2.3268, "step": 16064 }, { "epoch": 0.43, "learning_rate": 0.0012664755084783957, "loss": 2.2449, "step": 16065 }, { "epoch": 0.43, "learning_rate": 0.001266391615465666, "loss": 2.4309, "step": 16066 }, { "epoch": 0.43, "learning_rate": 0.001266307720434801, "loss": 2.6582, "step": 16067 }, { "epoch": 0.43, "learning_rate": 0.0012662238233864366, "loss": 2.3311, "step": 16068 }, { "epoch": 0.43, "learning_rate": 0.0012661399243212084, "loss": 2.7811, "step": 16069 }, { "epoch": 0.43, "learning_rate": 0.0012660560232397513, "loss": 2.4107, "step": 16070 }, { "epoch": 0.43, "learning_rate": 0.0012659721201427013, "loss": 2.04, "step": 16071 }, { "epoch": 0.43, "learning_rate": 0.0012658882150306942, "loss": 2.1279, "step": 16072 }, { "epoch": 0.43, "learning_rate": 0.0012658043079043653, "loss": 2.5631, "step": 16073 }, { "epoch": 0.43, "learning_rate": 0.0012657203987643507, "loss": 2.8278, "step": 16074 }, { "epoch": 0.43, "learning_rate": 0.0012656364876112859, "loss": 2.3927, "step": 16075 }, { "epoch": 0.43, "learning_rate": 0.0012655525744458065, "loss": 2.6221, "step": 16076 }, { "epoch": 0.43, "learning_rate": 0.001265468659268548, "loss": 2.4441, "step": 16077 }, { "epoch": 0.43, "learning_rate": 0.0012653847420801467, "loss": 3.0762, "step": 16078 }, { "epoch": 0.43, "learning_rate": 0.0012653008228812384, "loss": 2.5388, "step": 16079 }, { "epoch": 0.43, "learning_rate": 0.001265216901672458, "loss": 1.8963, "step": 16080 }, { "epoch": 0.43, "learning_rate": 0.0012651329784544416, "loss": 2.7197, "step": 16081 }, { "epoch": 0.43, "learning_rate": 0.0012650490532278257, "loss": 2.3322, "step": 16082 }, { "epoch": 0.43, "learning_rate": 0.0012649651259932452, "loss": 2.4859, "step": 16083 }, { "epoch": 0.43, "learning_rate": 0.0012648811967513366, "loss": 2.1302, "step": 16084 }, { "epoch": 0.43, "learning_rate": 0.0012647972655027348, "loss": 2.9613, "step": 16085 }, { "epoch": 0.43, "learning_rate": 0.001264713332248077, "loss": 2.3073, "step": 16086 }, { "epoch": 0.43, "learning_rate": 0.0012646293969879978, "loss": 2.5, "step": 16087 }, { "epoch": 0.43, "learning_rate": 0.0012645454597231339, "loss": 2.5931, "step": 16088 }, { "epoch": 0.43, "learning_rate": 0.0012644615204541205, "loss": 2.5811, "step": 16089 }, { "epoch": 0.43, "learning_rate": 0.001264377579181594, "loss": 2.555, "step": 16090 }, { "epoch": 0.43, "learning_rate": 0.0012642936359061907, "loss": 2.3336, "step": 16091 }, { "epoch": 0.43, "learning_rate": 0.0012642096906285458, "loss": 2.3976, "step": 16092 }, { "epoch": 0.43, "learning_rate": 0.0012641257433492954, "loss": 2.6853, "step": 16093 }, { "epoch": 0.43, "learning_rate": 0.0012640417940690755, "loss": 2.7278, "step": 16094 }, { "epoch": 0.43, "learning_rate": 0.0012639578427885226, "loss": 2.5373, "step": 16095 }, { "epoch": 0.43, "learning_rate": 0.0012638738895082717, "loss": 2.3972, "step": 16096 }, { "epoch": 0.43, "learning_rate": 0.0012637899342289596, "loss": 2.4004, "step": 16097 }, { "epoch": 0.43, "learning_rate": 0.0012637059769512226, "loss": 3.0962, "step": 16098 }, { "epoch": 0.43, "learning_rate": 0.0012636220176756958, "loss": 2.5147, "step": 16099 }, { "epoch": 0.43, "learning_rate": 0.0012635380564030158, "loss": 2.8628, "step": 16100 }, { "epoch": 0.43, "learning_rate": 0.0012634540931338184, "loss": 2.1731, "step": 16101 }, { "epoch": 0.43, "learning_rate": 0.00126337012786874, "loss": 2.2598, "step": 16102 }, { "epoch": 0.43, "learning_rate": 0.0012632861606084167, "loss": 2.1587, "step": 16103 }, { "epoch": 0.43, "learning_rate": 0.0012632021913534849, "loss": 3.0451, "step": 16104 }, { "epoch": 0.43, "learning_rate": 0.0012631182201045797, "loss": 2.5096, "step": 16105 }, { "epoch": 0.43, "learning_rate": 0.0012630342468623384, "loss": 2.6892, "step": 16106 }, { "epoch": 0.43, "learning_rate": 0.0012629502716273962, "loss": 2.5273, "step": 16107 }, { "epoch": 0.43, "learning_rate": 0.0012628662944003902, "loss": 2.5679, "step": 16108 }, { "epoch": 0.43, "learning_rate": 0.0012627823151819557, "loss": 2.4028, "step": 16109 }, { "epoch": 0.43, "learning_rate": 0.0012626983339727295, "loss": 2.5866, "step": 16110 }, { "epoch": 0.43, "learning_rate": 0.001262614350773348, "loss": 2.7502, "step": 16111 }, { "epoch": 0.43, "learning_rate": 0.001262530365584447, "loss": 2.2528, "step": 16112 }, { "epoch": 0.43, "learning_rate": 0.0012624463784066627, "loss": 2.776, "step": 16113 }, { "epoch": 0.43, "learning_rate": 0.0012623623892406316, "loss": 2.4358, "step": 16114 }, { "epoch": 0.43, "learning_rate": 0.0012622783980869904, "loss": 2.4872, "step": 16115 }, { "epoch": 0.43, "learning_rate": 0.0012621944049463743, "loss": 2.6608, "step": 16116 }, { "epoch": 0.43, "learning_rate": 0.0012621104098194205, "loss": 2.209, "step": 16117 }, { "epoch": 0.43, "learning_rate": 0.001262026412706765, "loss": 2.1341, "step": 16118 }, { "epoch": 0.43, "learning_rate": 0.0012619424136090446, "loss": 2.8665, "step": 16119 }, { "epoch": 0.43, "learning_rate": 0.0012618584125268948, "loss": 2.001, "step": 16120 }, { "epoch": 0.43, "learning_rate": 0.001261774409460953, "loss": 2.3186, "step": 16121 }, { "epoch": 0.43, "learning_rate": 0.001261690404411855, "loss": 2.7898, "step": 16122 }, { "epoch": 0.43, "learning_rate": 0.0012616063973802368, "loss": 2.2389, "step": 16123 }, { "epoch": 0.43, "learning_rate": 0.0012615223883667354, "loss": 3.0196, "step": 16124 }, { "epoch": 0.43, "learning_rate": 0.0012614383773719875, "loss": 2.2575, "step": 16125 }, { "epoch": 0.43, "learning_rate": 0.0012613543643966289, "loss": 2.7925, "step": 16126 }, { "epoch": 0.43, "learning_rate": 0.0012612703494412967, "loss": 2.5281, "step": 16127 }, { "epoch": 0.43, "learning_rate": 0.001261186332506627, "loss": 2.713, "step": 16128 }, { "epoch": 0.43, "learning_rate": 0.001261102313593256, "loss": 2.7196, "step": 16129 }, { "epoch": 0.43, "learning_rate": 0.0012610182927018207, "loss": 2.6949, "step": 16130 }, { "epoch": 0.43, "learning_rate": 0.0012609342698329579, "loss": 2.7642, "step": 16131 }, { "epoch": 0.43, "learning_rate": 0.0012608502449873032, "loss": 2.8372, "step": 16132 }, { "epoch": 0.43, "learning_rate": 0.0012607662181654935, "loss": 2.5369, "step": 16133 }, { "epoch": 0.43, "learning_rate": 0.001260682189368166, "loss": 2.599, "step": 16134 }, { "epoch": 0.43, "learning_rate": 0.001260598158595957, "loss": 2.1481, "step": 16135 }, { "epoch": 0.43, "learning_rate": 0.0012605141258495026, "loss": 2.7661, "step": 16136 }, { "epoch": 0.43, "learning_rate": 0.0012604300911294396, "loss": 2.4756, "step": 16137 }, { "epoch": 0.43, "learning_rate": 0.0012603460544364051, "loss": 2.3424, "step": 16138 }, { "epoch": 0.43, "learning_rate": 0.0012602620157710354, "loss": 2.8789, "step": 16139 }, { "epoch": 0.43, "learning_rate": 0.001260177975133967, "loss": 2.3403, "step": 16140 }, { "epoch": 0.43, "learning_rate": 0.0012600939325258368, "loss": 2.4953, "step": 16141 }, { "epoch": 0.43, "learning_rate": 0.001260009887947282, "loss": 3.0449, "step": 16142 }, { "epoch": 0.43, "learning_rate": 0.001259925841398938, "loss": 2.1944, "step": 16143 }, { "epoch": 0.43, "learning_rate": 0.0012598417928814428, "loss": 2.1763, "step": 16144 }, { "epoch": 0.43, "learning_rate": 0.0012597577423954325, "loss": 2.5603, "step": 16145 }, { "epoch": 0.43, "learning_rate": 0.001259673689941544, "loss": 2.5839, "step": 16146 }, { "epoch": 0.43, "learning_rate": 0.0012595896355204143, "loss": 2.6298, "step": 16147 }, { "epoch": 0.43, "learning_rate": 0.0012595055791326793, "loss": 2.2104, "step": 16148 }, { "epoch": 0.43, "learning_rate": 0.001259421520778977, "loss": 2.4583, "step": 16149 }, { "epoch": 0.43, "learning_rate": 0.0012593374604599433, "loss": 2.2835, "step": 16150 }, { "epoch": 0.43, "learning_rate": 0.0012592533981762154, "loss": 2.4375, "step": 16151 }, { "epoch": 0.43, "learning_rate": 0.0012591693339284303, "loss": 2.5652, "step": 16152 }, { "epoch": 0.43, "learning_rate": 0.0012590852677172243, "loss": 2.4134, "step": 16153 }, { "epoch": 0.43, "learning_rate": 0.001259001199543235, "loss": 2.3796, "step": 16154 }, { "epoch": 0.43, "learning_rate": 0.001258917129407099, "loss": 2.5927, "step": 16155 }, { "epoch": 0.43, "learning_rate": 0.0012588330573094525, "loss": 2.3397, "step": 16156 }, { "epoch": 0.43, "learning_rate": 0.0012587489832509339, "loss": 1.9765, "step": 16157 }, { "epoch": 0.43, "learning_rate": 0.0012586649072321788, "loss": 2.9484, "step": 16158 }, { "epoch": 0.43, "learning_rate": 0.0012585808292538245, "loss": 2.9321, "step": 16159 }, { "epoch": 0.43, "learning_rate": 0.001258496749316508, "loss": 2.8318, "step": 16160 }, { "epoch": 0.43, "learning_rate": 0.0012584126674208668, "loss": 2.6743, "step": 16161 }, { "epoch": 0.43, "learning_rate": 0.0012583285835675371, "loss": 2.3823, "step": 16162 }, { "epoch": 0.43, "learning_rate": 0.0012582444977571562, "loss": 2.7175, "step": 16163 }, { "epoch": 0.43, "learning_rate": 0.0012581604099903615, "loss": 2.6921, "step": 16164 }, { "epoch": 0.43, "learning_rate": 0.0012580763202677894, "loss": 2.2857, "step": 16165 }, { "epoch": 0.43, "learning_rate": 0.001257992228590077, "loss": 2.7089, "step": 16166 }, { "epoch": 0.43, "learning_rate": 0.001257908134957862, "loss": 2.6312, "step": 16167 }, { "epoch": 0.43, "learning_rate": 0.001257824039371781, "loss": 2.3816, "step": 16168 }, { "epoch": 0.43, "learning_rate": 0.001257739941832471, "loss": 2.4315, "step": 16169 }, { "epoch": 0.43, "learning_rate": 0.0012576558423405696, "loss": 3.0083, "step": 16170 }, { "epoch": 0.43, "learning_rate": 0.0012575717408967134, "loss": 2.4495, "step": 16171 }, { "epoch": 0.43, "learning_rate": 0.00125748763750154, "loss": 2.7928, "step": 16172 }, { "epoch": 0.43, "learning_rate": 0.0012574035321556859, "loss": 2.4136, "step": 16173 }, { "epoch": 0.43, "learning_rate": 0.0012573194248597889, "loss": 2.8658, "step": 16174 }, { "epoch": 0.43, "learning_rate": 0.0012572353156144857, "loss": 2.2208, "step": 16175 }, { "epoch": 0.43, "learning_rate": 0.001257151204420414, "loss": 2.8693, "step": 16176 }, { "epoch": 0.43, "learning_rate": 0.0012570670912782104, "loss": 2.7631, "step": 16177 }, { "epoch": 0.43, "learning_rate": 0.001256982976188513, "loss": 2.7527, "step": 16178 }, { "epoch": 0.43, "learning_rate": 0.001256898859151958, "loss": 2.6854, "step": 16179 }, { "epoch": 0.43, "learning_rate": 0.0012568147401691833, "loss": 2.2358, "step": 16180 }, { "epoch": 0.43, "learning_rate": 0.0012567306192408263, "loss": 2.4557, "step": 16181 }, { "epoch": 0.43, "learning_rate": 0.0012566464963675238, "loss": 2.7113, "step": 16182 }, { "epoch": 0.43, "learning_rate": 0.0012565623715499134, "loss": 2.8451, "step": 16183 }, { "epoch": 0.43, "learning_rate": 0.0012564782447886324, "loss": 2.9118, "step": 16184 }, { "epoch": 0.43, "learning_rate": 0.0012563941160843182, "loss": 2.7978, "step": 16185 }, { "epoch": 0.43, "learning_rate": 0.0012563099854376078, "loss": 2.9176, "step": 16186 }, { "epoch": 0.44, "learning_rate": 0.0012562258528491387, "loss": 2.7025, "step": 16187 }, { "epoch": 0.44, "learning_rate": 0.0012561417183195485, "loss": 2.7805, "step": 16188 }, { "epoch": 0.44, "learning_rate": 0.001256057581849474, "loss": 2.7622, "step": 16189 }, { "epoch": 0.44, "learning_rate": 0.0012559734434395536, "loss": 2.7067, "step": 16190 }, { "epoch": 0.44, "learning_rate": 0.0012558893030904241, "loss": 2.3016, "step": 16191 }, { "epoch": 0.44, "learning_rate": 0.0012558051608027227, "loss": 2.9194, "step": 16192 }, { "epoch": 0.44, "learning_rate": 0.0012557210165770876, "loss": 2.9736, "step": 16193 }, { "epoch": 0.44, "learning_rate": 0.0012556368704141553, "loss": 2.3316, "step": 16194 }, { "epoch": 0.44, "learning_rate": 0.0012555527223145641, "loss": 2.7671, "step": 16195 }, { "epoch": 0.44, "learning_rate": 0.001255468572278951, "loss": 2.8095, "step": 16196 }, { "epoch": 0.44, "learning_rate": 0.0012553844203079538, "loss": 2.5508, "step": 16197 }, { "epoch": 0.44, "learning_rate": 0.0012553002664022097, "loss": 2.9578, "step": 16198 }, { "epoch": 0.44, "learning_rate": 0.0012552161105623565, "loss": 2.5907, "step": 16199 }, { "epoch": 0.44, "learning_rate": 0.0012551319527890317, "loss": 2.6079, "step": 16200 }, { "epoch": 0.44, "learning_rate": 0.001255047793082873, "loss": 2.6786, "step": 16201 }, { "epoch": 0.44, "learning_rate": 0.0012549636314445175, "loss": 2.3455, "step": 16202 }, { "epoch": 0.44, "learning_rate": 0.0012548794678746034, "loss": 2.9862, "step": 16203 }, { "epoch": 0.44, "learning_rate": 0.001254795302373768, "loss": 2.5345, "step": 16204 }, { "epoch": 0.44, "learning_rate": 0.0012547111349426486, "loss": 2.3814, "step": 16205 }, { "epoch": 0.44, "learning_rate": 0.0012546269655818833, "loss": 2.6068, "step": 16206 }, { "epoch": 0.44, "learning_rate": 0.00125454279429211, "loss": 2.6541, "step": 16207 }, { "epoch": 0.44, "learning_rate": 0.0012544586210739657, "loss": 2.9309, "step": 16208 }, { "epoch": 0.44, "learning_rate": 0.0012543744459280887, "loss": 2.3356, "step": 16209 }, { "epoch": 0.44, "learning_rate": 0.0012542902688551156, "loss": 2.771, "step": 16210 }, { "epoch": 0.44, "learning_rate": 0.0012542060898556855, "loss": 2.2838, "step": 16211 }, { "epoch": 0.44, "learning_rate": 0.0012541219089304354, "loss": 2.3272, "step": 16212 }, { "epoch": 0.44, "learning_rate": 0.0012540377260800034, "loss": 2.4463, "step": 16213 }, { "epoch": 0.44, "learning_rate": 0.0012539535413050268, "loss": 2.1486, "step": 16214 }, { "epoch": 0.44, "learning_rate": 0.0012538693546061434, "loss": 2.791, "step": 16215 }, { "epoch": 0.44, "learning_rate": 0.0012537851659839912, "loss": 2.3193, "step": 16216 }, { "epoch": 0.44, "learning_rate": 0.001253700975439208, "loss": 2.7178, "step": 16217 }, { "epoch": 0.44, "learning_rate": 0.0012536167829724316, "loss": 2.3066, "step": 16218 }, { "epoch": 0.44, "learning_rate": 0.0012535325885843, "loss": 2.427, "step": 16219 }, { "epoch": 0.44, "learning_rate": 0.0012534483922754505, "loss": 2.6112, "step": 16220 }, { "epoch": 0.44, "learning_rate": 0.0012533641940465216, "loss": 2.7497, "step": 16221 }, { "epoch": 0.44, "learning_rate": 0.0012532799938981506, "loss": 2.677, "step": 16222 }, { "epoch": 0.44, "learning_rate": 0.0012531957918309757, "loss": 2.7689, "step": 16223 }, { "epoch": 0.44, "learning_rate": 0.001253111587845635, "loss": 2.55, "step": 16224 }, { "epoch": 0.44, "learning_rate": 0.0012530273819427657, "loss": 2.7954, "step": 16225 }, { "epoch": 0.44, "learning_rate": 0.0012529431741230064, "loss": 2.1354, "step": 16226 }, { "epoch": 0.44, "learning_rate": 0.0012528589643869949, "loss": 2.2885, "step": 16227 }, { "epoch": 0.44, "learning_rate": 0.0012527747527353692, "loss": 2.5747, "step": 16228 }, { "epoch": 0.44, "learning_rate": 0.0012526905391687668, "loss": 2.3301, "step": 16229 }, { "epoch": 0.44, "learning_rate": 0.0012526063236878264, "loss": 3.0421, "step": 16230 }, { "epoch": 0.44, "learning_rate": 0.0012525221062931857, "loss": 2.4933, "step": 16231 }, { "epoch": 0.44, "learning_rate": 0.0012524378869854824, "loss": 2.7688, "step": 16232 }, { "epoch": 0.44, "learning_rate": 0.0012523536657653546, "loss": 2.4836, "step": 16233 }, { "epoch": 0.44, "learning_rate": 0.001252269442633441, "loss": 2.6781, "step": 16234 }, { "epoch": 0.44, "learning_rate": 0.0012521852175903792, "loss": 2.4613, "step": 16235 }, { "epoch": 0.44, "learning_rate": 0.0012521009906368073, "loss": 3.3004, "step": 16236 }, { "epoch": 0.44, "learning_rate": 0.0012520167617733628, "loss": 2.5686, "step": 16237 }, { "epoch": 0.44, "learning_rate": 0.0012519325310006851, "loss": 2.4389, "step": 16238 }, { "epoch": 0.44, "learning_rate": 0.0012518482983194111, "loss": 2.5206, "step": 16239 }, { "epoch": 0.44, "learning_rate": 0.0012517640637301796, "loss": 2.5753, "step": 16240 }, { "epoch": 0.44, "learning_rate": 0.0012516798272336285, "loss": 2.7855, "step": 16241 }, { "epoch": 0.44, "learning_rate": 0.001251595588830396, "loss": 2.5902, "step": 16242 }, { "epoch": 0.44, "learning_rate": 0.0012515113485211205, "loss": 2.5556, "step": 16243 }, { "epoch": 0.44, "learning_rate": 0.00125142710630644, "loss": 2.4134, "step": 16244 }, { "epoch": 0.44, "learning_rate": 0.0012513428621869923, "loss": 2.7876, "step": 16245 }, { "epoch": 0.44, "learning_rate": 0.0012512586161634164, "loss": 2.8176, "step": 16246 }, { "epoch": 0.44, "learning_rate": 0.0012511743682363501, "loss": 2.4485, "step": 16247 }, { "epoch": 0.44, "learning_rate": 0.0012510901184064314, "loss": 1.8706, "step": 16248 }, { "epoch": 0.44, "learning_rate": 0.0012510058666742989, "loss": 2.2285, "step": 16249 }, { "epoch": 0.44, "learning_rate": 0.001250921613040591, "loss": 2.42, "step": 16250 }, { "epoch": 0.44, "learning_rate": 0.0012508373575059462, "loss": 2.8752, "step": 16251 }, { "epoch": 0.44, "learning_rate": 0.0012507531000710017, "loss": 2.2904, "step": 16252 }, { "epoch": 0.44, "learning_rate": 0.001250668840736397, "loss": 2.9991, "step": 16253 }, { "epoch": 0.44, "learning_rate": 0.0012505845795027699, "loss": 2.6268, "step": 16254 }, { "epoch": 0.44, "learning_rate": 0.0012505003163707587, "loss": 2.7008, "step": 16255 }, { "epoch": 0.44, "learning_rate": 0.001250416051341002, "loss": 2.1233, "step": 16256 }, { "epoch": 0.44, "learning_rate": 0.001250331784414138, "loss": 2.803, "step": 16257 }, { "epoch": 0.44, "learning_rate": 0.001250247515590805, "loss": 2.5296, "step": 16258 }, { "epoch": 0.44, "learning_rate": 0.001250163244871642, "loss": 2.7792, "step": 16259 }, { "epoch": 0.44, "learning_rate": 0.001250078972257287, "loss": 1.9942, "step": 16260 }, { "epoch": 0.44, "learning_rate": 0.0012499946977483779, "loss": 2.3583, "step": 16261 }, { "epoch": 0.44, "learning_rate": 0.0012499104213455538, "loss": 2.6158, "step": 16262 }, { "epoch": 0.44, "learning_rate": 0.0012498261430494532, "loss": 2.5719, "step": 16263 }, { "epoch": 0.44, "learning_rate": 0.0012497418628607143, "loss": 2.5111, "step": 16264 }, { "epoch": 0.44, "learning_rate": 0.0012496575807799757, "loss": 2.2739, "step": 16265 }, { "epoch": 0.44, "learning_rate": 0.001249573296807876, "loss": 2.1288, "step": 16266 }, { "epoch": 0.44, "learning_rate": 0.0012494890109450536, "loss": 2.6904, "step": 16267 }, { "epoch": 0.44, "learning_rate": 0.001249404723192147, "loss": 3.0168, "step": 16268 }, { "epoch": 0.44, "learning_rate": 0.0012493204335497948, "loss": 2.6763, "step": 16269 }, { "epoch": 0.44, "learning_rate": 0.0012492361420186357, "loss": 2.763, "step": 16270 }, { "epoch": 0.44, "learning_rate": 0.0012491518485993078, "loss": 2.2897, "step": 16271 }, { "epoch": 0.44, "learning_rate": 0.0012490675532924502, "loss": 2.2164, "step": 16272 }, { "epoch": 0.44, "learning_rate": 0.0012489832560987019, "loss": 2.5951, "step": 16273 }, { "epoch": 0.44, "learning_rate": 0.0012488989570187004, "loss": 2.6027, "step": 16274 }, { "epoch": 0.44, "learning_rate": 0.001248814656053085, "loss": 2.278, "step": 16275 }, { "epoch": 0.44, "learning_rate": 0.0012487303532024941, "loss": 2.4421, "step": 16276 }, { "epoch": 0.44, "learning_rate": 0.0012486460484675667, "loss": 2.5504, "step": 16277 }, { "epoch": 0.44, "learning_rate": 0.0012485617418489412, "loss": 2.6026, "step": 16278 }, { "epoch": 0.44, "learning_rate": 0.0012484774333472565, "loss": 2.7936, "step": 16279 }, { "epoch": 0.44, "learning_rate": 0.0012483931229631511, "loss": 2.525, "step": 16280 }, { "epoch": 0.44, "learning_rate": 0.001248308810697264, "loss": 2.6067, "step": 16281 }, { "epoch": 0.44, "learning_rate": 0.0012482244965502335, "loss": 2.2358, "step": 16282 }, { "epoch": 0.44, "learning_rate": 0.0012481401805226986, "loss": 2.8838, "step": 16283 }, { "epoch": 0.44, "learning_rate": 0.001248055862615298, "loss": 2.5244, "step": 16284 }, { "epoch": 0.44, "learning_rate": 0.0012479715428286707, "loss": 2.6383, "step": 16285 }, { "epoch": 0.44, "learning_rate": 0.0012478872211634554, "loss": 2.3261, "step": 16286 }, { "epoch": 0.44, "learning_rate": 0.001247802897620291, "loss": 2.7875, "step": 16287 }, { "epoch": 0.44, "learning_rate": 0.0012477185721998154, "loss": 2.5139, "step": 16288 }, { "epoch": 0.44, "learning_rate": 0.0012476342449026687, "loss": 2.38, "step": 16289 }, { "epoch": 0.44, "learning_rate": 0.0012475499157294893, "loss": 2.2741, "step": 16290 }, { "epoch": 0.44, "learning_rate": 0.0012474655846809158, "loss": 2.504, "step": 16291 }, { "epoch": 0.44, "learning_rate": 0.0012473812517575873, "loss": 3.016, "step": 16292 }, { "epoch": 0.44, "learning_rate": 0.0012472969169601428, "loss": 2.7966, "step": 16293 }, { "epoch": 0.44, "learning_rate": 0.0012472125802892211, "loss": 2.7784, "step": 16294 }, { "epoch": 0.44, "learning_rate": 0.0012471282417454608, "loss": 2.7551, "step": 16295 }, { "epoch": 0.44, "learning_rate": 0.0012470439013295012, "loss": 2.438, "step": 16296 }, { "epoch": 0.44, "learning_rate": 0.0012469595590419815, "loss": 2.7769, "step": 16297 }, { "epoch": 0.44, "learning_rate": 0.0012468752148835402, "loss": 2.8258, "step": 16298 }, { "epoch": 0.44, "learning_rate": 0.001246790868854816, "loss": 2.6278, "step": 16299 }, { "epoch": 0.44, "learning_rate": 0.0012467065209564488, "loss": 2.2966, "step": 16300 }, { "epoch": 0.44, "learning_rate": 0.0012466221711890766, "loss": 2.3037, "step": 16301 }, { "epoch": 0.44, "learning_rate": 0.0012465378195533395, "loss": 2.4579, "step": 16302 }, { "epoch": 0.44, "learning_rate": 0.0012464534660498756, "loss": 2.561, "step": 16303 }, { "epoch": 0.44, "learning_rate": 0.0012463691106793244, "loss": 2.647, "step": 16304 }, { "epoch": 0.44, "learning_rate": 0.0012462847534423247, "loss": 2.9877, "step": 16305 }, { "epoch": 0.44, "learning_rate": 0.0012462003943395162, "loss": 2.6207, "step": 16306 }, { "epoch": 0.44, "learning_rate": 0.001246116033371537, "loss": 2.5629, "step": 16307 }, { "epoch": 0.44, "learning_rate": 0.001246031670539027, "loss": 1.6731, "step": 16308 }, { "epoch": 0.44, "learning_rate": 0.0012459473058426252, "loss": 2.2902, "step": 16309 }, { "epoch": 0.44, "learning_rate": 0.0012458629392829703, "loss": 2.3697, "step": 16310 }, { "epoch": 0.44, "learning_rate": 0.001245778570860702, "loss": 2.6631, "step": 16311 }, { "epoch": 0.44, "learning_rate": 0.0012456942005764588, "loss": 2.3984, "step": 16312 }, { "epoch": 0.44, "learning_rate": 0.0012456098284308805, "loss": 3.1006, "step": 16313 }, { "epoch": 0.44, "learning_rate": 0.001245525454424606, "loss": 2.6863, "step": 16314 }, { "epoch": 0.44, "learning_rate": 0.0012454410785582744, "loss": 2.4851, "step": 16315 }, { "epoch": 0.44, "learning_rate": 0.0012453567008325255, "loss": 2.6823, "step": 16316 }, { "epoch": 0.44, "learning_rate": 0.001245272321247998, "loss": 2.8042, "step": 16317 }, { "epoch": 0.44, "learning_rate": 0.001245187939805331, "loss": 2.4237, "step": 16318 }, { "epoch": 0.44, "learning_rate": 0.0012451035565051638, "loss": 2.7115, "step": 16319 }, { "epoch": 0.44, "learning_rate": 0.0012450191713481362, "loss": 2.8995, "step": 16320 }, { "epoch": 0.44, "learning_rate": 0.0012449347843348872, "loss": 2.9415, "step": 16321 }, { "epoch": 0.44, "learning_rate": 0.0012448503954660562, "loss": 2.5586, "step": 16322 }, { "epoch": 0.44, "learning_rate": 0.0012447660047422819, "loss": 2.8978, "step": 16323 }, { "epoch": 0.44, "learning_rate": 0.0012446816121642044, "loss": 2.9477, "step": 16324 }, { "epoch": 0.44, "learning_rate": 0.001244597217732463, "loss": 2.8839, "step": 16325 }, { "epoch": 0.44, "learning_rate": 0.0012445128214476965, "loss": 2.2937, "step": 16326 }, { "epoch": 0.44, "learning_rate": 0.0012444284233105445, "loss": 2.5498, "step": 16327 }, { "epoch": 0.44, "learning_rate": 0.0012443440233216466, "loss": 2.6625, "step": 16328 }, { "epoch": 0.44, "learning_rate": 0.0012442596214816421, "loss": 2.1729, "step": 16329 }, { "epoch": 0.44, "learning_rate": 0.0012441752177911704, "loss": 2.3084, "step": 16330 }, { "epoch": 0.44, "learning_rate": 0.0012440908122508705, "loss": 2.4992, "step": 16331 }, { "epoch": 0.44, "learning_rate": 0.001244006404861383, "loss": 2.2455, "step": 16332 }, { "epoch": 0.44, "learning_rate": 0.001243921995623346, "loss": 2.7561, "step": 16333 }, { "epoch": 0.44, "learning_rate": 0.0012438375845373996, "loss": 2.5086, "step": 16334 }, { "epoch": 0.44, "learning_rate": 0.0012437531716041833, "loss": 2.0961, "step": 16335 }, { "epoch": 0.44, "learning_rate": 0.001243668756824337, "loss": 2.6224, "step": 16336 }, { "epoch": 0.44, "learning_rate": 0.0012435843401984992, "loss": 2.5773, "step": 16337 }, { "epoch": 0.44, "learning_rate": 0.0012434999217273103, "loss": 2.422, "step": 16338 }, { "epoch": 0.44, "learning_rate": 0.0012434155014114095, "loss": 2.5488, "step": 16339 }, { "epoch": 0.44, "learning_rate": 0.0012433310792514362, "loss": 2.9097, "step": 16340 }, { "epoch": 0.44, "learning_rate": 0.0012432466552480302, "loss": 2.1415, "step": 16341 }, { "epoch": 0.44, "learning_rate": 0.001243162229401831, "loss": 2.3532, "step": 16342 }, { "epoch": 0.44, "learning_rate": 0.0012430778017134786, "loss": 2.5521, "step": 16343 }, { "epoch": 0.44, "learning_rate": 0.0012429933721836118, "loss": 2.7511, "step": 16344 }, { "epoch": 0.44, "learning_rate": 0.0012429089408128708, "loss": 2.5986, "step": 16345 }, { "epoch": 0.44, "learning_rate": 0.001242824507601895, "loss": 2.4469, "step": 16346 }, { "epoch": 0.44, "learning_rate": 0.0012427400725513245, "loss": 2.4364, "step": 16347 }, { "epoch": 0.44, "learning_rate": 0.0012426556356617982, "loss": 2.6087, "step": 16348 }, { "epoch": 0.44, "learning_rate": 0.0012425711969339564, "loss": 2.5932, "step": 16349 }, { "epoch": 0.44, "learning_rate": 0.0012424867563684383, "loss": 2.3515, "step": 16350 }, { "epoch": 0.44, "learning_rate": 0.0012424023139658842, "loss": 2.4654, "step": 16351 }, { "epoch": 0.44, "learning_rate": 0.0012423178697269334, "loss": 2.2827, "step": 16352 }, { "epoch": 0.44, "learning_rate": 0.0012422334236522259, "loss": 2.3985, "step": 16353 }, { "epoch": 0.44, "learning_rate": 0.0012421489757424007, "loss": 2.3765, "step": 16354 }, { "epoch": 0.44, "learning_rate": 0.0012420645259980988, "loss": 2.4356, "step": 16355 }, { "epoch": 0.44, "learning_rate": 0.0012419800744199593, "loss": 2.6274, "step": 16356 }, { "epoch": 0.44, "learning_rate": 0.0012418956210086217, "loss": 2.6714, "step": 16357 }, { "epoch": 0.44, "learning_rate": 0.0012418111657647262, "loss": 2.681, "step": 16358 }, { "epoch": 0.44, "learning_rate": 0.0012417267086889125, "loss": 2.5306, "step": 16359 }, { "epoch": 0.44, "learning_rate": 0.0012416422497818207, "loss": 2.8167, "step": 16360 }, { "epoch": 0.44, "learning_rate": 0.0012415577890440904, "loss": 2.5783, "step": 16361 }, { "epoch": 0.44, "learning_rate": 0.0012414733264763612, "loss": 2.4618, "step": 16362 }, { "epoch": 0.44, "learning_rate": 0.0012413888620792736, "loss": 2.6345, "step": 16363 }, { "epoch": 0.44, "learning_rate": 0.0012413043958534667, "loss": 2.4996, "step": 16364 }, { "epoch": 0.44, "learning_rate": 0.0012412199277995813, "loss": 2.4096, "step": 16365 }, { "epoch": 0.44, "learning_rate": 0.0012411354579182565, "loss": 2.375, "step": 16366 }, { "epoch": 0.44, "learning_rate": 0.0012410509862101327, "loss": 2.2967, "step": 16367 }, { "epoch": 0.44, "learning_rate": 0.0012409665126758497, "loss": 2.3111, "step": 16368 }, { "epoch": 0.44, "learning_rate": 0.0012408820373160476, "loss": 2.5574, "step": 16369 }, { "epoch": 0.44, "learning_rate": 0.001240797560131366, "loss": 2.4358, "step": 16370 }, { "epoch": 0.44, "learning_rate": 0.0012407130811224454, "loss": 2.4766, "step": 16371 }, { "epoch": 0.44, "learning_rate": 0.0012406286002899255, "loss": 2.5313, "step": 16372 }, { "epoch": 0.44, "learning_rate": 0.0012405441176344466, "loss": 2.3797, "step": 16373 }, { "epoch": 0.44, "learning_rate": 0.0012404596331566477, "loss": 2.3832, "step": 16374 }, { "epoch": 0.44, "learning_rate": 0.0012403751468571702, "loss": 2.3535, "step": 16375 }, { "epoch": 0.44, "learning_rate": 0.0012402906587366536, "loss": 2.6212, "step": 16376 }, { "epoch": 0.44, "learning_rate": 0.0012402061687957376, "loss": 2.6801, "step": 16377 }, { "epoch": 0.44, "learning_rate": 0.0012401216770350628, "loss": 2.5986, "step": 16378 }, { "epoch": 0.44, "learning_rate": 0.001240037183455269, "loss": 2.7855, "step": 16379 }, { "epoch": 0.44, "learning_rate": 0.0012399526880569965, "loss": 2.8361, "step": 16380 }, { "epoch": 0.44, "learning_rate": 0.0012398681908408853, "loss": 2.7774, "step": 16381 }, { "epoch": 0.44, "learning_rate": 0.0012397836918075756, "loss": 2.2029, "step": 16382 }, { "epoch": 0.44, "learning_rate": 0.0012396991909577077, "loss": 2.2799, "step": 16383 }, { "epoch": 0.44, "learning_rate": 0.0012396146882919213, "loss": 2.4544, "step": 16384 }, { "epoch": 0.44, "learning_rate": 0.0012395301838108567, "loss": 2.5194, "step": 16385 }, { "epoch": 0.44, "learning_rate": 0.0012394456775151547, "loss": 2.9563, "step": 16386 }, { "epoch": 0.44, "learning_rate": 0.0012393611694054547, "loss": 2.9221, "step": 16387 }, { "epoch": 0.44, "learning_rate": 0.0012392766594823976, "loss": 2.3976, "step": 16388 }, { "epoch": 0.44, "learning_rate": 0.001239192147746623, "loss": 2.3782, "step": 16389 }, { "epoch": 0.44, "learning_rate": 0.001239107634198772, "loss": 2.3665, "step": 16390 }, { "epoch": 0.44, "learning_rate": 0.0012390231188394835, "loss": 2.1577, "step": 16391 }, { "epoch": 0.44, "learning_rate": 0.0012389386016693994, "loss": 2.5461, "step": 16392 }, { "epoch": 0.44, "learning_rate": 0.0012388540826891586, "loss": 2.8454, "step": 16393 }, { "epoch": 0.44, "learning_rate": 0.001238769561899402, "loss": 3.0544, "step": 16394 }, { "epoch": 0.44, "learning_rate": 0.00123868503930077, "loss": 2.0169, "step": 16395 }, { "epoch": 0.44, "learning_rate": 0.001238600514893903, "loss": 2.508, "step": 16396 }, { "epoch": 0.44, "learning_rate": 0.0012385159886794408, "loss": 2.5972, "step": 16397 }, { "epoch": 0.44, "learning_rate": 0.0012384314606580244, "loss": 2.0829, "step": 16398 }, { "epoch": 0.44, "learning_rate": 0.001238346930830294, "loss": 2.6937, "step": 16399 }, { "epoch": 0.44, "learning_rate": 0.0012382623991968895, "loss": 2.5798, "step": 16400 }, { "epoch": 0.44, "learning_rate": 0.0012381778657584517, "loss": 2.2634, "step": 16401 }, { "epoch": 0.44, "learning_rate": 0.0012380933305156212, "loss": 2.784, "step": 16402 }, { "epoch": 0.44, "learning_rate": 0.0012380087934690384, "loss": 2.4302, "step": 16403 }, { "epoch": 0.44, "learning_rate": 0.001237924254619343, "loss": 2.5194, "step": 16404 }, { "epoch": 0.44, "learning_rate": 0.001237839713967176, "loss": 2.4717, "step": 16405 }, { "epoch": 0.44, "learning_rate": 0.0012377551715131783, "loss": 1.9771, "step": 16406 }, { "epoch": 0.44, "learning_rate": 0.0012376706272579894, "loss": 2.4633, "step": 16407 }, { "epoch": 0.44, "learning_rate": 0.0012375860812022508, "loss": 2.7209, "step": 16408 }, { "epoch": 0.44, "learning_rate": 0.0012375015333466021, "loss": 2.6047, "step": 16409 }, { "epoch": 0.44, "learning_rate": 0.0012374169836916844, "loss": 2.6859, "step": 16410 }, { "epoch": 0.44, "learning_rate": 0.0012373324322381384, "loss": 2.447, "step": 16411 }, { "epoch": 0.44, "learning_rate": 0.001237247878986604, "loss": 2.0279, "step": 16412 }, { "epoch": 0.44, "learning_rate": 0.0012371633239377222, "loss": 2.7951, "step": 16413 }, { "epoch": 0.44, "learning_rate": 0.0012370787670921333, "loss": 2.288, "step": 16414 }, { "epoch": 0.44, "learning_rate": 0.0012369942084504784, "loss": 2.433, "step": 16415 }, { "epoch": 0.44, "learning_rate": 0.0012369096480133973, "loss": 2.8488, "step": 16416 }, { "epoch": 0.44, "learning_rate": 0.0012368250857815312, "loss": 2.5062, "step": 16417 }, { "epoch": 0.44, "learning_rate": 0.0012367405217555208, "loss": 2.813, "step": 16418 }, { "epoch": 0.44, "learning_rate": 0.0012366559559360065, "loss": 3.0483, "step": 16419 }, { "epoch": 0.44, "learning_rate": 0.0012365713883236286, "loss": 2.6567, "step": 16420 }, { "epoch": 0.44, "learning_rate": 0.0012364868189190285, "loss": 2.5221, "step": 16421 }, { "epoch": 0.44, "learning_rate": 0.0012364022477228465, "loss": 2.3962, "step": 16422 }, { "epoch": 0.44, "learning_rate": 0.0012363176747357233, "loss": 3.1225, "step": 16423 }, { "epoch": 0.44, "learning_rate": 0.0012362330999582997, "loss": 2.7279, "step": 16424 }, { "epoch": 0.44, "learning_rate": 0.0012361485233912163, "loss": 2.9424, "step": 16425 }, { "epoch": 0.44, "learning_rate": 0.001236063945035114, "loss": 2.2218, "step": 16426 }, { "epoch": 0.44, "learning_rate": 0.0012359793648906332, "loss": 2.5541, "step": 16427 }, { "epoch": 0.44, "learning_rate": 0.001235894782958415, "loss": 2.8048, "step": 16428 }, { "epoch": 0.44, "learning_rate": 0.0012358101992391004, "loss": 2.8384, "step": 16429 }, { "epoch": 0.44, "learning_rate": 0.0012357256137333298, "loss": 2.3584, "step": 16430 }, { "epoch": 0.44, "learning_rate": 0.001235641026441744, "loss": 2.7925, "step": 16431 }, { "epoch": 0.44, "learning_rate": 0.0012355564373649837, "loss": 2.9176, "step": 16432 }, { "epoch": 0.44, "learning_rate": 0.00123547184650369, "loss": 3.1568, "step": 16433 }, { "epoch": 0.44, "learning_rate": 0.001235387253858504, "loss": 2.6012, "step": 16434 }, { "epoch": 0.44, "learning_rate": 0.0012353026594300663, "loss": 2.5326, "step": 16435 }, { "epoch": 0.44, "learning_rate": 0.0012352180632190172, "loss": 2.766, "step": 16436 }, { "epoch": 0.44, "learning_rate": 0.0012351334652259984, "loss": 2.2906, "step": 16437 }, { "epoch": 0.44, "learning_rate": 0.0012350488654516508, "loss": 2.8807, "step": 16438 }, { "epoch": 0.44, "learning_rate": 0.0012349642638966147, "loss": 2.3842, "step": 16439 }, { "epoch": 0.44, "learning_rate": 0.0012348796605615312, "loss": 2.3779, "step": 16440 }, { "epoch": 0.44, "learning_rate": 0.0012347950554470418, "loss": 2.7185, "step": 16441 }, { "epoch": 0.44, "learning_rate": 0.0012347104485537868, "loss": 2.774, "step": 16442 }, { "epoch": 0.44, "learning_rate": 0.0012346258398824074, "loss": 2.698, "step": 16443 }, { "epoch": 0.44, "learning_rate": 0.0012345412294335442, "loss": 2.5145, "step": 16444 }, { "epoch": 0.44, "learning_rate": 0.0012344566172078394, "loss": 2.6233, "step": 16445 }, { "epoch": 0.44, "learning_rate": 0.0012343720032059326, "loss": 2.567, "step": 16446 }, { "epoch": 0.44, "learning_rate": 0.0012342873874284655, "loss": 2.4566, "step": 16447 }, { "epoch": 0.44, "learning_rate": 0.0012342027698760791, "loss": 2.4903, "step": 16448 }, { "epoch": 0.44, "learning_rate": 0.0012341181505494143, "loss": 2.7057, "step": 16449 }, { "epoch": 0.44, "learning_rate": 0.0012340335294491122, "loss": 2.6025, "step": 16450 }, { "epoch": 0.44, "learning_rate": 0.0012339489065758143, "loss": 2.7351, "step": 16451 }, { "epoch": 0.44, "learning_rate": 0.0012338642819301612, "loss": 2.4795, "step": 16452 }, { "epoch": 0.44, "learning_rate": 0.0012337796555127937, "loss": 2.0837, "step": 16453 }, { "epoch": 0.44, "learning_rate": 0.0012336950273243536, "loss": 2.8853, "step": 16454 }, { "epoch": 0.44, "learning_rate": 0.0012336103973654817, "loss": 2.5613, "step": 16455 }, { "epoch": 0.44, "learning_rate": 0.0012335257656368194, "loss": 2.6443, "step": 16456 }, { "epoch": 0.44, "learning_rate": 0.0012334411321390075, "loss": 2.5542, "step": 16457 }, { "epoch": 0.44, "learning_rate": 0.0012333564968726874, "loss": 2.2587, "step": 16458 }, { "epoch": 0.44, "learning_rate": 0.0012332718598385, "loss": 2.8823, "step": 16459 }, { "epoch": 0.44, "learning_rate": 0.0012331872210370866, "loss": 2.6936, "step": 16460 }, { "epoch": 0.44, "learning_rate": 0.001233102580469089, "loss": 1.8259, "step": 16461 }, { "epoch": 0.44, "learning_rate": 0.0012330179381351476, "loss": 2.5608, "step": 16462 }, { "epoch": 0.44, "learning_rate": 0.0012329332940359038, "loss": 2.6273, "step": 16463 }, { "epoch": 0.44, "learning_rate": 0.0012328486481719993, "loss": 2.3576, "step": 16464 }, { "epoch": 0.44, "learning_rate": 0.0012327640005440753, "loss": 2.4194, "step": 16465 }, { "epoch": 0.44, "learning_rate": 0.0012326793511527722, "loss": 2.0988, "step": 16466 }, { "epoch": 0.44, "learning_rate": 0.0012325946999987322, "loss": 2.1178, "step": 16467 }, { "epoch": 0.44, "learning_rate": 0.0012325100470825965, "loss": 2.6891, "step": 16468 }, { "epoch": 0.44, "learning_rate": 0.0012324253924050064, "loss": 2.5111, "step": 16469 }, { "epoch": 0.44, "learning_rate": 0.0012323407359666025, "loss": 2.1648, "step": 16470 }, { "epoch": 0.44, "learning_rate": 0.0012322560777680272, "loss": 2.6634, "step": 16471 }, { "epoch": 0.44, "learning_rate": 0.0012321714178099212, "loss": 2.562, "step": 16472 }, { "epoch": 0.44, "learning_rate": 0.0012320867560929262, "loss": 2.4218, "step": 16473 }, { "epoch": 0.44, "learning_rate": 0.0012320020926176833, "loss": 2.4568, "step": 16474 }, { "epoch": 0.44, "learning_rate": 0.001231917427384834, "loss": 2.5052, "step": 16475 }, { "epoch": 0.44, "learning_rate": 0.0012318327603950197, "loss": 2.7134, "step": 16476 }, { "epoch": 0.44, "learning_rate": 0.0012317480916488818, "loss": 2.5121, "step": 16477 }, { "epoch": 0.44, "learning_rate": 0.0012316634211470621, "loss": 2.8416, "step": 16478 }, { "epoch": 0.44, "learning_rate": 0.0012315787488902015, "loss": 2.8, "step": 16479 }, { "epoch": 0.44, "learning_rate": 0.0012314940748789417, "loss": 3.002, "step": 16480 }, { "epoch": 0.44, "learning_rate": 0.0012314093991139244, "loss": 2.3339, "step": 16481 }, { "epoch": 0.44, "learning_rate": 0.0012313247215957907, "loss": 2.5409, "step": 16482 }, { "epoch": 0.44, "learning_rate": 0.001231240042325182, "loss": 2.3258, "step": 16483 }, { "epoch": 0.44, "learning_rate": 0.0012311553613027404, "loss": 2.4803, "step": 16484 }, { "epoch": 0.44, "learning_rate": 0.0012310706785291072, "loss": 2.6441, "step": 16485 }, { "epoch": 0.44, "learning_rate": 0.0012309859940049237, "loss": 2.3503, "step": 16486 }, { "epoch": 0.44, "learning_rate": 0.0012309013077308314, "loss": 2.5446, "step": 16487 }, { "epoch": 0.44, "learning_rate": 0.0012308166197074724, "loss": 2.3673, "step": 16488 }, { "epoch": 0.44, "learning_rate": 0.0012307319299354879, "loss": 2.8808, "step": 16489 }, { "epoch": 0.44, "learning_rate": 0.0012306472384155192, "loss": 2.3859, "step": 16490 }, { "epoch": 0.44, "learning_rate": 0.0012305625451482088, "loss": 2.4598, "step": 16491 }, { "epoch": 0.44, "learning_rate": 0.0012304778501341976, "loss": 2.5997, "step": 16492 }, { "epoch": 0.44, "learning_rate": 0.0012303931533741272, "loss": 2.2142, "step": 16493 }, { "epoch": 0.44, "learning_rate": 0.0012303084548686396, "loss": 2.6407, "step": 16494 }, { "epoch": 0.44, "learning_rate": 0.0012302237546183764, "loss": 2.8775, "step": 16495 }, { "epoch": 0.44, "learning_rate": 0.0012301390526239788, "loss": 2.3799, "step": 16496 }, { "epoch": 0.44, "learning_rate": 0.0012300543488860895, "loss": 2.4823, "step": 16497 }, { "epoch": 0.44, "learning_rate": 0.0012299696434053492, "loss": 1.9096, "step": 16498 }, { "epoch": 0.44, "learning_rate": 0.0012298849361824, "loss": 2.4398, "step": 16499 }, { "epoch": 0.44, "learning_rate": 0.0012298002272178837, "loss": 2.1671, "step": 16500 }, { "epoch": 0.44, "learning_rate": 0.0012297155165124421, "loss": 2.6549, "step": 16501 }, { "epoch": 0.44, "learning_rate": 0.0012296308040667166, "loss": 2.1889, "step": 16502 }, { "epoch": 0.44, "learning_rate": 0.001229546089881349, "loss": 2.1482, "step": 16503 }, { "epoch": 0.44, "learning_rate": 0.0012294613739569818, "loss": 2.4673, "step": 16504 }, { "epoch": 0.44, "learning_rate": 0.001229376656294256, "loss": 2.8087, "step": 16505 }, { "epoch": 0.44, "learning_rate": 0.0012292919368938134, "loss": 2.466, "step": 16506 }, { "epoch": 0.44, "learning_rate": 0.0012292072157562962, "loss": 2.3352, "step": 16507 }, { "epoch": 0.44, "learning_rate": 0.0012291224928823465, "loss": 2.6399, "step": 16508 }, { "epoch": 0.44, "learning_rate": 0.0012290377682726056, "loss": 2.2093, "step": 16509 }, { "epoch": 0.44, "learning_rate": 0.0012289530419277153, "loss": 2.3005, "step": 16510 }, { "epoch": 0.44, "learning_rate": 0.001228868313848318, "loss": 2.3375, "step": 16511 }, { "epoch": 0.44, "learning_rate": 0.0012287835840350547, "loss": 2.6844, "step": 16512 }, { "epoch": 0.44, "learning_rate": 0.0012286988524885683, "loss": 2.7576, "step": 16513 }, { "epoch": 0.44, "learning_rate": 0.0012286141192095002, "loss": 2.5794, "step": 16514 }, { "epoch": 0.44, "learning_rate": 0.0012285293841984926, "loss": 2.4366, "step": 16515 }, { "epoch": 0.44, "learning_rate": 0.001228444647456187, "loss": 2.8103, "step": 16516 }, { "epoch": 0.44, "learning_rate": 0.0012283599089832255, "loss": 2.3819, "step": 16517 }, { "epoch": 0.44, "learning_rate": 0.0012282751687802504, "loss": 2.4906, "step": 16518 }, { "epoch": 0.44, "learning_rate": 0.0012281904268479033, "loss": 2.1662, "step": 16519 }, { "epoch": 0.44, "learning_rate": 0.0012281056831868265, "loss": 2.7178, "step": 16520 }, { "epoch": 0.44, "learning_rate": 0.0012280209377976616, "loss": 2.5412, "step": 16521 }, { "epoch": 0.44, "learning_rate": 0.0012279361906810508, "loss": 2.3947, "step": 16522 }, { "epoch": 0.44, "learning_rate": 0.0012278514418376362, "loss": 2.423, "step": 16523 }, { "epoch": 0.44, "learning_rate": 0.00122776669126806, "loss": 3.0568, "step": 16524 }, { "epoch": 0.44, "learning_rate": 0.001227681938972964, "loss": 2.413, "step": 16525 }, { "epoch": 0.44, "learning_rate": 0.0012275971849529904, "loss": 2.3741, "step": 16526 }, { "epoch": 0.44, "learning_rate": 0.0012275124292087812, "loss": 2.2251, "step": 16527 }, { "epoch": 0.44, "learning_rate": 0.0012274276717409785, "loss": 2.4576, "step": 16528 }, { "epoch": 0.44, "learning_rate": 0.001227342912550224, "loss": 2.1626, "step": 16529 }, { "epoch": 0.44, "learning_rate": 0.001227258151637161, "loss": 2.7131, "step": 16530 }, { "epoch": 0.44, "learning_rate": 0.0012271733890024303, "loss": 2.6284, "step": 16531 }, { "epoch": 0.44, "learning_rate": 0.0012270886246466748, "loss": 2.5852, "step": 16532 }, { "epoch": 0.44, "learning_rate": 0.0012270038585705362, "loss": 2.2767, "step": 16533 }, { "epoch": 0.44, "learning_rate": 0.0012269190907746575, "loss": 2.4734, "step": 16534 }, { "epoch": 0.44, "learning_rate": 0.00122683432125968, "loss": 2.2552, "step": 16535 }, { "epoch": 0.44, "learning_rate": 0.0012267495500262464, "loss": 2.1111, "step": 16536 }, { "epoch": 0.44, "learning_rate": 0.0012266647770749987, "loss": 2.3018, "step": 16537 }, { "epoch": 0.44, "learning_rate": 0.0012265800024065792, "loss": 2.804, "step": 16538 }, { "epoch": 0.44, "learning_rate": 0.0012264952260216298, "loss": 2.4632, "step": 16539 }, { "epoch": 0.44, "learning_rate": 0.0012264104479207934, "loss": 2.3846, "step": 16540 }, { "epoch": 0.44, "learning_rate": 0.0012263256681047116, "loss": 2.7212, "step": 16541 }, { "epoch": 0.44, "learning_rate": 0.0012262408865740273, "loss": 2.6423, "step": 16542 }, { "epoch": 0.44, "learning_rate": 0.0012261561033293825, "loss": 2.5583, "step": 16543 }, { "epoch": 0.44, "learning_rate": 0.0012260713183714195, "loss": 2.4703, "step": 16544 }, { "epoch": 0.44, "learning_rate": 0.0012259865317007805, "loss": 2.3731, "step": 16545 }, { "epoch": 0.44, "learning_rate": 0.001225901743318108, "loss": 2.3495, "step": 16546 }, { "epoch": 0.44, "learning_rate": 0.0012258169532240442, "loss": 2.5166, "step": 16547 }, { "epoch": 0.44, "learning_rate": 0.0012257321614192317, "loss": 2.3941, "step": 16548 }, { "epoch": 0.44, "learning_rate": 0.0012256473679043123, "loss": 2.5255, "step": 16549 }, { "epoch": 0.44, "learning_rate": 0.001225562572679929, "loss": 2.3559, "step": 16550 }, { "epoch": 0.44, "learning_rate": 0.0012254777757467244, "loss": 2.674, "step": 16551 }, { "epoch": 0.44, "learning_rate": 0.0012253929771053398, "loss": 2.5557, "step": 16552 }, { "epoch": 0.44, "learning_rate": 0.0012253081767564188, "loss": 2.7209, "step": 16553 }, { "epoch": 0.44, "learning_rate": 0.0012252233747006031, "loss": 2.7978, "step": 16554 }, { "epoch": 0.44, "learning_rate": 0.0012251385709385353, "loss": 2.2697, "step": 16555 }, { "epoch": 0.44, "learning_rate": 0.0012250537654708582, "loss": 2.5018, "step": 16556 }, { "epoch": 0.44, "learning_rate": 0.0012249689582982137, "loss": 2.4853, "step": 16557 }, { "epoch": 0.44, "learning_rate": 0.001224884149421245, "loss": 2.2565, "step": 16558 }, { "epoch": 0.45, "learning_rate": 0.0012247993388405938, "loss": 2.8598, "step": 16559 }, { "epoch": 0.45, "learning_rate": 0.0012247145265569031, "loss": 2.5316, "step": 16560 }, { "epoch": 0.45, "learning_rate": 0.0012246297125708154, "loss": 2.4373, "step": 16561 }, { "epoch": 0.45, "learning_rate": 0.0012245448968829732, "loss": 2.7913, "step": 16562 }, { "epoch": 0.45, "learning_rate": 0.0012244600794940191, "loss": 2.5271, "step": 16563 }, { "epoch": 0.45, "learning_rate": 0.0012243752604045952, "loss": 2.3795, "step": 16564 }, { "epoch": 0.45, "learning_rate": 0.0012242904396153446, "loss": 2.3771, "step": 16565 }, { "epoch": 0.45, "learning_rate": 0.0012242056171269098, "loss": 3.0618, "step": 16566 }, { "epoch": 0.45, "learning_rate": 0.0012241207929399333, "loss": 2.5829, "step": 16567 }, { "epoch": 0.45, "learning_rate": 0.0012240359670550578, "loss": 2.8273, "step": 16568 }, { "epoch": 0.45, "learning_rate": 0.0012239511394729256, "loss": 2.1241, "step": 16569 }, { "epoch": 0.45, "learning_rate": 0.0012238663101941801, "loss": 2.7679, "step": 16570 }, { "epoch": 0.45, "learning_rate": 0.0012237814792194633, "loss": 2.3719, "step": 16571 }, { "epoch": 0.45, "learning_rate": 0.0012236966465494178, "loss": 2.3966, "step": 16572 }, { "epoch": 0.45, "learning_rate": 0.0012236118121846866, "loss": 2.2832, "step": 16573 }, { "epoch": 0.45, "learning_rate": 0.0012235269761259123, "loss": 2.0489, "step": 16574 }, { "epoch": 0.45, "learning_rate": 0.0012234421383737375, "loss": 2.2627, "step": 16575 }, { "epoch": 0.45, "learning_rate": 0.001223357298928805, "loss": 2.7302, "step": 16576 }, { "epoch": 0.45, "learning_rate": 0.0012232724577917577, "loss": 2.9896, "step": 16577 }, { "epoch": 0.45, "learning_rate": 0.0012231876149632382, "loss": 2.3328, "step": 16578 }, { "epoch": 0.45, "learning_rate": 0.001223102770443889, "loss": 2.7311, "step": 16579 }, { "epoch": 0.45, "learning_rate": 0.0012230179242343534, "loss": 2.8793, "step": 16580 }, { "epoch": 0.45, "learning_rate": 0.0012229330763352737, "loss": 2.3503, "step": 16581 }, { "epoch": 0.45, "learning_rate": 0.001222848226747293, "loss": 2.5422, "step": 16582 }, { "epoch": 0.45, "learning_rate": 0.001222763375471054, "loss": 3.009, "step": 16583 }, { "epoch": 0.45, "learning_rate": 0.001222678522507199, "loss": 2.4603, "step": 16584 }, { "epoch": 0.45, "learning_rate": 0.0012225936678563717, "loss": 2.6973, "step": 16585 }, { "epoch": 0.45, "learning_rate": 0.0012225088115192146, "loss": 2.6706, "step": 16586 }, { "epoch": 0.45, "learning_rate": 0.0012224239534963707, "loss": 2.5262, "step": 16587 }, { "epoch": 0.45, "learning_rate": 0.0012223390937884822, "loss": 2.6266, "step": 16588 }, { "epoch": 0.45, "learning_rate": 0.0012222542323961927, "loss": 2.846, "step": 16589 }, { "epoch": 0.45, "learning_rate": 0.001222169369320145, "loss": 2.5261, "step": 16590 }, { "epoch": 0.45, "learning_rate": 0.0012220845045609816, "loss": 2.3645, "step": 16591 }, { "epoch": 0.45, "learning_rate": 0.0012219996381193459, "loss": 2.5826, "step": 16592 }, { "epoch": 0.45, "learning_rate": 0.0012219147699958808, "loss": 2.5845, "step": 16593 }, { "epoch": 0.45, "learning_rate": 0.0012218299001912289, "loss": 2.4784, "step": 16594 }, { "epoch": 0.45, "learning_rate": 0.0012217450287060332, "loss": 2.4115, "step": 16595 }, { "epoch": 0.45, "learning_rate": 0.001221660155540937, "loss": 2.4094, "step": 16596 }, { "epoch": 0.45, "learning_rate": 0.0012215752806965829, "loss": 2.5045, "step": 16597 }, { "epoch": 0.45, "learning_rate": 0.0012214904041736143, "loss": 2.7688, "step": 16598 }, { "epoch": 0.45, "learning_rate": 0.0012214055259726737, "loss": 2.2951, "step": 16599 }, { "epoch": 0.45, "learning_rate": 0.0012213206460944049, "loss": 2.2958, "step": 16600 }, { "epoch": 0.45, "learning_rate": 0.0012212357645394504, "loss": 2.1393, "step": 16601 }, { "epoch": 0.45, "learning_rate": 0.001221150881308453, "loss": 2.6625, "step": 16602 }, { "epoch": 0.45, "learning_rate": 0.0012210659964020558, "loss": 2.6327, "step": 16603 }, { "epoch": 0.45, "learning_rate": 0.0012209811098209027, "loss": 2.7809, "step": 16604 }, { "epoch": 0.45, "learning_rate": 0.0012208962215656358, "loss": 2.9494, "step": 16605 }, { "epoch": 0.45, "learning_rate": 0.0012208113316368992, "loss": 2.5612, "step": 16606 }, { "epoch": 0.45, "learning_rate": 0.0012207264400353349, "loss": 2.4652, "step": 16607 }, { "epoch": 0.45, "learning_rate": 0.0012206415467615865, "loss": 2.5684, "step": 16608 }, { "epoch": 0.45, "learning_rate": 0.0012205566518162976, "loss": 2.5641, "step": 16609 }, { "epoch": 0.45, "learning_rate": 0.0012204717552001109, "loss": 2.6353, "step": 16610 }, { "epoch": 0.45, "learning_rate": 0.001220386856913669, "loss": 2.7164, "step": 16611 }, { "epoch": 0.45, "learning_rate": 0.001220301956957616, "loss": 3.0818, "step": 16612 }, { "epoch": 0.45, "learning_rate": 0.001220217055332595, "loss": 2.2839, "step": 16613 }, { "epoch": 0.45, "learning_rate": 0.001220132152039249, "loss": 2.5453, "step": 16614 }, { "epoch": 0.45, "learning_rate": 0.0012200472470782207, "loss": 2.8862, "step": 16615 }, { "epoch": 0.45, "learning_rate": 0.0012199623404501544, "loss": 2.3828, "step": 16616 }, { "epoch": 0.45, "learning_rate": 0.0012198774321556924, "loss": 2.6007, "step": 16617 }, { "epoch": 0.45, "learning_rate": 0.0012197925221954782, "loss": 2.655, "step": 16618 }, { "epoch": 0.45, "learning_rate": 0.0012197076105701552, "loss": 2.5381, "step": 16619 }, { "epoch": 0.45, "learning_rate": 0.0012196226972803668, "loss": 2.5582, "step": 16620 }, { "epoch": 0.45, "learning_rate": 0.001219537782326756, "loss": 2.5417, "step": 16621 }, { "epoch": 0.45, "learning_rate": 0.0012194528657099662, "loss": 2.0095, "step": 16622 }, { "epoch": 0.45, "learning_rate": 0.0012193679474306407, "loss": 2.8542, "step": 16623 }, { "epoch": 0.45, "learning_rate": 0.0012192830274894229, "loss": 2.4394, "step": 16624 }, { "epoch": 0.45, "learning_rate": 0.0012191981058869562, "loss": 2.6548, "step": 16625 }, { "epoch": 0.45, "learning_rate": 0.0012191131826238836, "loss": 2.5021, "step": 16626 }, { "epoch": 0.45, "learning_rate": 0.0012190282577008488, "loss": 2.1378, "step": 16627 }, { "epoch": 0.45, "learning_rate": 0.001218943331118495, "loss": 2.4942, "step": 16628 }, { "epoch": 0.45, "learning_rate": 0.001218858402877466, "loss": 3.0848, "step": 16629 }, { "epoch": 0.45, "learning_rate": 0.0012187734729784045, "loss": 2.9079, "step": 16630 }, { "epoch": 0.45, "learning_rate": 0.0012186885414219545, "loss": 2.3754, "step": 16631 }, { "epoch": 0.45, "learning_rate": 0.001218603608208759, "loss": 2.4761, "step": 16632 }, { "epoch": 0.45, "learning_rate": 0.0012185186733394617, "loss": 2.8041, "step": 16633 }, { "epoch": 0.45, "learning_rate": 0.001218433736814706, "loss": 2.2587, "step": 16634 }, { "epoch": 0.45, "learning_rate": 0.0012183487986351352, "loss": 2.5815, "step": 16635 }, { "epoch": 0.45, "learning_rate": 0.0012182638588013933, "loss": 2.978, "step": 16636 }, { "epoch": 0.45, "learning_rate": 0.0012181789173141234, "loss": 2.316, "step": 16637 }, { "epoch": 0.45, "learning_rate": 0.0012180939741739687, "loss": 2.5569, "step": 16638 }, { "epoch": 0.45, "learning_rate": 0.0012180090293815733, "loss": 2.6599, "step": 16639 }, { "epoch": 0.45, "learning_rate": 0.0012179240829375806, "loss": 2.5234, "step": 16640 }, { "epoch": 0.45, "learning_rate": 0.0012178391348426337, "loss": 2.2063, "step": 16641 }, { "epoch": 0.45, "learning_rate": 0.0012177541850973764, "loss": 2.6606, "step": 16642 }, { "epoch": 0.45, "learning_rate": 0.0012176692337024526, "loss": 2.4145, "step": 16643 }, { "epoch": 0.45, "learning_rate": 0.0012175842806585058, "loss": 2.3675, "step": 16644 }, { "epoch": 0.45, "learning_rate": 0.0012174993259661789, "loss": 2.677, "step": 16645 }, { "epoch": 0.45, "learning_rate": 0.0012174143696261162, "loss": 2.6105, "step": 16646 }, { "epoch": 0.45, "learning_rate": 0.001217329411638961, "loss": 2.7072, "step": 16647 }, { "epoch": 0.45, "learning_rate": 0.0012172444520053571, "loss": 2.5011, "step": 16648 }, { "epoch": 0.45, "learning_rate": 0.0012171594907259482, "loss": 2.7363, "step": 16649 }, { "epoch": 0.45, "learning_rate": 0.0012170745278013778, "loss": 2.7338, "step": 16650 }, { "epoch": 0.45, "learning_rate": 0.0012169895632322893, "loss": 2.4072, "step": 16651 }, { "epoch": 0.45, "learning_rate": 0.0012169045970193272, "loss": 2.482, "step": 16652 }, { "epoch": 0.45, "learning_rate": 0.0012168196291631344, "loss": 2.6542, "step": 16653 }, { "epoch": 0.45, "learning_rate": 0.0012167346596643545, "loss": 2.192, "step": 16654 }, { "epoch": 0.45, "learning_rate": 0.0012166496885236318, "loss": 2.6175, "step": 16655 }, { "epoch": 0.45, "learning_rate": 0.00121656471574161, "loss": 1.7129, "step": 16656 }, { "epoch": 0.45, "learning_rate": 0.0012164797413189326, "loss": 2.4775, "step": 16657 }, { "epoch": 0.45, "learning_rate": 0.0012163947652562431, "loss": 2.7313, "step": 16658 }, { "epoch": 0.45, "learning_rate": 0.0012163097875541858, "loss": 2.8703, "step": 16659 }, { "epoch": 0.45, "learning_rate": 0.001216224808213404, "loss": 2.7133, "step": 16660 }, { "epoch": 0.45, "learning_rate": 0.001216139827234542, "loss": 2.5268, "step": 16661 }, { "epoch": 0.45, "learning_rate": 0.0012160548446182428, "loss": 2.6829, "step": 16662 }, { "epoch": 0.45, "learning_rate": 0.0012159698603651512, "loss": 3.2443, "step": 16663 }, { "epoch": 0.45, "learning_rate": 0.0012158848744759103, "loss": 2.7774, "step": 16664 }, { "epoch": 0.45, "learning_rate": 0.0012157998869511647, "loss": 2.6384, "step": 16665 }, { "epoch": 0.45, "learning_rate": 0.0012157148977915571, "loss": 2.4791, "step": 16666 }, { "epoch": 0.45, "learning_rate": 0.0012156299069977323, "loss": 2.4759, "step": 16667 }, { "epoch": 0.45, "learning_rate": 0.0012155449145703336, "loss": 2.6249, "step": 16668 }, { "epoch": 0.45, "learning_rate": 0.0012154599205100056, "loss": 2.7717, "step": 16669 }, { "epoch": 0.45, "learning_rate": 0.0012153749248173915, "loss": 2.3968, "step": 16670 }, { "epoch": 0.45, "learning_rate": 0.0012152899274931355, "loss": 2.3424, "step": 16671 }, { "epoch": 0.45, "learning_rate": 0.0012152049285378817, "loss": 2.5297, "step": 16672 }, { "epoch": 0.45, "learning_rate": 0.0012151199279522736, "loss": 2.6836, "step": 16673 }, { "epoch": 0.45, "learning_rate": 0.0012150349257369552, "loss": 2.4141, "step": 16674 }, { "epoch": 0.45, "learning_rate": 0.001214949921892571, "loss": 2.7889, "step": 16675 }, { "epoch": 0.45, "learning_rate": 0.0012148649164197647, "loss": 2.6073, "step": 16676 }, { "epoch": 0.45, "learning_rate": 0.0012147799093191799, "loss": 2.7072, "step": 16677 }, { "epoch": 0.45, "learning_rate": 0.0012146949005914609, "loss": 2.4989, "step": 16678 }, { "epoch": 0.45, "learning_rate": 0.001214609890237252, "loss": 2.6133, "step": 16679 }, { "epoch": 0.45, "learning_rate": 0.001214524878257197, "loss": 2.5606, "step": 16680 }, { "epoch": 0.45, "learning_rate": 0.0012144398646519391, "loss": 2.5062, "step": 16681 }, { "epoch": 0.45, "learning_rate": 0.001214354849422124, "loss": 2.5241, "step": 16682 }, { "epoch": 0.45, "learning_rate": 0.0012142698325683945, "loss": 2.0682, "step": 16683 }, { "epoch": 0.45, "learning_rate": 0.001214184814091395, "loss": 2.7078, "step": 16684 }, { "epoch": 0.45, "learning_rate": 0.0012140997939917696, "loss": 2.2713, "step": 16685 }, { "epoch": 0.45, "learning_rate": 0.001214014772270163, "loss": 2.7185, "step": 16686 }, { "epoch": 0.45, "learning_rate": 0.0012139297489272183, "loss": 2.6902, "step": 16687 }, { "epoch": 0.45, "learning_rate": 0.0012138447239635802, "loss": 2.5756, "step": 16688 }, { "epoch": 0.45, "learning_rate": 0.0012137596973798926, "loss": 2.6349, "step": 16689 }, { "epoch": 0.45, "learning_rate": 0.0012136746691767998, "loss": 2.5697, "step": 16690 }, { "epoch": 0.45, "learning_rate": 0.0012135896393549457, "loss": 2.6543, "step": 16691 }, { "epoch": 0.45, "learning_rate": 0.0012135046079149749, "loss": 2.3445, "step": 16692 }, { "epoch": 0.45, "learning_rate": 0.0012134195748575315, "loss": 2.7319, "step": 16693 }, { "epoch": 0.45, "learning_rate": 0.0012133345401832592, "loss": 2.4689, "step": 16694 }, { "epoch": 0.45, "learning_rate": 0.001213249503892803, "loss": 2.7517, "step": 16695 }, { "epoch": 0.45, "learning_rate": 0.0012131644659868065, "loss": 2.5959, "step": 16696 }, { "epoch": 0.45, "learning_rate": 0.0012130794264659137, "loss": 2.3189, "step": 16697 }, { "epoch": 0.45, "learning_rate": 0.0012129943853307697, "loss": 2.4822, "step": 16698 }, { "epoch": 0.45, "learning_rate": 0.0012129093425820182, "loss": 2.2413, "step": 16699 }, { "epoch": 0.45, "learning_rate": 0.0012128242982203034, "loss": 2.2573, "step": 16700 }, { "epoch": 0.45, "learning_rate": 0.0012127392522462699, "loss": 2.4299, "step": 16701 }, { "epoch": 0.45, "learning_rate": 0.0012126542046605622, "loss": 2.7614, "step": 16702 }, { "epoch": 0.45, "learning_rate": 0.001212569155463824, "loss": 2.3051, "step": 16703 }, { "epoch": 0.45, "learning_rate": 0.0012124841046567, "loss": 2.352, "step": 16704 }, { "epoch": 0.45, "learning_rate": 0.001212399052239834, "loss": 2.5758, "step": 16705 }, { "epoch": 0.45, "learning_rate": 0.0012123139982138712, "loss": 2.7555, "step": 16706 }, { "epoch": 0.45, "learning_rate": 0.0012122289425794553, "loss": 2.6118, "step": 16707 }, { "epoch": 0.45, "learning_rate": 0.0012121438853372308, "loss": 2.595, "step": 16708 }, { "epoch": 0.45, "learning_rate": 0.0012120588264878424, "loss": 2.6927, "step": 16709 }, { "epoch": 0.45, "learning_rate": 0.0012119737660319342, "loss": 2.4594, "step": 16710 }, { "epoch": 0.45, "learning_rate": 0.0012118887039701506, "loss": 2.386, "step": 16711 }, { "epoch": 0.45, "learning_rate": 0.0012118036403031358, "loss": 2.6483, "step": 16712 }, { "epoch": 0.45, "learning_rate": 0.0012117185750315346, "loss": 2.1966, "step": 16713 }, { "epoch": 0.45, "learning_rate": 0.0012116335081559914, "loss": 2.4829, "step": 16714 }, { "epoch": 0.45, "learning_rate": 0.0012115484396771508, "loss": 2.3543, "step": 16715 }, { "epoch": 0.45, "learning_rate": 0.001211463369595657, "loss": 2.8598, "step": 16716 }, { "epoch": 0.45, "learning_rate": 0.001211378297912154, "loss": 2.7154, "step": 16717 }, { "epoch": 0.45, "learning_rate": 0.0012112932246272875, "loss": 2.5466, "step": 16718 }, { "epoch": 0.45, "learning_rate": 0.001211208149741701, "loss": 2.0834, "step": 16719 }, { "epoch": 0.45, "learning_rate": 0.0012111230732560392, "loss": 2.5482, "step": 16720 }, { "epoch": 0.45, "learning_rate": 0.0012110379951709466, "loss": 2.5436, "step": 16721 }, { "epoch": 0.45, "learning_rate": 0.0012109529154870685, "loss": 2.2217, "step": 16722 }, { "epoch": 0.45, "learning_rate": 0.0012108678342050486, "loss": 2.4653, "step": 16723 }, { "epoch": 0.45, "learning_rate": 0.0012107827513255312, "loss": 2.5551, "step": 16724 }, { "epoch": 0.45, "learning_rate": 0.0012106976668491618, "loss": 3.0445, "step": 16725 }, { "epoch": 0.45, "learning_rate": 0.0012106125807765846, "loss": 2.2259, "step": 16726 }, { "epoch": 0.45, "learning_rate": 0.0012105274931084437, "loss": 2.8734, "step": 16727 }, { "epoch": 0.45, "learning_rate": 0.0012104424038453846, "loss": 2.3735, "step": 16728 }, { "epoch": 0.45, "learning_rate": 0.0012103573129880515, "loss": 2.8045, "step": 16729 }, { "epoch": 0.45, "learning_rate": 0.0012102722205370887, "loss": 2.4352, "step": 16730 }, { "epoch": 0.45, "learning_rate": 0.0012101871264931412, "loss": 2.6629, "step": 16731 }, { "epoch": 0.45, "learning_rate": 0.0012101020308568535, "loss": 2.6234, "step": 16732 }, { "epoch": 0.45, "learning_rate": 0.0012100169336288708, "loss": 2.864, "step": 16733 }, { "epoch": 0.45, "learning_rate": 0.001209931834809837, "loss": 2.5459, "step": 16734 }, { "epoch": 0.45, "learning_rate": 0.0012098467344003974, "loss": 2.4876, "step": 16735 }, { "epoch": 0.45, "learning_rate": 0.0012097616324011962, "loss": 2.6768, "step": 16736 }, { "epoch": 0.45, "learning_rate": 0.0012096765288128783, "loss": 2.5283, "step": 16737 }, { "epoch": 0.45, "learning_rate": 0.001209591423636089, "loss": 2.7577, "step": 16738 }, { "epoch": 0.45, "learning_rate": 0.0012095063168714724, "loss": 2.2449, "step": 16739 }, { "epoch": 0.45, "learning_rate": 0.001209421208519673, "loss": 2.8836, "step": 16740 }, { "epoch": 0.45, "learning_rate": 0.0012093360985813361, "loss": 2.6701, "step": 16741 }, { "epoch": 0.45, "learning_rate": 0.0012092509870571067, "loss": 2.3444, "step": 16742 }, { "epoch": 0.45, "learning_rate": 0.0012091658739476288, "loss": 2.4082, "step": 16743 }, { "epoch": 0.45, "learning_rate": 0.0012090807592535478, "loss": 3.059, "step": 16744 }, { "epoch": 0.45, "learning_rate": 0.0012089956429755084, "loss": 3.1493, "step": 16745 }, { "epoch": 0.45, "learning_rate": 0.0012089105251141554, "loss": 2.1981, "step": 16746 }, { "epoch": 0.45, "learning_rate": 0.0012088254056701333, "loss": 2.6243, "step": 16747 }, { "epoch": 0.45, "learning_rate": 0.0012087402846440878, "loss": 2.5982, "step": 16748 }, { "epoch": 0.45, "learning_rate": 0.001208655162036663, "loss": 2.1615, "step": 16749 }, { "epoch": 0.45, "learning_rate": 0.0012085700378485038, "loss": 2.8175, "step": 16750 }, { "epoch": 0.45, "learning_rate": 0.0012084849120802552, "loss": 2.5349, "step": 16751 }, { "epoch": 0.45, "learning_rate": 0.0012083997847325628, "loss": 2.7031, "step": 16752 }, { "epoch": 0.45, "learning_rate": 0.0012083146558060703, "loss": 2.4856, "step": 16753 }, { "epoch": 0.45, "learning_rate": 0.0012082295253014236, "loss": 2.5069, "step": 16754 }, { "epoch": 0.45, "learning_rate": 0.0012081443932192668, "loss": 2.8685, "step": 16755 }, { "epoch": 0.45, "learning_rate": 0.0012080592595602457, "loss": 2.63, "step": 16756 }, { "epoch": 0.45, "learning_rate": 0.0012079741243250046, "loss": 2.4438, "step": 16757 }, { "epoch": 0.45, "learning_rate": 0.0012078889875141888, "loss": 3.0838, "step": 16758 }, { "epoch": 0.45, "learning_rate": 0.001207803849128443, "loss": 2.6074, "step": 16759 }, { "epoch": 0.45, "learning_rate": 0.0012077187091684126, "loss": 2.629, "step": 16760 }, { "epoch": 0.45, "learning_rate": 0.0012076335676347424, "loss": 2.6192, "step": 16761 }, { "epoch": 0.45, "learning_rate": 0.0012075484245280778, "loss": 2.6382, "step": 16762 }, { "epoch": 0.45, "learning_rate": 0.0012074632798490627, "loss": 2.5774, "step": 16763 }, { "epoch": 0.45, "learning_rate": 0.0012073781335983432, "loss": 2.0892, "step": 16764 }, { "epoch": 0.45, "learning_rate": 0.0012072929857765641, "loss": 2.1603, "step": 16765 }, { "epoch": 0.45, "learning_rate": 0.0012072078363843705, "loss": 2.5316, "step": 16766 }, { "epoch": 0.45, "learning_rate": 0.001207122685422407, "loss": 2.5678, "step": 16767 }, { "epoch": 0.45, "learning_rate": 0.0012070375328913194, "loss": 2.4392, "step": 16768 }, { "epoch": 0.45, "learning_rate": 0.0012069523787917524, "loss": 2.6937, "step": 16769 }, { "epoch": 0.45, "learning_rate": 0.0012068672231243512, "loss": 2.5545, "step": 16770 }, { "epoch": 0.45, "learning_rate": 0.0012067820658897607, "loss": 2.5189, "step": 16771 }, { "epoch": 0.45, "learning_rate": 0.0012066969070886264, "loss": 2.1335, "step": 16772 }, { "epoch": 0.45, "learning_rate": 0.0012066117467215932, "loss": 2.9932, "step": 16773 }, { "epoch": 0.45, "learning_rate": 0.0012065265847893065, "loss": 2.5853, "step": 16774 }, { "epoch": 0.45, "learning_rate": 0.001206441421292411, "loss": 2.6725, "step": 16775 }, { "epoch": 0.45, "learning_rate": 0.0012063562562315527, "loss": 2.7716, "step": 16776 }, { "epoch": 0.45, "learning_rate": 0.0012062710896073759, "loss": 2.4873, "step": 16777 }, { "epoch": 0.45, "learning_rate": 0.0012061859214205265, "loss": 2.7106, "step": 16778 }, { "epoch": 0.45, "learning_rate": 0.001206100751671649, "loss": 2.8113, "step": 16779 }, { "epoch": 0.45, "learning_rate": 0.0012060155803613893, "loss": 2.4529, "step": 16780 }, { "epoch": 0.45, "learning_rate": 0.0012059304074903926, "loss": 2.3653, "step": 16781 }, { "epoch": 0.45, "learning_rate": 0.001205845233059304, "loss": 2.681, "step": 16782 }, { "epoch": 0.45, "learning_rate": 0.0012057600570687678, "loss": 2.7131, "step": 16783 }, { "epoch": 0.45, "learning_rate": 0.0012056748795194311, "loss": 2.6282, "step": 16784 }, { "epoch": 0.45, "learning_rate": 0.0012055897004119383, "loss": 2.4085, "step": 16785 }, { "epoch": 0.45, "learning_rate": 0.0012055045197469343, "loss": 2.2578, "step": 16786 }, { "epoch": 0.45, "learning_rate": 0.0012054193375250649, "loss": 2.9423, "step": 16787 }, { "epoch": 0.45, "learning_rate": 0.0012053341537469754, "loss": 2.5115, "step": 16788 }, { "epoch": 0.45, "learning_rate": 0.001205248968413311, "loss": 2.6646, "step": 16789 }, { "epoch": 0.45, "learning_rate": 0.0012051637815247169, "loss": 2.2282, "step": 16790 }, { "epoch": 0.45, "learning_rate": 0.0012050785930818391, "loss": 2.216, "step": 16791 }, { "epoch": 0.45, "learning_rate": 0.0012049934030853224, "loss": 2.4758, "step": 16792 }, { "epoch": 0.45, "learning_rate": 0.001204908211535812, "loss": 2.9947, "step": 16793 }, { "epoch": 0.45, "learning_rate": 0.0012048230184339538, "loss": 2.585, "step": 16794 }, { "epoch": 0.45, "learning_rate": 0.0012047378237803935, "loss": 2.3289, "step": 16795 }, { "epoch": 0.45, "learning_rate": 0.0012046526275757755, "loss": 2.515, "step": 16796 }, { "epoch": 0.45, "learning_rate": 0.001204567429820746, "loss": 2.3815, "step": 16797 }, { "epoch": 0.45, "learning_rate": 0.0012044822305159499, "loss": 2.535, "step": 16798 }, { "epoch": 0.45, "learning_rate": 0.0012043970296620335, "loss": 2.5729, "step": 16799 }, { "epoch": 0.45, "learning_rate": 0.0012043118272596414, "loss": 2.9728, "step": 16800 }, { "epoch": 0.45, "learning_rate": 0.0012042266233094198, "loss": 2.513, "step": 16801 }, { "epoch": 0.45, "learning_rate": 0.0012041414178120134, "loss": 3.0605, "step": 16802 }, { "epoch": 0.45, "learning_rate": 0.0012040562107680682, "loss": 3.2657, "step": 16803 }, { "epoch": 0.45, "learning_rate": 0.0012039710021782297, "loss": 2.5395, "step": 16804 }, { "epoch": 0.45, "learning_rate": 0.0012038857920431433, "loss": 2.4773, "step": 16805 }, { "epoch": 0.45, "learning_rate": 0.0012038005803634547, "loss": 2.7269, "step": 16806 }, { "epoch": 0.45, "learning_rate": 0.0012037153671398092, "loss": 2.6526, "step": 16807 }, { "epoch": 0.45, "learning_rate": 0.0012036301523728526, "loss": 2.1766, "step": 16808 }, { "epoch": 0.45, "learning_rate": 0.0012035449360632302, "loss": 2.6031, "step": 16809 }, { "epoch": 0.45, "learning_rate": 0.001203459718211588, "loss": 2.2368, "step": 16810 }, { "epoch": 0.45, "learning_rate": 0.0012033744988185714, "loss": 2.9246, "step": 16811 }, { "epoch": 0.45, "learning_rate": 0.0012032892778848256, "loss": 2.7271, "step": 16812 }, { "epoch": 0.45, "learning_rate": 0.0012032040554109968, "loss": 2.696, "step": 16813 }, { "epoch": 0.45, "learning_rate": 0.0012031188313977304, "loss": 2.5381, "step": 16814 }, { "epoch": 0.45, "learning_rate": 0.001203033605845672, "loss": 2.9094, "step": 16815 }, { "epoch": 0.45, "learning_rate": 0.0012029483787554674, "loss": 2.558, "step": 16816 }, { "epoch": 0.45, "learning_rate": 0.001202863150127762, "loss": 2.3881, "step": 16817 }, { "epoch": 0.45, "learning_rate": 0.001202777919963202, "loss": 2.9432, "step": 16818 }, { "epoch": 0.45, "learning_rate": 0.0012026926882624323, "loss": 2.7737, "step": 16819 }, { "epoch": 0.45, "learning_rate": 0.0012026074550260993, "loss": 2.4771, "step": 16820 }, { "epoch": 0.45, "learning_rate": 0.0012025222202548484, "loss": 2.6632, "step": 16821 }, { "epoch": 0.45, "learning_rate": 0.0012024369839493253, "loss": 2.4285, "step": 16822 }, { "epoch": 0.45, "learning_rate": 0.0012023517461101755, "loss": 2.3384, "step": 16823 }, { "epoch": 0.45, "learning_rate": 0.0012022665067380456, "loss": 2.4621, "step": 16824 }, { "epoch": 0.45, "learning_rate": 0.0012021812658335805, "loss": 2.7563, "step": 16825 }, { "epoch": 0.45, "learning_rate": 0.0012020960233974263, "loss": 2.4144, "step": 16826 }, { "epoch": 0.45, "learning_rate": 0.0012020107794302288, "loss": 2.4564, "step": 16827 }, { "epoch": 0.45, "learning_rate": 0.0012019255339326337, "loss": 2.5377, "step": 16828 }, { "epoch": 0.45, "learning_rate": 0.0012018402869052869, "loss": 2.7112, "step": 16829 }, { "epoch": 0.45, "learning_rate": 0.0012017550383488342, "loss": 2.4332, "step": 16830 }, { "epoch": 0.45, "learning_rate": 0.0012016697882639216, "loss": 2.7272, "step": 16831 }, { "epoch": 0.45, "learning_rate": 0.0012015845366511943, "loss": 2.7013, "step": 16832 }, { "epoch": 0.45, "learning_rate": 0.0012014992835112988, "loss": 2.5625, "step": 16833 }, { "epoch": 0.45, "learning_rate": 0.001201414028844881, "loss": 2.3872, "step": 16834 }, { "epoch": 0.45, "learning_rate": 0.0012013287726525864, "loss": 2.8153, "step": 16835 }, { "epoch": 0.45, "learning_rate": 0.0012012435149350606, "loss": 2.5728, "step": 16836 }, { "epoch": 0.45, "learning_rate": 0.00120115825569295, "loss": 2.5128, "step": 16837 }, { "epoch": 0.45, "learning_rate": 0.001201072994926901, "loss": 2.4107, "step": 16838 }, { "epoch": 0.45, "learning_rate": 0.0012009877326375584, "loss": 2.5039, "step": 16839 }, { "epoch": 0.45, "learning_rate": 0.0012009024688255689, "loss": 2.6653, "step": 16840 }, { "epoch": 0.45, "learning_rate": 0.001200817203491578, "loss": 2.6766, "step": 16841 }, { "epoch": 0.45, "learning_rate": 0.0012007319366362324, "loss": 2.754, "step": 16842 }, { "epoch": 0.45, "learning_rate": 0.0012006466682601769, "loss": 2.7763, "step": 16843 }, { "epoch": 0.45, "learning_rate": 0.0012005613983640587, "loss": 2.9666, "step": 16844 }, { "epoch": 0.45, "learning_rate": 0.0012004761269485227, "loss": 2.6163, "step": 16845 }, { "epoch": 0.45, "learning_rate": 0.0012003908540142154, "loss": 2.7895, "step": 16846 }, { "epoch": 0.45, "learning_rate": 0.0012003055795617831, "loss": 2.5712, "step": 16847 }, { "epoch": 0.45, "learning_rate": 0.0012002203035918716, "loss": 2.5539, "step": 16848 }, { "epoch": 0.45, "learning_rate": 0.0012001350261051265, "loss": 2.4121, "step": 16849 }, { "epoch": 0.45, "learning_rate": 0.0012000497471021945, "loss": 2.8308, "step": 16850 }, { "epoch": 0.45, "learning_rate": 0.0011999644665837215, "loss": 2.4337, "step": 16851 }, { "epoch": 0.45, "learning_rate": 0.0011998791845503531, "loss": 2.2278, "step": 16852 }, { "epoch": 0.45, "learning_rate": 0.001199793901002736, "loss": 2.288, "step": 16853 }, { "epoch": 0.45, "learning_rate": 0.0011997086159415157, "loss": 2.7644, "step": 16854 }, { "epoch": 0.45, "learning_rate": 0.001199623329367339, "loss": 2.5611, "step": 16855 }, { "epoch": 0.45, "learning_rate": 0.0011995380412808516, "loss": 3.1658, "step": 16856 }, { "epoch": 0.45, "learning_rate": 0.0011994527516826993, "loss": 2.5074, "step": 16857 }, { "epoch": 0.45, "learning_rate": 0.0011993674605735292, "loss": 2.3848, "step": 16858 }, { "epoch": 0.45, "learning_rate": 0.0011992821679539865, "loss": 2.2402, "step": 16859 }, { "epoch": 0.45, "learning_rate": 0.0011991968738247177, "loss": 2.321, "step": 16860 }, { "epoch": 0.45, "learning_rate": 0.0011991115781863691, "loss": 2.879, "step": 16861 }, { "epoch": 0.45, "learning_rate": 0.0011990262810395867, "loss": 2.4813, "step": 16862 }, { "epoch": 0.45, "learning_rate": 0.0011989409823850168, "loss": 2.1393, "step": 16863 }, { "epoch": 0.45, "learning_rate": 0.0011988556822233056, "loss": 2.299, "step": 16864 }, { "epoch": 0.45, "learning_rate": 0.0011987703805550996, "loss": 2.3898, "step": 16865 }, { "epoch": 0.45, "learning_rate": 0.0011986850773810442, "loss": 2.8384, "step": 16866 }, { "epoch": 0.45, "learning_rate": 0.0011985997727017865, "loss": 2.3343, "step": 16867 }, { "epoch": 0.45, "learning_rate": 0.0011985144665179724, "loss": 2.9255, "step": 16868 }, { "epoch": 0.45, "learning_rate": 0.001198429158830248, "loss": 2.0475, "step": 16869 }, { "epoch": 0.45, "learning_rate": 0.00119834384963926, "loss": 2.6609, "step": 16870 }, { "epoch": 0.45, "learning_rate": 0.0011982585389456546, "loss": 2.8838, "step": 16871 }, { "epoch": 0.45, "learning_rate": 0.0011981732267500776, "loss": 2.47, "step": 16872 }, { "epoch": 0.45, "learning_rate": 0.0011980879130531756, "loss": 2.5071, "step": 16873 }, { "epoch": 0.45, "learning_rate": 0.0011980025978555954, "loss": 2.29, "step": 16874 }, { "epoch": 0.45, "learning_rate": 0.0011979172811579827, "loss": 2.8489, "step": 16875 }, { "epoch": 0.45, "learning_rate": 0.0011978319629609839, "loss": 2.5032, "step": 16876 }, { "epoch": 0.45, "learning_rate": 0.0011977466432652457, "loss": 2.2822, "step": 16877 }, { "epoch": 0.45, "learning_rate": 0.0011976613220714145, "loss": 2.6055, "step": 16878 }, { "epoch": 0.45, "learning_rate": 0.0011975759993801361, "loss": 2.739, "step": 16879 }, { "epoch": 0.45, "learning_rate": 0.0011974906751920573, "loss": 2.7344, "step": 16880 }, { "epoch": 0.45, "learning_rate": 0.0011974053495078247, "loss": 2.2989, "step": 16881 }, { "epoch": 0.45, "learning_rate": 0.0011973200223280842, "loss": 2.5463, "step": 16882 }, { "epoch": 0.45, "learning_rate": 0.0011972346936534827, "loss": 2.4539, "step": 16883 }, { "epoch": 0.45, "learning_rate": 0.0011971493634846662, "loss": 2.5867, "step": 16884 }, { "epoch": 0.45, "learning_rate": 0.0011970640318222816, "loss": 2.6917, "step": 16885 }, { "epoch": 0.45, "learning_rate": 0.0011969786986669748, "loss": 2.2382, "step": 16886 }, { "epoch": 0.45, "learning_rate": 0.001196893364019393, "loss": 3.0146, "step": 16887 }, { "epoch": 0.45, "learning_rate": 0.001196808027880182, "loss": 2.5773, "step": 16888 }, { "epoch": 0.45, "learning_rate": 0.0011967226902499886, "loss": 2.6622, "step": 16889 }, { "epoch": 0.45, "learning_rate": 0.0011966373511294592, "loss": 2.5798, "step": 16890 }, { "epoch": 0.45, "learning_rate": 0.0011965520105192407, "loss": 2.5185, "step": 16891 }, { "epoch": 0.45, "learning_rate": 0.0011964666684199789, "loss": 2.4167, "step": 16892 }, { "epoch": 0.45, "learning_rate": 0.001196381324832321, "loss": 2.6458, "step": 16893 }, { "epoch": 0.45, "learning_rate": 0.0011962959797569132, "loss": 2.5099, "step": 16894 }, { "epoch": 0.45, "learning_rate": 0.0011962106331944024, "loss": 2.525, "step": 16895 }, { "epoch": 0.45, "learning_rate": 0.0011961252851454345, "loss": 2.6905, "step": 16896 }, { "epoch": 0.45, "learning_rate": 0.0011960399356106567, "loss": 2.6976, "step": 16897 }, { "epoch": 0.45, "learning_rate": 0.0011959545845907156, "loss": 2.8279, "step": 16898 }, { "epoch": 0.45, "learning_rate": 0.0011958692320862571, "loss": 2.4437, "step": 16899 }, { "epoch": 0.45, "learning_rate": 0.001195783878097929, "loss": 2.3228, "step": 16900 }, { "epoch": 0.45, "learning_rate": 0.0011956985226263769, "loss": 1.9169, "step": 16901 }, { "epoch": 0.45, "learning_rate": 0.0011956131656722475, "loss": 2.5088, "step": 16902 }, { "epoch": 0.45, "learning_rate": 0.0011955278072361879, "loss": 2.6637, "step": 16903 }, { "epoch": 0.45, "learning_rate": 0.0011954424473188448, "loss": 2.3495, "step": 16904 }, { "epoch": 0.45, "learning_rate": 0.0011953570859208644, "loss": 2.3138, "step": 16905 }, { "epoch": 0.45, "learning_rate": 0.001195271723042894, "loss": 2.6965, "step": 16906 }, { "epoch": 0.45, "learning_rate": 0.0011951863586855795, "loss": 2.6918, "step": 16907 }, { "epoch": 0.45, "learning_rate": 0.0011951009928495683, "loss": 2.436, "step": 16908 }, { "epoch": 0.45, "learning_rate": 0.0011950156255355069, "loss": 2.2591, "step": 16909 }, { "epoch": 0.45, "learning_rate": 0.0011949302567440421, "loss": 2.3075, "step": 16910 }, { "epoch": 0.45, "learning_rate": 0.00119484488647582, "loss": 2.2926, "step": 16911 }, { "epoch": 0.45, "learning_rate": 0.0011947595147314882, "loss": 1.7868, "step": 16912 }, { "epoch": 0.45, "learning_rate": 0.0011946741415116934, "loss": 2.6507, "step": 16913 }, { "epoch": 0.45, "learning_rate": 0.0011945887668170817, "loss": 2.6037, "step": 16914 }, { "epoch": 0.45, "learning_rate": 0.0011945033906483004, "loss": 2.5227, "step": 16915 }, { "epoch": 0.45, "learning_rate": 0.0011944180130059963, "loss": 2.5573, "step": 16916 }, { "epoch": 0.45, "learning_rate": 0.0011943326338908161, "loss": 2.5632, "step": 16917 }, { "epoch": 0.45, "learning_rate": 0.0011942472533034065, "loss": 2.2173, "step": 16918 }, { "epoch": 0.45, "learning_rate": 0.0011941618712444143, "loss": 2.8317, "step": 16919 }, { "epoch": 0.45, "learning_rate": 0.0011940764877144867, "loss": 2.2455, "step": 16920 }, { "epoch": 0.45, "learning_rate": 0.0011939911027142704, "loss": 2.7627, "step": 16921 }, { "epoch": 0.45, "learning_rate": 0.001193905716244412, "loss": 2.6768, "step": 16922 }, { "epoch": 0.45, "learning_rate": 0.0011938203283055585, "loss": 2.6405, "step": 16923 }, { "epoch": 0.45, "learning_rate": 0.0011937349388983572, "loss": 2.3914, "step": 16924 }, { "epoch": 0.45, "learning_rate": 0.001193649548023454, "loss": 2.8231, "step": 16925 }, { "epoch": 0.45, "learning_rate": 0.001193564155681497, "loss": 2.2654, "step": 16926 }, { "epoch": 0.45, "learning_rate": 0.0011934787618731325, "loss": 2.7305, "step": 16927 }, { "epoch": 0.45, "learning_rate": 0.0011933933665990073, "loss": 2.437, "step": 16928 }, { "epoch": 0.45, "learning_rate": 0.0011933079698597689, "loss": 2.6554, "step": 16929 }, { "epoch": 0.45, "learning_rate": 0.0011932225716560637, "loss": 2.2893, "step": 16930 }, { "epoch": 0.45, "learning_rate": 0.0011931371719885386, "loss": 2.5156, "step": 16931 }, { "epoch": 0.46, "learning_rate": 0.0011930517708578408, "loss": 2.3864, "step": 16932 }, { "epoch": 0.46, "learning_rate": 0.0011929663682646178, "loss": 3.0728, "step": 16933 }, { "epoch": 0.46, "learning_rate": 0.0011928809642095155, "loss": 2.5639, "step": 16934 }, { "epoch": 0.46, "learning_rate": 0.0011927955586931815, "loss": 2.6383, "step": 16935 }, { "epoch": 0.46, "learning_rate": 0.0011927101517162633, "loss": 2.4796, "step": 16936 }, { "epoch": 0.46, "learning_rate": 0.0011926247432794072, "loss": 2.5457, "step": 16937 }, { "epoch": 0.46, "learning_rate": 0.0011925393333832605, "loss": 1.8985, "step": 16938 }, { "epoch": 0.46, "learning_rate": 0.0011924539220284703, "loss": 2.0764, "step": 16939 }, { "epoch": 0.46, "learning_rate": 0.0011923685092156836, "loss": 2.3718, "step": 16940 }, { "epoch": 0.46, "learning_rate": 0.0011922830949455472, "loss": 3.0944, "step": 16941 }, { "epoch": 0.46, "learning_rate": 0.0011921976792187085, "loss": 2.2658, "step": 16942 }, { "epoch": 0.46, "learning_rate": 0.0011921122620358149, "loss": 2.6285, "step": 16943 }, { "epoch": 0.46, "learning_rate": 0.001192026843397513, "loss": 2.9137, "step": 16944 }, { "epoch": 0.46, "learning_rate": 0.0011919414233044498, "loss": 2.8312, "step": 16945 }, { "epoch": 0.46, "learning_rate": 0.001191856001757273, "loss": 2.5174, "step": 16946 }, { "epoch": 0.46, "learning_rate": 0.0011917705787566294, "loss": 2.1405, "step": 16947 }, { "epoch": 0.46, "learning_rate": 0.001191685154303166, "loss": 2.8371, "step": 16948 }, { "epoch": 0.46, "learning_rate": 0.0011915997283975304, "loss": 2.8597, "step": 16949 }, { "epoch": 0.46, "learning_rate": 0.0011915143010403694, "loss": 2.5869, "step": 16950 }, { "epoch": 0.46, "learning_rate": 0.0011914288722323302, "loss": 2.3578, "step": 16951 }, { "epoch": 0.46, "learning_rate": 0.00119134344197406, "loss": 2.8517, "step": 16952 }, { "epoch": 0.46, "learning_rate": 0.0011912580102662064, "loss": 2.0965, "step": 16953 }, { "epoch": 0.46, "learning_rate": 0.0011911725771094161, "loss": 2.2807, "step": 16954 }, { "epoch": 0.46, "learning_rate": 0.0011910871425043364, "loss": 2.6677, "step": 16955 }, { "epoch": 0.46, "learning_rate": 0.001191001706451615, "loss": 2.9939, "step": 16956 }, { "epoch": 0.46, "learning_rate": 0.001190916268951899, "loss": 2.6207, "step": 16957 }, { "epoch": 0.46, "learning_rate": 0.0011908308300058346, "loss": 3.0933, "step": 16958 }, { "epoch": 0.46, "learning_rate": 0.0011907453896140708, "loss": 2.1935, "step": 16959 }, { "epoch": 0.46, "learning_rate": 0.0011906599477772538, "loss": 2.3129, "step": 16960 }, { "epoch": 0.46, "learning_rate": 0.001190574504496031, "loss": 2.6472, "step": 16961 }, { "epoch": 0.46, "learning_rate": 0.0011904890597710495, "loss": 3.1314, "step": 16962 }, { "epoch": 0.46, "learning_rate": 0.0011904036136029578, "loss": 2.6384, "step": 16963 }, { "epoch": 0.46, "learning_rate": 0.0011903181659924018, "loss": 2.6054, "step": 16964 }, { "epoch": 0.46, "learning_rate": 0.0011902327169400293, "loss": 2.5291, "step": 16965 }, { "epoch": 0.46, "learning_rate": 0.0011901472664464878, "loss": 2.2939, "step": 16966 }, { "epoch": 0.46, "learning_rate": 0.0011900618145124248, "loss": 2.503, "step": 16967 }, { "epoch": 0.46, "learning_rate": 0.0011899763611384875, "loss": 2.3353, "step": 16968 }, { "epoch": 0.46, "learning_rate": 0.0011898909063253228, "loss": 2.2065, "step": 16969 }, { "epoch": 0.46, "learning_rate": 0.0011898054500735793, "loss": 2.7233, "step": 16970 }, { "epoch": 0.46, "learning_rate": 0.001189719992383903, "loss": 2.4964, "step": 16971 }, { "epoch": 0.46, "learning_rate": 0.0011896345332569425, "loss": 2.69, "step": 16972 }, { "epoch": 0.46, "learning_rate": 0.0011895490726933442, "loss": 2.0661, "step": 16973 }, { "epoch": 0.46, "learning_rate": 0.0011894636106937564, "loss": 2.569, "step": 16974 }, { "epoch": 0.46, "learning_rate": 0.0011893781472588258, "loss": 2.4477, "step": 16975 }, { "epoch": 0.46, "learning_rate": 0.0011892926823892005, "loss": 1.9947, "step": 16976 }, { "epoch": 0.46, "learning_rate": 0.0011892072160855274, "loss": 2.1609, "step": 16977 }, { "epoch": 0.46, "learning_rate": 0.0011891217483484544, "loss": 2.2567, "step": 16978 }, { "epoch": 0.46, "learning_rate": 0.0011890362791786289, "loss": 2.3584, "step": 16979 }, { "epoch": 0.46, "learning_rate": 0.0011889508085766985, "loss": 2.3775, "step": 16980 }, { "epoch": 0.46, "learning_rate": 0.0011888653365433103, "loss": 2.3701, "step": 16981 }, { "epoch": 0.46, "learning_rate": 0.001188779863079112, "loss": 2.4767, "step": 16982 }, { "epoch": 0.46, "learning_rate": 0.0011886943881847514, "loss": 2.557, "step": 16983 }, { "epoch": 0.46, "learning_rate": 0.0011886089118608755, "loss": 2.5812, "step": 16984 }, { "epoch": 0.46, "learning_rate": 0.0011885234341081326, "loss": 2.5007, "step": 16985 }, { "epoch": 0.46, "learning_rate": 0.0011884379549271698, "loss": 2.4522, "step": 16986 }, { "epoch": 0.46, "learning_rate": 0.0011883524743186349, "loss": 2.6392, "step": 16987 }, { "epoch": 0.46, "learning_rate": 0.001188266992283175, "loss": 2.2012, "step": 16988 }, { "epoch": 0.46, "learning_rate": 0.001188181508821438, "loss": 2.4357, "step": 16989 }, { "epoch": 0.46, "learning_rate": 0.001188096023934072, "loss": 2.2732, "step": 16990 }, { "epoch": 0.46, "learning_rate": 0.0011880105376217236, "loss": 2.8898, "step": 16991 }, { "epoch": 0.46, "learning_rate": 0.0011879250498850415, "loss": 2.4832, "step": 16992 }, { "epoch": 0.46, "learning_rate": 0.0011878395607246724, "loss": 2.5674, "step": 16993 }, { "epoch": 0.46, "learning_rate": 0.0011877540701412644, "loss": 2.4075, "step": 16994 }, { "epoch": 0.46, "learning_rate": 0.0011876685781354653, "loss": 2.5653, "step": 16995 }, { "epoch": 0.46, "learning_rate": 0.0011875830847079226, "loss": 2.494, "step": 16996 }, { "epoch": 0.46, "learning_rate": 0.0011874975898592838, "loss": 2.8671, "step": 16997 }, { "epoch": 0.46, "learning_rate": 0.001187412093590197, "loss": 2.7002, "step": 16998 }, { "epoch": 0.46, "learning_rate": 0.0011873265959013095, "loss": 2.7202, "step": 16999 }, { "epoch": 0.46, "learning_rate": 0.0011872410967932697, "loss": 2.3336, "step": 17000 }, { "epoch": 0.46, "learning_rate": 0.001187155596266724, "loss": 2.2476, "step": 17001 }, { "epoch": 0.46, "learning_rate": 0.0011870700943223214, "loss": 2.219, "step": 17002 }, { "epoch": 0.46, "learning_rate": 0.0011869845909607093, "loss": 2.265, "step": 17003 }, { "epoch": 0.46, "learning_rate": 0.0011868990861825352, "loss": 2.2901, "step": 17004 }, { "epoch": 0.46, "learning_rate": 0.001186813579988447, "loss": 2.6465, "step": 17005 }, { "epoch": 0.46, "learning_rate": 0.0011867280723790927, "loss": 2.4427, "step": 17006 }, { "epoch": 0.46, "learning_rate": 0.0011866425633551198, "loss": 2.7932, "step": 17007 }, { "epoch": 0.46, "learning_rate": 0.001186557052917176, "loss": 2.1486, "step": 17008 }, { "epoch": 0.46, "learning_rate": 0.0011864715410659099, "loss": 2.2281, "step": 17009 }, { "epoch": 0.46, "learning_rate": 0.0011863860278019684, "loss": 2.4529, "step": 17010 }, { "epoch": 0.46, "learning_rate": 0.0011863005131259995, "loss": 2.3841, "step": 17011 }, { "epoch": 0.46, "learning_rate": 0.0011862149970386516, "loss": 2.44, "step": 17012 }, { "epoch": 0.46, "learning_rate": 0.001186129479540572, "loss": 2.4499, "step": 17013 }, { "epoch": 0.46, "learning_rate": 0.0011860439606324086, "loss": 2.3737, "step": 17014 }, { "epoch": 0.46, "learning_rate": 0.0011859584403148095, "loss": 2.5787, "step": 17015 }, { "epoch": 0.46, "learning_rate": 0.0011858729185884225, "loss": 2.6628, "step": 17016 }, { "epoch": 0.46, "learning_rate": 0.0011857873954538958, "loss": 2.0267, "step": 17017 }, { "epoch": 0.46, "learning_rate": 0.0011857018709118766, "loss": 2.5036, "step": 17018 }, { "epoch": 0.46, "learning_rate": 0.0011856163449630135, "loss": 2.2721, "step": 17019 }, { "epoch": 0.46, "learning_rate": 0.0011855308176079537, "loss": 3.2163, "step": 17020 }, { "epoch": 0.46, "learning_rate": 0.001185445288847346, "loss": 2.8867, "step": 17021 }, { "epoch": 0.46, "learning_rate": 0.0011853597586818378, "loss": 2.6073, "step": 17022 }, { "epoch": 0.46, "learning_rate": 0.0011852742271120775, "loss": 2.2811, "step": 17023 }, { "epoch": 0.46, "learning_rate": 0.0011851886941387122, "loss": 2.7384, "step": 17024 }, { "epoch": 0.46, "learning_rate": 0.001185103159762391, "loss": 2.2415, "step": 17025 }, { "epoch": 0.46, "learning_rate": 0.0011850176239837614, "loss": 2.3013, "step": 17026 }, { "epoch": 0.46, "learning_rate": 0.001184932086803471, "loss": 2.5273, "step": 17027 }, { "epoch": 0.46, "learning_rate": 0.0011848465482221682, "loss": 2.3636, "step": 17028 }, { "epoch": 0.46, "learning_rate": 0.001184761008240501, "loss": 2.7668, "step": 17029 }, { "epoch": 0.46, "learning_rate": 0.0011846754668591178, "loss": 2.2415, "step": 17030 }, { "epoch": 0.46, "learning_rate": 0.001184589924078666, "loss": 2.2553, "step": 17031 }, { "epoch": 0.46, "learning_rate": 0.0011845043798997938, "loss": 2.4563, "step": 17032 }, { "epoch": 0.46, "learning_rate": 0.0011844188343231496, "loss": 2.4545, "step": 17033 }, { "epoch": 0.46, "learning_rate": 0.0011843332873493814, "loss": 2.2139, "step": 17034 }, { "epoch": 0.46, "learning_rate": 0.0011842477389791368, "loss": 2.4537, "step": 17035 }, { "epoch": 0.46, "learning_rate": 0.0011841621892130646, "loss": 2.7701, "step": 17036 }, { "epoch": 0.46, "learning_rate": 0.0011840766380518122, "loss": 2.5579, "step": 17037 }, { "epoch": 0.46, "learning_rate": 0.0011839910854960286, "loss": 2.3032, "step": 17038 }, { "epoch": 0.46, "learning_rate": 0.0011839055315463613, "loss": 2.4746, "step": 17039 }, { "epoch": 0.46, "learning_rate": 0.0011838199762034584, "loss": 1.946, "step": 17040 }, { "epoch": 0.46, "learning_rate": 0.001183734419467968, "loss": 2.893, "step": 17041 }, { "epoch": 0.46, "learning_rate": 0.0011836488613405389, "loss": 2.7333, "step": 17042 }, { "epoch": 0.46, "learning_rate": 0.001183563301821819, "loss": 2.8777, "step": 17043 }, { "epoch": 0.46, "learning_rate": 0.0011834777409124558, "loss": 2.4422, "step": 17044 }, { "epoch": 0.46, "learning_rate": 0.0011833921786130984, "loss": 2.7811, "step": 17045 }, { "epoch": 0.46, "learning_rate": 0.0011833066149243945, "loss": 2.5087, "step": 17046 }, { "epoch": 0.46, "learning_rate": 0.0011832210498469923, "loss": 2.4173, "step": 17047 }, { "epoch": 0.46, "learning_rate": 0.0011831354833815404, "loss": 2.677, "step": 17048 }, { "epoch": 0.46, "learning_rate": 0.0011830499155286872, "loss": 2.2621, "step": 17049 }, { "epoch": 0.46, "learning_rate": 0.0011829643462890798, "loss": 2.4878, "step": 17050 }, { "epoch": 0.46, "learning_rate": 0.0011828787756633676, "loss": 2.3515, "step": 17051 }, { "epoch": 0.46, "learning_rate": 0.0011827932036521987, "loss": 2.3661, "step": 17052 }, { "epoch": 0.46, "learning_rate": 0.001182707630256221, "loss": 2.4516, "step": 17053 }, { "epoch": 0.46, "learning_rate": 0.0011826220554760826, "loss": 2.3145, "step": 17054 }, { "epoch": 0.46, "learning_rate": 0.0011825364793124327, "loss": 2.8085, "step": 17055 }, { "epoch": 0.46, "learning_rate": 0.001182450901765919, "loss": 2.6404, "step": 17056 }, { "epoch": 0.46, "learning_rate": 0.0011823653228371896, "loss": 3.0923, "step": 17057 }, { "epoch": 0.46, "learning_rate": 0.0011822797425268931, "loss": 2.7206, "step": 17058 }, { "epoch": 0.46, "learning_rate": 0.001182194160835678, "loss": 1.9663, "step": 17059 }, { "epoch": 0.46, "learning_rate": 0.0011821085777641927, "loss": 2.4825, "step": 17060 }, { "epoch": 0.46, "learning_rate": 0.001182022993313085, "loss": 2.6033, "step": 17061 }, { "epoch": 0.46, "learning_rate": 0.001181937407483004, "loss": 3.0894, "step": 17062 }, { "epoch": 0.46, "learning_rate": 0.0011818518202745976, "loss": 2.4303, "step": 17063 }, { "epoch": 0.46, "learning_rate": 0.001181766231688514, "loss": 2.7081, "step": 17064 }, { "epoch": 0.46, "learning_rate": 0.0011816806417254025, "loss": 2.121, "step": 17065 }, { "epoch": 0.46, "learning_rate": 0.0011815950503859108, "loss": 2.375, "step": 17066 }, { "epoch": 0.46, "learning_rate": 0.0011815094576706868, "loss": 3.0211, "step": 17067 }, { "epoch": 0.46, "learning_rate": 0.0011814238635803804, "loss": 1.9648, "step": 17068 }, { "epoch": 0.46, "learning_rate": 0.001181338268115639, "loss": 2.399, "step": 17069 }, { "epoch": 0.46, "learning_rate": 0.0011812526712771112, "loss": 2.6057, "step": 17070 }, { "epoch": 0.46, "learning_rate": 0.0011811670730654455, "loss": 2.4477, "step": 17071 }, { "epoch": 0.46, "learning_rate": 0.0011810814734812907, "loss": 2.7176, "step": 17072 }, { "epoch": 0.46, "learning_rate": 0.001180995872525295, "loss": 2.8175, "step": 17073 }, { "epoch": 0.46, "learning_rate": 0.001180910270198107, "loss": 2.5621, "step": 17074 }, { "epoch": 0.46, "learning_rate": 0.0011808246665003749, "loss": 2.7336, "step": 17075 }, { "epoch": 0.46, "learning_rate": 0.0011807390614327474, "loss": 2.3492, "step": 17076 }, { "epoch": 0.46, "learning_rate": 0.0011806534549958733, "loss": 2.0955, "step": 17077 }, { "epoch": 0.46, "learning_rate": 0.001180567847190401, "loss": 2.3801, "step": 17078 }, { "epoch": 0.46, "learning_rate": 0.0011804822380169786, "loss": 2.399, "step": 17079 }, { "epoch": 0.46, "learning_rate": 0.001180396627476255, "loss": 2.6053, "step": 17080 }, { "epoch": 0.46, "learning_rate": 0.0011803110155688792, "loss": 2.4442, "step": 17081 }, { "epoch": 0.46, "learning_rate": 0.0011802254022954992, "loss": 2.4945, "step": 17082 }, { "epoch": 0.46, "learning_rate": 0.0011801397876567638, "loss": 2.411, "step": 17083 }, { "epoch": 0.46, "learning_rate": 0.0011800541716533216, "loss": 2.4058, "step": 17084 }, { "epoch": 0.46, "learning_rate": 0.0011799685542858212, "loss": 2.8079, "step": 17085 }, { "epoch": 0.46, "learning_rate": 0.001179882935554911, "loss": 2.7369, "step": 17086 }, { "epoch": 0.46, "learning_rate": 0.00117979731546124, "loss": 2.4733, "step": 17087 }, { "epoch": 0.46, "learning_rate": 0.0011797116940054568, "loss": 2.796, "step": 17088 }, { "epoch": 0.46, "learning_rate": 0.0011796260711882099, "loss": 2.8011, "step": 17089 }, { "epoch": 0.46, "learning_rate": 0.0011795404470101476, "loss": 2.1934, "step": 17090 }, { "epoch": 0.46, "learning_rate": 0.0011794548214719195, "loss": 2.5606, "step": 17091 }, { "epoch": 0.46, "learning_rate": 0.0011793691945741736, "loss": 2.5576, "step": 17092 }, { "epoch": 0.46, "learning_rate": 0.0011792835663175585, "loss": 2.9595, "step": 17093 }, { "epoch": 0.46, "learning_rate": 0.0011791979367027235, "loss": 2.9734, "step": 17094 }, { "epoch": 0.46, "learning_rate": 0.0011791123057303169, "loss": 2.852, "step": 17095 }, { "epoch": 0.46, "learning_rate": 0.0011790266734009874, "loss": 2.738, "step": 17096 }, { "epoch": 0.46, "learning_rate": 0.001178941039715384, "loss": 2.3331, "step": 17097 }, { "epoch": 0.46, "learning_rate": 0.0011788554046741548, "loss": 2.9256, "step": 17098 }, { "epoch": 0.46, "learning_rate": 0.0011787697682779494, "loss": 2.7861, "step": 17099 }, { "epoch": 0.46, "learning_rate": 0.001178684130527416, "loss": 3.191, "step": 17100 }, { "epoch": 0.46, "learning_rate": 0.0011785984914232039, "loss": 2.6016, "step": 17101 }, { "epoch": 0.46, "learning_rate": 0.0011785128509659614, "loss": 2.6724, "step": 17102 }, { "epoch": 0.46, "learning_rate": 0.0011784272091563373, "loss": 2.6335, "step": 17103 }, { "epoch": 0.46, "learning_rate": 0.0011783415659949808, "loss": 2.5856, "step": 17104 }, { "epoch": 0.46, "learning_rate": 0.0011782559214825407, "loss": 2.9143, "step": 17105 }, { "epoch": 0.46, "learning_rate": 0.001178170275619665, "loss": 2.2306, "step": 17106 }, { "epoch": 0.46, "learning_rate": 0.0011780846284070035, "loss": 2.4327, "step": 17107 }, { "epoch": 0.46, "learning_rate": 0.0011779989798452047, "loss": 2.6464, "step": 17108 }, { "epoch": 0.46, "learning_rate": 0.0011779133299349173, "loss": 2.4925, "step": 17109 }, { "epoch": 0.46, "learning_rate": 0.0011778276786767903, "loss": 2.9248, "step": 17110 }, { "epoch": 0.46, "learning_rate": 0.001177742026071473, "loss": 2.5407, "step": 17111 }, { "epoch": 0.46, "learning_rate": 0.0011776563721196134, "loss": 2.8227, "step": 17112 }, { "epoch": 0.46, "learning_rate": 0.001177570716821861, "loss": 2.4551, "step": 17113 }, { "epoch": 0.46, "learning_rate": 0.0011774850601788647, "loss": 1.9572, "step": 17114 }, { "epoch": 0.46, "learning_rate": 0.0011773994021912733, "loss": 2.7995, "step": 17115 }, { "epoch": 0.46, "learning_rate": 0.0011773137428597357, "loss": 2.5119, "step": 17116 }, { "epoch": 0.46, "learning_rate": 0.001177228082184901, "loss": 2.2756, "step": 17117 }, { "epoch": 0.46, "learning_rate": 0.001177142420167418, "loss": 2.3378, "step": 17118 }, { "epoch": 0.46, "learning_rate": 0.0011770567568079357, "loss": 1.9736, "step": 17119 }, { "epoch": 0.46, "learning_rate": 0.001176971092107103, "loss": 3.019, "step": 17120 }, { "epoch": 0.46, "learning_rate": 0.0011768854260655686, "loss": 2.2424, "step": 17121 }, { "epoch": 0.46, "learning_rate": 0.0011767997586839825, "loss": 2.8096, "step": 17122 }, { "epoch": 0.46, "learning_rate": 0.0011767140899629925, "loss": 2.6126, "step": 17123 }, { "epoch": 0.46, "learning_rate": 0.0011766284199032483, "loss": 2.3502, "step": 17124 }, { "epoch": 0.46, "learning_rate": 0.001176542748505399, "loss": 2.2368, "step": 17125 }, { "epoch": 0.46, "learning_rate": 0.0011764570757700934, "loss": 2.5003, "step": 17126 }, { "epoch": 0.46, "learning_rate": 0.0011763714016979803, "loss": 2.1492, "step": 17127 }, { "epoch": 0.46, "learning_rate": 0.0011762857262897092, "loss": 2.8692, "step": 17128 }, { "epoch": 0.46, "learning_rate": 0.0011762000495459286, "loss": 2.3043, "step": 17129 }, { "epoch": 0.46, "learning_rate": 0.0011761143714672882, "loss": 2.2909, "step": 17130 }, { "epoch": 0.46, "learning_rate": 0.0011760286920544367, "loss": 2.6511, "step": 17131 }, { "epoch": 0.46, "learning_rate": 0.0011759430113080236, "loss": 2.6126, "step": 17132 }, { "epoch": 0.46, "learning_rate": 0.0011758573292286972, "loss": 2.2353, "step": 17133 }, { "epoch": 0.46, "learning_rate": 0.0011757716458171074, "loss": 2.8157, "step": 17134 }, { "epoch": 0.46, "learning_rate": 0.0011756859610739033, "loss": 2.8334, "step": 17135 }, { "epoch": 0.46, "learning_rate": 0.0011756002749997334, "loss": 2.3946, "step": 17136 }, { "epoch": 0.46, "learning_rate": 0.001175514587595247, "loss": 2.4595, "step": 17137 }, { "epoch": 0.46, "learning_rate": 0.001175428898861094, "loss": 2.1618, "step": 17138 }, { "epoch": 0.46, "learning_rate": 0.001175343208797923, "loss": 2.5794, "step": 17139 }, { "epoch": 0.46, "learning_rate": 0.0011752575174063828, "loss": 2.8113, "step": 17140 }, { "epoch": 0.46, "learning_rate": 0.001175171824687123, "loss": 2.5129, "step": 17141 }, { "epoch": 0.46, "learning_rate": 0.0011750861306407932, "loss": 2.3103, "step": 17142 }, { "epoch": 0.46, "learning_rate": 0.0011750004352680417, "loss": 2.9319, "step": 17143 }, { "epoch": 0.46, "learning_rate": 0.0011749147385695187, "loss": 2.6196, "step": 17144 }, { "epoch": 0.46, "learning_rate": 0.0011748290405458723, "loss": 3.0962, "step": 17145 }, { "epoch": 0.46, "learning_rate": 0.0011747433411977526, "loss": 2.2201, "step": 17146 }, { "epoch": 0.46, "learning_rate": 0.001174657640525809, "loss": 2.2948, "step": 17147 }, { "epoch": 0.46, "learning_rate": 0.00117457193853069, "loss": 3.1189, "step": 17148 }, { "epoch": 0.46, "learning_rate": 0.0011744862352130452, "loss": 2.641, "step": 17149 }, { "epoch": 0.46, "learning_rate": 0.0011744005305735236, "loss": 2.7973, "step": 17150 }, { "epoch": 0.46, "learning_rate": 0.0011743148246127753, "loss": 2.381, "step": 17151 }, { "epoch": 0.46, "learning_rate": 0.001174229117331449, "loss": 2.5193, "step": 17152 }, { "epoch": 0.46, "learning_rate": 0.0011741434087301935, "loss": 2.5853, "step": 17153 }, { "epoch": 0.46, "learning_rate": 0.001174057698809659, "loss": 2.3016, "step": 17154 }, { "epoch": 0.46, "learning_rate": 0.0011739719875704946, "loss": 2.2056, "step": 17155 }, { "epoch": 0.46, "learning_rate": 0.0011738862750133494, "loss": 2.3675, "step": 17156 }, { "epoch": 0.46, "learning_rate": 0.0011738005611388728, "loss": 2.6806, "step": 17157 }, { "epoch": 0.46, "learning_rate": 0.0011737148459477144, "loss": 2.4372, "step": 17158 }, { "epoch": 0.46, "learning_rate": 0.0011736291294405232, "loss": 2.4151, "step": 17159 }, { "epoch": 0.46, "learning_rate": 0.001173543411617949, "loss": 2.4782, "step": 17160 }, { "epoch": 0.46, "learning_rate": 0.001173457692480641, "loss": 2.4657, "step": 17161 }, { "epoch": 0.46, "learning_rate": 0.0011733719720292482, "loss": 2.5346, "step": 17162 }, { "epoch": 0.46, "learning_rate": 0.0011732862502644205, "loss": 2.8945, "step": 17163 }, { "epoch": 0.46, "learning_rate": 0.001173200527186807, "loss": 3.0252, "step": 17164 }, { "epoch": 0.46, "learning_rate": 0.0011731148027970574, "loss": 2.7721, "step": 17165 }, { "epoch": 0.46, "learning_rate": 0.001173029077095821, "loss": 3.3709, "step": 17166 }, { "epoch": 0.46, "learning_rate": 0.0011729433500837474, "loss": 2.5324, "step": 17167 }, { "epoch": 0.46, "learning_rate": 0.0011728576217614856, "loss": 2.1196, "step": 17168 }, { "epoch": 0.46, "learning_rate": 0.0011727718921296854, "loss": 3.015, "step": 17169 }, { "epoch": 0.46, "learning_rate": 0.0011726861611889964, "loss": 2.549, "step": 17170 }, { "epoch": 0.46, "learning_rate": 0.001172600428940068, "loss": 2.4566, "step": 17171 }, { "epoch": 0.46, "learning_rate": 0.0011725146953835495, "loss": 2.3719, "step": 17172 }, { "epoch": 0.46, "learning_rate": 0.0011724289605200904, "loss": 2.6247, "step": 17173 }, { "epoch": 0.46, "learning_rate": 0.0011723432243503406, "loss": 2.55, "step": 17174 }, { "epoch": 0.46, "learning_rate": 0.0011722574868749491, "loss": 2.6661, "step": 17175 }, { "epoch": 0.46, "learning_rate": 0.0011721717480945655, "loss": 2.5811, "step": 17176 }, { "epoch": 0.46, "learning_rate": 0.0011720860080098397, "loss": 2.8232, "step": 17177 }, { "epoch": 0.46, "learning_rate": 0.0011720002666214214, "loss": 2.4391, "step": 17178 }, { "epoch": 0.46, "learning_rate": 0.0011719145239299593, "loss": 2.7088, "step": 17179 }, { "epoch": 0.46, "learning_rate": 0.0011718287799361037, "loss": 3.0578, "step": 17180 }, { "epoch": 0.46, "learning_rate": 0.001171743034640504, "loss": 2.4749, "step": 17181 }, { "epoch": 0.46, "learning_rate": 0.00117165728804381, "loss": 2.7824, "step": 17182 }, { "epoch": 0.46, "learning_rate": 0.0011715715401466708, "loss": 2.5849, "step": 17183 }, { "epoch": 0.46, "learning_rate": 0.0011714857909497364, "loss": 2.827, "step": 17184 }, { "epoch": 0.46, "learning_rate": 0.0011714000404536562, "loss": 2.338, "step": 17185 }, { "epoch": 0.46, "learning_rate": 0.00117131428865908, "loss": 2.4392, "step": 17186 }, { "epoch": 0.46, "learning_rate": 0.0011712285355666575, "loss": 2.651, "step": 17187 }, { "epoch": 0.46, "learning_rate": 0.001171142781177038, "loss": 2.4025, "step": 17188 }, { "epoch": 0.46, "learning_rate": 0.0011710570254908714, "loss": 2.4366, "step": 17189 }, { "epoch": 0.46, "learning_rate": 0.0011709712685088077, "loss": 2.4093, "step": 17190 }, { "epoch": 0.46, "learning_rate": 0.001170885510231496, "loss": 2.9185, "step": 17191 }, { "epoch": 0.46, "learning_rate": 0.0011707997506595863, "loss": 2.4892, "step": 17192 }, { "epoch": 0.46, "learning_rate": 0.0011707139897937278, "loss": 2.6918, "step": 17193 }, { "epoch": 0.46, "learning_rate": 0.0011706282276345713, "loss": 2.3159, "step": 17194 }, { "epoch": 0.46, "learning_rate": 0.0011705424641827653, "loss": 2.8045, "step": 17195 }, { "epoch": 0.46, "learning_rate": 0.0011704566994389604, "loss": 2.4602, "step": 17196 }, { "epoch": 0.46, "learning_rate": 0.0011703709334038059, "loss": 2.6282, "step": 17197 }, { "epoch": 0.46, "learning_rate": 0.0011702851660779516, "loss": 2.339, "step": 17198 }, { "epoch": 0.46, "learning_rate": 0.0011701993974620472, "loss": 2.8242, "step": 17199 }, { "epoch": 0.46, "learning_rate": 0.001170113627556743, "loss": 2.2348, "step": 17200 }, { "epoch": 0.46, "learning_rate": 0.0011700278563626884, "loss": 2.954, "step": 17201 }, { "epoch": 0.46, "learning_rate": 0.0011699420838805327, "loss": 2.3254, "step": 17202 }, { "epoch": 0.46, "learning_rate": 0.0011698563101109262, "loss": 2.4323, "step": 17203 }, { "epoch": 0.46, "learning_rate": 0.0011697705350545192, "loss": 3.0159, "step": 17204 }, { "epoch": 0.46, "learning_rate": 0.0011696847587119607, "loss": 2.6658, "step": 17205 }, { "epoch": 0.46, "learning_rate": 0.0011695989810839007, "loss": 2.5543, "step": 17206 }, { "epoch": 0.46, "learning_rate": 0.0011695132021709892, "loss": 2.5439, "step": 17207 }, { "epoch": 0.46, "learning_rate": 0.001169427421973876, "loss": 2.7776, "step": 17208 }, { "epoch": 0.46, "learning_rate": 0.0011693416404932107, "loss": 2.1262, "step": 17209 }, { "epoch": 0.46, "learning_rate": 0.001169255857729644, "loss": 2.4437, "step": 17210 }, { "epoch": 0.46, "learning_rate": 0.0011691700736838246, "loss": 2.5953, "step": 17211 }, { "epoch": 0.46, "learning_rate": 0.001169084288356403, "loss": 2.7557, "step": 17212 }, { "epoch": 0.46, "learning_rate": 0.0011689985017480293, "loss": 2.4101, "step": 17213 }, { "epoch": 0.46, "learning_rate": 0.0011689127138593534, "loss": 2.3391, "step": 17214 }, { "epoch": 0.46, "learning_rate": 0.0011688269246910245, "loss": 1.945, "step": 17215 }, { "epoch": 0.46, "learning_rate": 0.001168741134243693, "loss": 2.5512, "step": 17216 }, { "epoch": 0.46, "learning_rate": 0.0011686553425180094, "loss": 2.5249, "step": 17217 }, { "epoch": 0.46, "learning_rate": 0.0011685695495146228, "loss": 2.8, "step": 17218 }, { "epoch": 0.46, "learning_rate": 0.0011684837552341828, "loss": 2.5165, "step": 17219 }, { "epoch": 0.46, "learning_rate": 0.0011683979596773407, "loss": 2.506, "step": 17220 }, { "epoch": 0.46, "learning_rate": 0.0011683121628447456, "loss": 2.3405, "step": 17221 }, { "epoch": 0.46, "learning_rate": 0.0011682263647370475, "loss": 2.8635, "step": 17222 }, { "epoch": 0.46, "learning_rate": 0.0011681405653548966, "loss": 1.9325, "step": 17223 }, { "epoch": 0.46, "learning_rate": 0.001168054764698943, "loss": 2.7201, "step": 17224 }, { "epoch": 0.46, "learning_rate": 0.0011679689627698364, "loss": 2.4048, "step": 17225 }, { "epoch": 0.46, "learning_rate": 0.001167883159568227, "loss": 2.6119, "step": 17226 }, { "epoch": 0.46, "learning_rate": 0.001167797355094765, "loss": 2.5216, "step": 17227 }, { "epoch": 0.46, "learning_rate": 0.0011677115493501, "loss": 2.301, "step": 17228 }, { "epoch": 0.46, "learning_rate": 0.0011676257423348822, "loss": 2.6214, "step": 17229 }, { "epoch": 0.46, "learning_rate": 0.0011675399340497618, "loss": 2.3181, "step": 17230 }, { "epoch": 0.46, "learning_rate": 0.001167454124495389, "loss": 2.3628, "step": 17231 }, { "epoch": 0.46, "learning_rate": 0.0011673683136724136, "loss": 2.8496, "step": 17232 }, { "epoch": 0.46, "learning_rate": 0.001167282501581486, "loss": 3.0257, "step": 17233 }, { "epoch": 0.46, "learning_rate": 0.0011671966882232556, "loss": 2.219, "step": 17234 }, { "epoch": 0.46, "learning_rate": 0.0011671108735983734, "loss": 2.6511, "step": 17235 }, { "epoch": 0.46, "learning_rate": 0.0011670250577074889, "loss": 2.9717, "step": 17236 }, { "epoch": 0.46, "learning_rate": 0.0011669392405512524, "loss": 2.5933, "step": 17237 }, { "epoch": 0.46, "learning_rate": 0.001166853422130314, "loss": 2.9356, "step": 17238 }, { "epoch": 0.46, "learning_rate": 0.001166767602445324, "loss": 2.4443, "step": 17239 }, { "epoch": 0.46, "learning_rate": 0.0011666817814969326, "loss": 2.6291, "step": 17240 }, { "epoch": 0.46, "learning_rate": 0.0011665959592857898, "loss": 2.4809, "step": 17241 }, { "epoch": 0.46, "learning_rate": 0.0011665101358125454, "loss": 2.8324, "step": 17242 }, { "epoch": 0.46, "learning_rate": 0.0011664243110778502, "loss": 2.7408, "step": 17243 }, { "epoch": 0.46, "learning_rate": 0.0011663384850823543, "loss": 2.7708, "step": 17244 }, { "epoch": 0.46, "learning_rate": 0.0011662526578267076, "loss": 2.6606, "step": 17245 }, { "epoch": 0.46, "learning_rate": 0.0011661668293115606, "loss": 2.8981, "step": 17246 }, { "epoch": 0.46, "learning_rate": 0.0011660809995375637, "loss": 2.8505, "step": 17247 }, { "epoch": 0.46, "learning_rate": 0.0011659951685053663, "loss": 2.3661, "step": 17248 }, { "epoch": 0.46, "learning_rate": 0.0011659093362156195, "loss": 2.2932, "step": 17249 }, { "epoch": 0.46, "learning_rate": 0.0011658235026689731, "loss": 2.4972, "step": 17250 }, { "epoch": 0.46, "learning_rate": 0.0011657376678660776, "loss": 2.6954, "step": 17251 }, { "epoch": 0.46, "learning_rate": 0.001165651831807583, "loss": 2.1355, "step": 17252 }, { "epoch": 0.46, "learning_rate": 0.0011655659944941402, "loss": 2.1663, "step": 17253 }, { "epoch": 0.46, "learning_rate": 0.0011654801559263985, "loss": 2.6404, "step": 17254 }, { "epoch": 0.46, "learning_rate": 0.0011653943161050089, "loss": 2.3547, "step": 17255 }, { "epoch": 0.46, "learning_rate": 0.0011653084750306215, "loss": 2.7251, "step": 17256 }, { "epoch": 0.46, "learning_rate": 0.001165222632703887, "loss": 3.0003, "step": 17257 }, { "epoch": 0.46, "learning_rate": 0.0011651367891254546, "loss": 2.6447, "step": 17258 }, { "epoch": 0.46, "learning_rate": 0.001165050944295976, "loss": 2.6312, "step": 17259 }, { "epoch": 0.46, "learning_rate": 0.0011649650982161008, "loss": 2.9159, "step": 17260 }, { "epoch": 0.46, "learning_rate": 0.0011648792508864795, "loss": 2.5688, "step": 17261 }, { "epoch": 0.46, "learning_rate": 0.0011647934023077625, "loss": 2.5604, "step": 17262 }, { "epoch": 0.46, "learning_rate": 0.0011647075524806002, "loss": 2.3455, "step": 17263 }, { "epoch": 0.46, "learning_rate": 0.001164621701405643, "loss": 2.8528, "step": 17264 }, { "epoch": 0.46, "learning_rate": 0.0011645358490835409, "loss": 2.52, "step": 17265 }, { "epoch": 0.46, "learning_rate": 0.0011644499955149447, "loss": 2.7792, "step": 17266 }, { "epoch": 0.46, "learning_rate": 0.001164364140700505, "loss": 2.7874, "step": 17267 }, { "epoch": 0.46, "learning_rate": 0.0011642782846408718, "loss": 2.2628, "step": 17268 }, { "epoch": 0.46, "learning_rate": 0.0011641924273366954, "loss": 2.7722, "step": 17269 }, { "epoch": 0.46, "learning_rate": 0.0011641065687886271, "loss": 2.4695, "step": 17270 }, { "epoch": 0.46, "learning_rate": 0.0011640207089973168, "loss": 2.7292, "step": 17271 }, { "epoch": 0.46, "learning_rate": 0.0011639348479634145, "loss": 2.4559, "step": 17272 }, { "epoch": 0.46, "learning_rate": 0.001163848985687571, "loss": 2.275, "step": 17273 }, { "epoch": 0.46, "learning_rate": 0.0011637631221704371, "loss": 2.2956, "step": 17274 }, { "epoch": 0.46, "learning_rate": 0.0011636772574126631, "loss": 2.3791, "step": 17275 }, { "epoch": 0.46, "learning_rate": 0.0011635913914148995, "loss": 2.3501, "step": 17276 }, { "epoch": 0.46, "learning_rate": 0.0011635055241777964, "loss": 2.406, "step": 17277 }, { "epoch": 0.46, "learning_rate": 0.0011634196557020052, "loss": 2.5194, "step": 17278 }, { "epoch": 0.46, "learning_rate": 0.0011633337859881757, "loss": 3.0643, "step": 17279 }, { "epoch": 0.46, "learning_rate": 0.0011632479150369588, "loss": 2.3276, "step": 17280 }, { "epoch": 0.46, "learning_rate": 0.0011631620428490046, "loss": 2.7086, "step": 17281 }, { "epoch": 0.46, "learning_rate": 0.001163076169424964, "loss": 2.3618, "step": 17282 }, { "epoch": 0.46, "learning_rate": 0.0011629902947654877, "loss": 2.7338, "step": 17283 }, { "epoch": 0.46, "learning_rate": 0.0011629044188712259, "loss": 2.8806, "step": 17284 }, { "epoch": 0.46, "learning_rate": 0.001162818541742829, "loss": 2.499, "step": 17285 }, { "epoch": 0.46, "learning_rate": 0.0011627326633809486, "loss": 2.5233, "step": 17286 }, { "epoch": 0.46, "learning_rate": 0.0011626467837862343, "loss": 2.4265, "step": 17287 }, { "epoch": 0.46, "learning_rate": 0.0011625609029593368, "loss": 2.3471, "step": 17288 }, { "epoch": 0.46, "learning_rate": 0.0011624750209009071, "loss": 2.5844, "step": 17289 }, { "epoch": 0.46, "learning_rate": 0.001162389137611596, "loss": 2.3312, "step": 17290 }, { "epoch": 0.46, "learning_rate": 0.0011623032530920536, "loss": 2.5193, "step": 17291 }, { "epoch": 0.46, "learning_rate": 0.0011622173673429311, "loss": 2.2998, "step": 17292 }, { "epoch": 0.46, "learning_rate": 0.0011621314803648784, "loss": 2.3329, "step": 17293 }, { "epoch": 0.46, "learning_rate": 0.0011620455921585466, "loss": 2.213, "step": 17294 }, { "epoch": 0.46, "learning_rate": 0.0011619597027245866, "loss": 2.6027, "step": 17295 }, { "epoch": 0.46, "learning_rate": 0.0011618738120636486, "loss": 2.4704, "step": 17296 }, { "epoch": 0.46, "learning_rate": 0.001161787920176384, "loss": 2.1785, "step": 17297 }, { "epoch": 0.46, "learning_rate": 0.0011617020270634423, "loss": 2.3141, "step": 17298 }, { "epoch": 0.46, "learning_rate": 0.0011616161327254757, "loss": 2.6785, "step": 17299 }, { "epoch": 0.46, "learning_rate": 0.001161530237163134, "loss": 3.0354, "step": 17300 }, { "epoch": 0.46, "learning_rate": 0.0011614443403770679, "loss": 2.4093, "step": 17301 }, { "epoch": 0.46, "learning_rate": 0.0011613584423679282, "loss": 2.6196, "step": 17302 }, { "epoch": 0.46, "learning_rate": 0.001161272543136366, "loss": 2.5075, "step": 17303 }, { "epoch": 0.47, "learning_rate": 0.0011611866426830318, "loss": 2.5542, "step": 17304 }, { "epoch": 0.47, "learning_rate": 0.0011611007410085763, "loss": 2.6209, "step": 17305 }, { "epoch": 0.47, "learning_rate": 0.0011610148381136507, "loss": 2.5884, "step": 17306 }, { "epoch": 0.47, "learning_rate": 0.0011609289339989054, "loss": 2.3489, "step": 17307 }, { "epoch": 0.47, "learning_rate": 0.001160843028664991, "loss": 2.3015, "step": 17308 }, { "epoch": 0.47, "learning_rate": 0.0011607571221125589, "loss": 2.3926, "step": 17309 }, { "epoch": 0.47, "learning_rate": 0.0011606712143422593, "loss": 1.9801, "step": 17310 }, { "epoch": 0.47, "learning_rate": 0.0011605853053547434, "loss": 2.2993, "step": 17311 }, { "epoch": 0.47, "learning_rate": 0.001160499395150662, "loss": 2.9692, "step": 17312 }, { "epoch": 0.47, "learning_rate": 0.0011604134837306659, "loss": 2.9339, "step": 17313 }, { "epoch": 0.47, "learning_rate": 0.001160327571095406, "loss": 3.0026, "step": 17314 }, { "epoch": 0.47, "learning_rate": 0.0011602416572455327, "loss": 2.1746, "step": 17315 }, { "epoch": 0.47, "learning_rate": 0.0011601557421816976, "loss": 2.4394, "step": 17316 }, { "epoch": 0.47, "learning_rate": 0.0011600698259045512, "loss": 2.7298, "step": 17317 }, { "epoch": 0.47, "learning_rate": 0.0011599839084147443, "loss": 2.7689, "step": 17318 }, { "epoch": 0.47, "learning_rate": 0.001159897989712928, "loss": 2.2175, "step": 17319 }, { "epoch": 0.47, "learning_rate": 0.0011598120697997529, "loss": 2.6658, "step": 17320 }, { "epoch": 0.47, "learning_rate": 0.0011597261486758703, "loss": 1.733, "step": 17321 }, { "epoch": 0.47, "learning_rate": 0.0011596402263419313, "loss": 2.5779, "step": 17322 }, { "epoch": 0.47, "learning_rate": 0.0011595543027985863, "loss": 2.3499, "step": 17323 }, { "epoch": 0.47, "learning_rate": 0.0011594683780464861, "loss": 2.5704, "step": 17324 }, { "epoch": 0.47, "learning_rate": 0.0011593824520862819, "loss": 2.5911, "step": 17325 }, { "epoch": 0.47, "learning_rate": 0.001159296524918625, "loss": 2.4688, "step": 17326 }, { "epoch": 0.47, "learning_rate": 0.0011592105965441662, "loss": 2.5246, "step": 17327 }, { "epoch": 0.47, "learning_rate": 0.0011591246669635563, "loss": 2.824, "step": 17328 }, { "epoch": 0.47, "learning_rate": 0.0011590387361774463, "loss": 2.5143, "step": 17329 }, { "epoch": 0.47, "learning_rate": 0.0011589528041864876, "loss": 2.421, "step": 17330 }, { "epoch": 0.47, "learning_rate": 0.0011588668709913304, "loss": 2.1692, "step": 17331 }, { "epoch": 0.47, "learning_rate": 0.0011587809365926263, "loss": 2.6333, "step": 17332 }, { "epoch": 0.47, "learning_rate": 0.0011586950009910264, "loss": 2.5677, "step": 17333 }, { "epoch": 0.47, "learning_rate": 0.0011586090641871813, "loss": 2.638, "step": 17334 }, { "epoch": 0.47, "learning_rate": 0.0011585231261817426, "loss": 2.1904, "step": 17335 }, { "epoch": 0.47, "learning_rate": 0.001158437186975361, "loss": 2.4959, "step": 17336 }, { "epoch": 0.47, "learning_rate": 0.0011583512465686873, "loss": 2.3799, "step": 17337 }, { "epoch": 0.47, "learning_rate": 0.001158265304962373, "loss": 2.2813, "step": 17338 }, { "epoch": 0.47, "learning_rate": 0.0011581793621570694, "loss": 2.3863, "step": 17339 }, { "epoch": 0.47, "learning_rate": 0.0011580934181534266, "loss": 2.2617, "step": 17340 }, { "epoch": 0.47, "learning_rate": 0.0011580074729520967, "loss": 2.4636, "step": 17341 }, { "epoch": 0.47, "learning_rate": 0.0011579215265537304, "loss": 2.7058, "step": 17342 }, { "epoch": 0.47, "learning_rate": 0.0011578355789589787, "loss": 2.2115, "step": 17343 }, { "epoch": 0.47, "learning_rate": 0.001157749630168493, "loss": 2.1441, "step": 17344 }, { "epoch": 0.47, "learning_rate": 0.0011576636801829243, "loss": 2.4823, "step": 17345 }, { "epoch": 0.47, "learning_rate": 0.001157577729002924, "loss": 2.5367, "step": 17346 }, { "epoch": 0.47, "learning_rate": 0.0011574917766291426, "loss": 2.0085, "step": 17347 }, { "epoch": 0.47, "learning_rate": 0.0011574058230622317, "loss": 2.7496, "step": 17348 }, { "epoch": 0.47, "learning_rate": 0.0011573198683028428, "loss": 2.2831, "step": 17349 }, { "epoch": 0.47, "learning_rate": 0.0011572339123516265, "loss": 2.3003, "step": 17350 }, { "epoch": 0.47, "learning_rate": 0.0011571479552092336, "loss": 2.8688, "step": 17351 }, { "epoch": 0.47, "learning_rate": 0.0011570619968763168, "loss": 2.7409, "step": 17352 }, { "epoch": 0.47, "learning_rate": 0.0011569760373535262, "loss": 2.9419, "step": 17353 }, { "epoch": 0.47, "learning_rate": 0.0011568900766415126, "loss": 2.6945, "step": 17354 }, { "epoch": 0.47, "learning_rate": 0.0011568041147409283, "loss": 2.4509, "step": 17355 }, { "epoch": 0.47, "learning_rate": 0.001156718151652424, "loss": 2.6776, "step": 17356 }, { "epoch": 0.47, "learning_rate": 0.001156632187376651, "loss": 2.8842, "step": 17357 }, { "epoch": 0.47, "learning_rate": 0.0011565462219142607, "loss": 2.5999, "step": 17358 }, { "epoch": 0.47, "learning_rate": 0.0011564602552659041, "loss": 2.7119, "step": 17359 }, { "epoch": 0.47, "learning_rate": 0.0011563742874322325, "loss": 2.3431, "step": 17360 }, { "epoch": 0.47, "learning_rate": 0.0011562883184138974, "loss": 2.7449, "step": 17361 }, { "epoch": 0.47, "learning_rate": 0.0011562023482115497, "loss": 2.5947, "step": 17362 }, { "epoch": 0.47, "learning_rate": 0.0011561163768258411, "loss": 2.4465, "step": 17363 }, { "epoch": 0.47, "learning_rate": 0.0011560304042574226, "loss": 2.6869, "step": 17364 }, { "epoch": 0.47, "learning_rate": 0.0011559444305069457, "loss": 2.4829, "step": 17365 }, { "epoch": 0.47, "learning_rate": 0.001155858455575062, "loss": 3.1114, "step": 17366 }, { "epoch": 0.47, "learning_rate": 0.001155772479462422, "loss": 2.2732, "step": 17367 }, { "epoch": 0.47, "learning_rate": 0.0011556865021696778, "loss": 2.8812, "step": 17368 }, { "epoch": 0.47, "learning_rate": 0.0011556005236974807, "loss": 2.2889, "step": 17369 }, { "epoch": 0.47, "learning_rate": 0.0011555145440464813, "loss": 2.5256, "step": 17370 }, { "epoch": 0.47, "learning_rate": 0.001155428563217332, "loss": 2.6629, "step": 17371 }, { "epoch": 0.47, "learning_rate": 0.0011553425812106837, "loss": 3.2993, "step": 17372 }, { "epoch": 0.47, "learning_rate": 0.0011552565980271876, "loss": 2.7998, "step": 17373 }, { "epoch": 0.47, "learning_rate": 0.0011551706136674954, "loss": 2.1739, "step": 17374 }, { "epoch": 0.47, "learning_rate": 0.001155084628132258, "loss": 2.0192, "step": 17375 }, { "epoch": 0.47, "learning_rate": 0.0011549986414221276, "loss": 2.7079, "step": 17376 }, { "epoch": 0.47, "learning_rate": 0.001154912653537755, "loss": 2.4864, "step": 17377 }, { "epoch": 0.47, "learning_rate": 0.0011548266644797918, "loss": 2.2376, "step": 17378 }, { "epoch": 0.47, "learning_rate": 0.0011547406742488896, "loss": 2.124, "step": 17379 }, { "epoch": 0.47, "learning_rate": 0.0011546546828456999, "loss": 2.3859, "step": 17380 }, { "epoch": 0.47, "learning_rate": 0.0011545686902708736, "loss": 2.3748, "step": 17381 }, { "epoch": 0.47, "learning_rate": 0.0011544826965250625, "loss": 2.6328, "step": 17382 }, { "epoch": 0.47, "learning_rate": 0.0011543967016089186, "loss": 2.5884, "step": 17383 }, { "epoch": 0.47, "learning_rate": 0.0011543107055230924, "loss": 2.5171, "step": 17384 }, { "epoch": 0.47, "learning_rate": 0.0011542247082682363, "loss": 2.4597, "step": 17385 }, { "epoch": 0.47, "learning_rate": 0.001154138709845001, "loss": 2.2716, "step": 17386 }, { "epoch": 0.47, "learning_rate": 0.0011540527102540383, "loss": 2.4602, "step": 17387 }, { "epoch": 0.47, "learning_rate": 0.0011539667094960003, "loss": 2.6222, "step": 17388 }, { "epoch": 0.47, "learning_rate": 0.0011538807075715377, "loss": 2.3451, "step": 17389 }, { "epoch": 0.47, "learning_rate": 0.0011537947044813026, "loss": 2.8145, "step": 17390 }, { "epoch": 0.47, "learning_rate": 0.001153708700225946, "loss": 2.887, "step": 17391 }, { "epoch": 0.47, "learning_rate": 0.0011536226948061202, "loss": 2.6253, "step": 17392 }, { "epoch": 0.47, "learning_rate": 0.0011535366882224761, "loss": 2.4407, "step": 17393 }, { "epoch": 0.47, "learning_rate": 0.001153450680475665, "loss": 2.2377, "step": 17394 }, { "epoch": 0.47, "learning_rate": 0.0011533646715663397, "loss": 2.6038, "step": 17395 }, { "epoch": 0.47, "learning_rate": 0.001153278661495151, "loss": 3.2095, "step": 17396 }, { "epoch": 0.47, "learning_rate": 0.00115319265026275, "loss": 2.8102, "step": 17397 }, { "epoch": 0.47, "learning_rate": 0.0011531066378697894, "loss": 2.0797, "step": 17398 }, { "epoch": 0.47, "learning_rate": 0.00115302062431692, "loss": 2.8775, "step": 17399 }, { "epoch": 0.47, "learning_rate": 0.001152934609604794, "loss": 2.8975, "step": 17400 }, { "epoch": 0.47, "learning_rate": 0.0011528485937340627, "loss": 2.4952, "step": 17401 }, { "epoch": 0.47, "learning_rate": 0.0011527625767053776, "loss": 2.6576, "step": 17402 }, { "epoch": 0.47, "learning_rate": 0.0011526765585193905, "loss": 2.5508, "step": 17403 }, { "epoch": 0.47, "learning_rate": 0.0011525905391767534, "loss": 2.3569, "step": 17404 }, { "epoch": 0.47, "learning_rate": 0.0011525045186781173, "loss": 2.5085, "step": 17405 }, { "epoch": 0.47, "learning_rate": 0.0011524184970241342, "loss": 2.3513, "step": 17406 }, { "epoch": 0.47, "learning_rate": 0.0011523324742154562, "loss": 2.461, "step": 17407 }, { "epoch": 0.47, "learning_rate": 0.0011522464502527344, "loss": 2.4744, "step": 17408 }, { "epoch": 0.47, "learning_rate": 0.001152160425136621, "loss": 2.8976, "step": 17409 }, { "epoch": 0.47, "learning_rate": 0.0011520743988677666, "loss": 2.228, "step": 17410 }, { "epoch": 0.47, "learning_rate": 0.0011519883714468245, "loss": 2.5592, "step": 17411 }, { "epoch": 0.47, "learning_rate": 0.0011519023428744454, "loss": 2.3727, "step": 17412 }, { "epoch": 0.47, "learning_rate": 0.0011518163131512813, "loss": 2.6267, "step": 17413 }, { "epoch": 0.47, "learning_rate": 0.001151730282277984, "loss": 2.7338, "step": 17414 }, { "epoch": 0.47, "learning_rate": 0.0011516442502552053, "loss": 2.4424, "step": 17415 }, { "epoch": 0.47, "learning_rate": 0.001151558217083597, "loss": 2.5514, "step": 17416 }, { "epoch": 0.47, "learning_rate": 0.0011514721827638101, "loss": 2.5615, "step": 17417 }, { "epoch": 0.47, "learning_rate": 0.0011513861472964978, "loss": 2.6431, "step": 17418 }, { "epoch": 0.47, "learning_rate": 0.0011513001106823106, "loss": 2.2806, "step": 17419 }, { "epoch": 0.47, "learning_rate": 0.001151214072921901, "loss": 2.5064, "step": 17420 }, { "epoch": 0.47, "learning_rate": 0.0011511280340159205, "loss": 2.3676, "step": 17421 }, { "epoch": 0.47, "learning_rate": 0.0011510419939650212, "loss": 2.0708, "step": 17422 }, { "epoch": 0.47, "learning_rate": 0.0011509559527698545, "loss": 2.2998, "step": 17423 }, { "epoch": 0.47, "learning_rate": 0.0011508699104310729, "loss": 2.6637, "step": 17424 }, { "epoch": 0.47, "learning_rate": 0.0011507838669493275, "loss": 2.479, "step": 17425 }, { "epoch": 0.47, "learning_rate": 0.0011506978223252706, "loss": 2.3982, "step": 17426 }, { "epoch": 0.47, "learning_rate": 0.001150611776559554, "loss": 2.6418, "step": 17427 }, { "epoch": 0.47, "learning_rate": 0.0011505257296528296, "loss": 2.767, "step": 17428 }, { "epoch": 0.47, "learning_rate": 0.001150439681605749, "loss": 2.4344, "step": 17429 }, { "epoch": 0.47, "learning_rate": 0.001150353632418964, "loss": 2.5469, "step": 17430 }, { "epoch": 0.47, "learning_rate": 0.0011502675820931271, "loss": 2.8436, "step": 17431 }, { "epoch": 0.47, "learning_rate": 0.0011501815306288901, "loss": 2.8839, "step": 17432 }, { "epoch": 0.47, "learning_rate": 0.0011500954780269042, "loss": 2.3798, "step": 17433 }, { "epoch": 0.47, "learning_rate": 0.0011500094242878221, "loss": 2.1521, "step": 17434 }, { "epoch": 0.47, "learning_rate": 0.0011499233694122952, "loss": 2.3261, "step": 17435 }, { "epoch": 0.47, "learning_rate": 0.0011498373134009759, "loss": 2.7384, "step": 17436 }, { "epoch": 0.47, "learning_rate": 0.0011497512562545155, "loss": 2.6091, "step": 17437 }, { "epoch": 0.47, "learning_rate": 0.0011496651979735668, "loss": 2.5975, "step": 17438 }, { "epoch": 0.47, "learning_rate": 0.0011495791385587812, "loss": 2.5208, "step": 17439 }, { "epoch": 0.47, "learning_rate": 0.0011494930780108106, "loss": 2.7203, "step": 17440 }, { "epoch": 0.47, "learning_rate": 0.0011494070163303072, "loss": 2.2448, "step": 17441 }, { "epoch": 0.47, "learning_rate": 0.0011493209535179232, "loss": 2.3982, "step": 17442 }, { "epoch": 0.47, "learning_rate": 0.0011492348895743101, "loss": 2.4502, "step": 17443 }, { "epoch": 0.47, "learning_rate": 0.0011491488245001205, "loss": 2.5404, "step": 17444 }, { "epoch": 0.47, "learning_rate": 0.0011490627582960056, "loss": 3.016, "step": 17445 }, { "epoch": 0.47, "learning_rate": 0.0011489766909626182, "loss": 2.5289, "step": 17446 }, { "epoch": 0.47, "learning_rate": 0.00114889062250061, "loss": 2.8471, "step": 17447 }, { "epoch": 0.47, "learning_rate": 0.001148804552910633, "loss": 2.4051, "step": 17448 }, { "epoch": 0.47, "learning_rate": 0.0011487184821933393, "loss": 2.5667, "step": 17449 }, { "epoch": 0.47, "learning_rate": 0.001148632410349381, "loss": 2.1117, "step": 17450 }, { "epoch": 0.47, "learning_rate": 0.00114854633737941, "loss": 2.9852, "step": 17451 }, { "epoch": 0.47, "learning_rate": 0.0011484602632840788, "loss": 2.6439, "step": 17452 }, { "epoch": 0.47, "learning_rate": 0.001148374188064039, "loss": 2.6646, "step": 17453 }, { "epoch": 0.47, "learning_rate": 0.0011482881117199429, "loss": 2.3772, "step": 17454 }, { "epoch": 0.47, "learning_rate": 0.0011482020342524425, "loss": 2.514, "step": 17455 }, { "epoch": 0.47, "learning_rate": 0.0011481159556621901, "loss": 2.3557, "step": 17456 }, { "epoch": 0.47, "learning_rate": 0.0011480298759498375, "loss": 2.4167, "step": 17457 }, { "epoch": 0.47, "learning_rate": 0.0011479437951160373, "loss": 2.2333, "step": 17458 }, { "epoch": 0.47, "learning_rate": 0.0011478577131614413, "loss": 2.7377, "step": 17459 }, { "epoch": 0.47, "learning_rate": 0.0011477716300867015, "loss": 2.4019, "step": 17460 }, { "epoch": 0.47, "learning_rate": 0.0011476855458924704, "loss": 2.4851, "step": 17461 }, { "epoch": 0.47, "learning_rate": 0.0011475994605794, "loss": 2.8281, "step": 17462 }, { "epoch": 0.47, "learning_rate": 0.0011475133741481426, "loss": 2.6429, "step": 17463 }, { "epoch": 0.47, "learning_rate": 0.0011474272865993498, "loss": 2.329, "step": 17464 }, { "epoch": 0.47, "learning_rate": 0.0011473411979336747, "loss": 2.5322, "step": 17465 }, { "epoch": 0.47, "learning_rate": 0.0011472551081517688, "loss": 2.4418, "step": 17466 }, { "epoch": 0.47, "learning_rate": 0.0011471690172542848, "loss": 1.764, "step": 17467 }, { "epoch": 0.47, "learning_rate": 0.0011470829252418744, "loss": 2.1302, "step": 17468 }, { "epoch": 0.47, "learning_rate": 0.0011469968321151903, "loss": 2.5915, "step": 17469 }, { "epoch": 0.47, "learning_rate": 0.001146910737874884, "loss": 2.8591, "step": 17470 }, { "epoch": 0.47, "learning_rate": 0.0011468246425216087, "loss": 2.6686, "step": 17471 }, { "epoch": 0.47, "learning_rate": 0.0011467385460560157, "loss": 2.5933, "step": 17472 }, { "epoch": 0.47, "learning_rate": 0.001146652448478758, "loss": 2.5597, "step": 17473 }, { "epoch": 0.47, "learning_rate": 0.0011465663497904877, "loss": 2.5138, "step": 17474 }, { "epoch": 0.47, "learning_rate": 0.0011464802499918567, "loss": 2.36, "step": 17475 }, { "epoch": 0.47, "learning_rate": 0.0011463941490835175, "loss": 2.8633, "step": 17476 }, { "epoch": 0.47, "learning_rate": 0.0011463080470661224, "loss": 2.5182, "step": 17477 }, { "epoch": 0.47, "learning_rate": 0.001146221943940324, "loss": 2.2559, "step": 17478 }, { "epoch": 0.47, "learning_rate": 0.0011461358397067741, "loss": 2.3503, "step": 17479 }, { "epoch": 0.47, "learning_rate": 0.0011460497343661249, "loss": 2.4385, "step": 17480 }, { "epoch": 0.47, "learning_rate": 0.0011459636279190295, "loss": 2.9175, "step": 17481 }, { "epoch": 0.47, "learning_rate": 0.0011458775203661395, "loss": 2.4091, "step": 17482 }, { "epoch": 0.47, "learning_rate": 0.0011457914117081077, "loss": 2.5747, "step": 17483 }, { "epoch": 0.47, "learning_rate": 0.0011457053019455858, "loss": 2.8347, "step": 17484 }, { "epoch": 0.47, "learning_rate": 0.0011456191910792272, "loss": 2.3743, "step": 17485 }, { "epoch": 0.47, "learning_rate": 0.001145533079109683, "loss": 2.657, "step": 17486 }, { "epoch": 0.47, "learning_rate": 0.0011454469660376065, "loss": 2.3828, "step": 17487 }, { "epoch": 0.47, "learning_rate": 0.0011453608518636497, "loss": 2.7412, "step": 17488 }, { "epoch": 0.47, "learning_rate": 0.0011452747365884655, "loss": 2.8241, "step": 17489 }, { "epoch": 0.47, "learning_rate": 0.0011451886202127053, "loss": 2.5917, "step": 17490 }, { "epoch": 0.47, "learning_rate": 0.0011451025027370224, "loss": 2.5602, "step": 17491 }, { "epoch": 0.47, "learning_rate": 0.0011450163841620687, "loss": 1.9806, "step": 17492 }, { "epoch": 0.47, "learning_rate": 0.0011449302644884968, "loss": 2.2281, "step": 17493 }, { "epoch": 0.47, "learning_rate": 0.0011448441437169595, "loss": 2.4627, "step": 17494 }, { "epoch": 0.47, "learning_rate": 0.0011447580218481085, "loss": 2.3557, "step": 17495 }, { "epoch": 0.47, "learning_rate": 0.0011446718988825963, "loss": 2.0292, "step": 17496 }, { "epoch": 0.47, "learning_rate": 0.0011445857748210763, "loss": 2.7413, "step": 17497 }, { "epoch": 0.47, "learning_rate": 0.0011444996496642003, "loss": 2.5079, "step": 17498 }, { "epoch": 0.47, "learning_rate": 0.0011444135234126203, "loss": 2.4395, "step": 17499 }, { "epoch": 0.47, "learning_rate": 0.0011443273960669896, "loss": 2.6667, "step": 17500 }, { "epoch": 0.47, "learning_rate": 0.0011442412676279604, "loss": 2.8746, "step": 17501 }, { "epoch": 0.47, "learning_rate": 0.0011441551380961847, "loss": 2.8656, "step": 17502 }, { "epoch": 0.47, "learning_rate": 0.0011440690074723157, "loss": 2.1901, "step": 17503 }, { "epoch": 0.47, "learning_rate": 0.001143982875757006, "loss": 2.55, "step": 17504 }, { "epoch": 0.47, "learning_rate": 0.0011438967429509075, "loss": 2.633, "step": 17505 }, { "epoch": 0.47, "learning_rate": 0.0011438106090546727, "loss": 2.4518, "step": 17506 }, { "epoch": 0.47, "learning_rate": 0.0011437244740689547, "loss": 2.5286, "step": 17507 }, { "epoch": 0.47, "learning_rate": 0.0011436383379944059, "loss": 2.8266, "step": 17508 }, { "epoch": 0.47, "learning_rate": 0.0011435522008316785, "loss": 2.671, "step": 17509 }, { "epoch": 0.47, "learning_rate": 0.0011434660625814258, "loss": 2.549, "step": 17510 }, { "epoch": 0.47, "learning_rate": 0.001143379923244299, "loss": 2.559, "step": 17511 }, { "epoch": 0.47, "learning_rate": 0.0011432937828209525, "loss": 2.8596, "step": 17512 }, { "epoch": 0.47, "learning_rate": 0.0011432076413120371, "loss": 2.4868, "step": 17513 }, { "epoch": 0.47, "learning_rate": 0.001143121498718207, "loss": 2.5282, "step": 17514 }, { "epoch": 0.47, "learning_rate": 0.0011430353550401133, "loss": 3.0768, "step": 17515 }, { "epoch": 0.47, "learning_rate": 0.0011429492102784096, "loss": 2.7298, "step": 17516 }, { "epoch": 0.47, "learning_rate": 0.0011428630644337483, "loss": 2.5701, "step": 17517 }, { "epoch": 0.47, "learning_rate": 0.001142776917506782, "loss": 2.5953, "step": 17518 }, { "epoch": 0.47, "learning_rate": 0.0011426907694981627, "loss": 2.5705, "step": 17519 }, { "epoch": 0.47, "learning_rate": 0.0011426046204085444, "loss": 2.4382, "step": 17520 }, { "epoch": 0.47, "learning_rate": 0.001142518470238579, "loss": 2.7352, "step": 17521 }, { "epoch": 0.47, "learning_rate": 0.0011424323189889185, "loss": 2.5322, "step": 17522 }, { "epoch": 0.47, "learning_rate": 0.0011423461666602167, "loss": 3.0864, "step": 17523 }, { "epoch": 0.47, "learning_rate": 0.0011422600132531258, "loss": 2.6644, "step": 17524 }, { "epoch": 0.47, "learning_rate": 0.0011421738587682985, "loss": 2.3839, "step": 17525 }, { "epoch": 0.47, "learning_rate": 0.001142087703206387, "loss": 2.3415, "step": 17526 }, { "epoch": 0.47, "learning_rate": 0.0011420015465680449, "loss": 2.9927, "step": 17527 }, { "epoch": 0.47, "learning_rate": 0.0011419153888539244, "loss": 2.3319, "step": 17528 }, { "epoch": 0.47, "learning_rate": 0.0011418292300646783, "loss": 3.1283, "step": 17529 }, { "epoch": 0.47, "learning_rate": 0.001141743070200959, "loss": 3.0967, "step": 17530 }, { "epoch": 0.47, "learning_rate": 0.00114165690926342, "loss": 2.2398, "step": 17531 }, { "epoch": 0.47, "learning_rate": 0.0011415707472527132, "loss": 2.3692, "step": 17532 }, { "epoch": 0.47, "learning_rate": 0.001141484584169492, "loss": 2.5983, "step": 17533 }, { "epoch": 0.47, "learning_rate": 0.0011413984200144087, "loss": 2.8139, "step": 17534 }, { "epoch": 0.47, "learning_rate": 0.0011413122547881166, "loss": 2.3806, "step": 17535 }, { "epoch": 0.47, "learning_rate": 0.0011412260884912674, "loss": 2.3677, "step": 17536 }, { "epoch": 0.47, "learning_rate": 0.0011411399211245154, "loss": 2.5474, "step": 17537 }, { "epoch": 0.47, "learning_rate": 0.0011410537526885122, "loss": 2.5767, "step": 17538 }, { "epoch": 0.47, "learning_rate": 0.0011409675831839108, "loss": 2.8695, "step": 17539 }, { "epoch": 0.47, "learning_rate": 0.0011408814126113646, "loss": 2.7033, "step": 17540 }, { "epoch": 0.47, "learning_rate": 0.0011407952409715262, "loss": 2.4979, "step": 17541 }, { "epoch": 0.47, "learning_rate": 0.0011407090682650476, "loss": 2.899, "step": 17542 }, { "epoch": 0.47, "learning_rate": 0.0011406228944925822, "loss": 2.3582, "step": 17543 }, { "epoch": 0.47, "learning_rate": 0.0011405367196547836, "loss": 2.7763, "step": 17544 }, { "epoch": 0.47, "learning_rate": 0.0011404505437523035, "loss": 2.1369, "step": 17545 }, { "epoch": 0.47, "learning_rate": 0.001140364366785795, "loss": 2.21, "step": 17546 }, { "epoch": 0.47, "learning_rate": 0.0011402781887559115, "loss": 2.9514, "step": 17547 }, { "epoch": 0.47, "learning_rate": 0.0011401920096633057, "loss": 2.4361, "step": 17548 }, { "epoch": 0.47, "learning_rate": 0.0011401058295086297, "loss": 2.7951, "step": 17549 }, { "epoch": 0.47, "learning_rate": 0.0011400196482925374, "loss": 2.6681, "step": 17550 }, { "epoch": 0.47, "learning_rate": 0.0011399334660156812, "loss": 2.5997, "step": 17551 }, { "epoch": 0.47, "learning_rate": 0.0011398472826787138, "loss": 2.5677, "step": 17552 }, { "epoch": 0.47, "learning_rate": 0.001139761098282289, "loss": 2.8538, "step": 17553 }, { "epoch": 0.47, "learning_rate": 0.0011396749128270585, "loss": 2.5191, "step": 17554 }, { "epoch": 0.47, "learning_rate": 0.001139588726313676, "loss": 2.9363, "step": 17555 }, { "epoch": 0.47, "learning_rate": 0.0011395025387427944, "loss": 2.5603, "step": 17556 }, { "epoch": 0.47, "learning_rate": 0.0011394163501150668, "loss": 2.4123, "step": 17557 }, { "epoch": 0.47, "learning_rate": 0.0011393301604311452, "loss": 2.7231, "step": 17558 }, { "epoch": 0.47, "learning_rate": 0.0011392439696916834, "loss": 2.7122, "step": 17559 }, { "epoch": 0.47, "learning_rate": 0.0011391577778973345, "loss": 2.672, "step": 17560 }, { "epoch": 0.47, "learning_rate": 0.0011390715850487512, "loss": 2.6858, "step": 17561 }, { "epoch": 0.47, "learning_rate": 0.0011389853911465857, "loss": 2.2479, "step": 17562 }, { "epoch": 0.47, "learning_rate": 0.0011388991961914926, "loss": 2.2773, "step": 17563 }, { "epoch": 0.47, "learning_rate": 0.0011388130001841238, "loss": 2.7037, "step": 17564 }, { "epoch": 0.47, "learning_rate": 0.001138726803125132, "loss": 2.2991, "step": 17565 }, { "epoch": 0.47, "learning_rate": 0.0011386406050151712, "loss": 2.6685, "step": 17566 }, { "epoch": 0.47, "learning_rate": 0.0011385544058548937, "loss": 2.3231, "step": 17567 }, { "epoch": 0.47, "learning_rate": 0.0011384682056449534, "loss": 2.3524, "step": 17568 }, { "epoch": 0.47, "learning_rate": 0.0011383820043860018, "loss": 3.0007, "step": 17569 }, { "epoch": 0.47, "learning_rate": 0.0011382958020786935, "loss": 2.5654, "step": 17570 }, { "epoch": 0.47, "learning_rate": 0.001138209598723681, "loss": 2.6391, "step": 17571 }, { "epoch": 0.47, "learning_rate": 0.001138123394321617, "loss": 2.65, "step": 17572 }, { "epoch": 0.47, "learning_rate": 0.001138037188873155, "loss": 2.4276, "step": 17573 }, { "epoch": 0.47, "learning_rate": 0.0011379509823789477, "loss": 2.7795, "step": 17574 }, { "epoch": 0.47, "learning_rate": 0.0011378647748396488, "loss": 2.5612, "step": 17575 }, { "epoch": 0.47, "learning_rate": 0.0011377785662559107, "loss": 2.8522, "step": 17576 }, { "epoch": 0.47, "learning_rate": 0.001137692356628387, "loss": 1.9874, "step": 17577 }, { "epoch": 0.47, "learning_rate": 0.0011376061459577307, "loss": 2.7777, "step": 17578 }, { "epoch": 0.47, "learning_rate": 0.0011375199342445945, "loss": 2.7241, "step": 17579 }, { "epoch": 0.47, "learning_rate": 0.0011374337214896321, "loss": 2.5134, "step": 17580 }, { "epoch": 0.47, "learning_rate": 0.0011373475076934963, "loss": 2.1487, "step": 17581 }, { "epoch": 0.47, "learning_rate": 0.0011372612928568404, "loss": 2.5186, "step": 17582 }, { "epoch": 0.47, "learning_rate": 0.0011371750769803176, "loss": 2.9288, "step": 17583 }, { "epoch": 0.47, "learning_rate": 0.0011370888600645808, "loss": 2.4815, "step": 17584 }, { "epoch": 0.47, "learning_rate": 0.001137002642110283, "loss": 2.6015, "step": 17585 }, { "epoch": 0.47, "learning_rate": 0.001136916423118078, "loss": 2.7049, "step": 17586 }, { "epoch": 0.47, "learning_rate": 0.001136830203088619, "loss": 2.3136, "step": 17587 }, { "epoch": 0.47, "learning_rate": 0.0011367439820225585, "loss": 2.4632, "step": 17588 }, { "epoch": 0.47, "learning_rate": 0.0011366577599205498, "loss": 2.5229, "step": 17589 }, { "epoch": 0.47, "learning_rate": 0.0011365715367832468, "loss": 1.8449, "step": 17590 }, { "epoch": 0.47, "learning_rate": 0.001136485312611302, "loss": 2.5754, "step": 17591 }, { "epoch": 0.47, "learning_rate": 0.001136399087405369, "loss": 2.2168, "step": 17592 }, { "epoch": 0.47, "learning_rate": 0.0011363128611661007, "loss": 2.6769, "step": 17593 }, { "epoch": 0.47, "learning_rate": 0.0011362266338941507, "loss": 2.352, "step": 17594 }, { "epoch": 0.47, "learning_rate": 0.001136140405590172, "loss": 2.3479, "step": 17595 }, { "epoch": 0.47, "learning_rate": 0.001136054176254818, "loss": 2.3296, "step": 17596 }, { "epoch": 0.47, "learning_rate": 0.0011359679458887418, "loss": 2.8367, "step": 17597 }, { "epoch": 0.47, "learning_rate": 0.0011358817144925966, "loss": 2.2017, "step": 17598 }, { "epoch": 0.47, "learning_rate": 0.0011357954820670362, "loss": 2.7169, "step": 17599 }, { "epoch": 0.47, "learning_rate": 0.0011357092486127135, "loss": 2.4914, "step": 17600 }, { "epoch": 0.47, "learning_rate": 0.0011356230141302815, "loss": 2.7615, "step": 17601 }, { "epoch": 0.47, "learning_rate": 0.0011355367786203938, "loss": 2.5813, "step": 17602 }, { "epoch": 0.47, "learning_rate": 0.0011354505420837038, "loss": 2.1669, "step": 17603 }, { "epoch": 0.47, "learning_rate": 0.0011353643045208647, "loss": 2.0171, "step": 17604 }, { "epoch": 0.47, "learning_rate": 0.0011352780659325296, "loss": 2.401, "step": 17605 }, { "epoch": 0.47, "learning_rate": 0.0011351918263193526, "loss": 2.2645, "step": 17606 }, { "epoch": 0.47, "learning_rate": 0.0011351055856819864, "loss": 2.274, "step": 17607 }, { "epoch": 0.47, "learning_rate": 0.001135019344021084, "loss": 2.3286, "step": 17608 }, { "epoch": 0.47, "learning_rate": 0.0011349331013372995, "loss": 2.9229, "step": 17609 }, { "epoch": 0.47, "learning_rate": 0.0011348468576312858, "loss": 2.8575, "step": 17610 }, { "epoch": 0.47, "learning_rate": 0.0011347606129036964, "loss": 2.3541, "step": 17611 }, { "epoch": 0.47, "learning_rate": 0.0011346743671551847, "loss": 2.6243, "step": 17612 }, { "epoch": 0.47, "learning_rate": 0.0011345881203864044, "loss": 2.5597, "step": 17613 }, { "epoch": 0.47, "learning_rate": 0.0011345018725980084, "loss": 2.5619, "step": 17614 }, { "epoch": 0.47, "learning_rate": 0.00113441562379065, "loss": 2.6015, "step": 17615 }, { "epoch": 0.47, "learning_rate": 0.001134329373964983, "loss": 2.9887, "step": 17616 }, { "epoch": 0.47, "learning_rate": 0.0011342431231216607, "loss": 2.9514, "step": 17617 }, { "epoch": 0.47, "learning_rate": 0.0011341568712613364, "loss": 2.7848, "step": 17618 }, { "epoch": 0.47, "learning_rate": 0.0011340706183846638, "loss": 2.063, "step": 17619 }, { "epoch": 0.47, "learning_rate": 0.001133984364492296, "loss": 2.7314, "step": 17620 }, { "epoch": 0.47, "learning_rate": 0.0011338981095848871, "loss": 2.7071, "step": 17621 }, { "epoch": 0.47, "learning_rate": 0.0011338118536630894, "loss": 2.7102, "step": 17622 }, { "epoch": 0.47, "learning_rate": 0.0011337255967275575, "loss": 2.5373, "step": 17623 }, { "epoch": 0.47, "learning_rate": 0.001133639338778944, "loss": 2.7451, "step": 17624 }, { "epoch": 0.47, "learning_rate": 0.0011335530798179028, "loss": 2.9571, "step": 17625 }, { "epoch": 0.47, "learning_rate": 0.0011334668198450877, "loss": 2.5329, "step": 17626 }, { "epoch": 0.47, "learning_rate": 0.0011333805588611516, "loss": 2.3477, "step": 17627 }, { "epoch": 0.47, "learning_rate": 0.0011332942968667482, "loss": 2.3872, "step": 17628 }, { "epoch": 0.47, "learning_rate": 0.001133208033862531, "loss": 2.56, "step": 17629 }, { "epoch": 0.47, "learning_rate": 0.0011331217698491538, "loss": 2.1293, "step": 17630 }, { "epoch": 0.47, "learning_rate": 0.0011330355048272695, "loss": 2.7788, "step": 17631 }, { "epoch": 0.47, "learning_rate": 0.0011329492387975322, "loss": 2.5526, "step": 17632 }, { "epoch": 0.47, "learning_rate": 0.0011328629717605955, "loss": 2.6747, "step": 17633 }, { "epoch": 0.47, "learning_rate": 0.0011327767037171124, "loss": 2.1735, "step": 17634 }, { "epoch": 0.47, "learning_rate": 0.0011326904346677367, "loss": 2.4865, "step": 17635 }, { "epoch": 0.47, "learning_rate": 0.001132604164613122, "loss": 2.3069, "step": 17636 }, { "epoch": 0.47, "learning_rate": 0.001132517893553922, "loss": 3.3942, "step": 17637 }, { "epoch": 0.47, "learning_rate": 0.00113243162149079, "loss": 2.7497, "step": 17638 }, { "epoch": 0.47, "learning_rate": 0.0011323453484243795, "loss": 2.6649, "step": 17639 }, { "epoch": 0.47, "learning_rate": 0.0011322590743553446, "loss": 2.529, "step": 17640 }, { "epoch": 0.47, "learning_rate": 0.0011321727992843387, "loss": 2.7686, "step": 17641 }, { "epoch": 0.47, "learning_rate": 0.0011320865232120152, "loss": 2.0444, "step": 17642 }, { "epoch": 0.47, "learning_rate": 0.0011320002461390278, "loss": 2.2792, "step": 17643 }, { "epoch": 0.47, "learning_rate": 0.00113191396806603, "loss": 3.0206, "step": 17644 }, { "epoch": 0.47, "learning_rate": 0.0011318276889936757, "loss": 2.5648, "step": 17645 }, { "epoch": 0.47, "learning_rate": 0.0011317414089226183, "loss": 2.5772, "step": 17646 }, { "epoch": 0.47, "learning_rate": 0.0011316551278535117, "loss": 2.7156, "step": 17647 }, { "epoch": 0.47, "learning_rate": 0.0011315688457870091, "loss": 2.6049, "step": 17648 }, { "epoch": 0.47, "learning_rate": 0.0011314825627237648, "loss": 2.7676, "step": 17649 }, { "epoch": 0.47, "learning_rate": 0.001131396278664432, "loss": 2.4065, "step": 17650 }, { "epoch": 0.47, "learning_rate": 0.0011313099936096644, "loss": 2.6412, "step": 17651 }, { "epoch": 0.47, "learning_rate": 0.0011312237075601157, "loss": 2.5619, "step": 17652 }, { "epoch": 0.47, "learning_rate": 0.0011311374205164398, "loss": 2.4673, "step": 17653 }, { "epoch": 0.47, "learning_rate": 0.00113105113247929, "loss": 2.0451, "step": 17654 }, { "epoch": 0.47, "learning_rate": 0.0011309648434493205, "loss": 2.2933, "step": 17655 }, { "epoch": 0.47, "learning_rate": 0.0011308785534271848, "loss": 2.212, "step": 17656 }, { "epoch": 0.47, "learning_rate": 0.0011307922624135367, "loss": 2.5097, "step": 17657 }, { "epoch": 0.47, "learning_rate": 0.0011307059704090295, "loss": 2.9861, "step": 17658 }, { "epoch": 0.47, "learning_rate": 0.0011306196774143172, "loss": 2.6606, "step": 17659 }, { "epoch": 0.47, "learning_rate": 0.0011305333834300537, "loss": 2.4059, "step": 17660 }, { "epoch": 0.47, "learning_rate": 0.0011304470884568928, "loss": 2.874, "step": 17661 }, { "epoch": 0.47, "learning_rate": 0.0011303607924954878, "loss": 2.7862, "step": 17662 }, { "epoch": 0.47, "learning_rate": 0.0011302744955464929, "loss": 2.4156, "step": 17663 }, { "epoch": 0.47, "learning_rate": 0.0011301881976105614, "loss": 2.3069, "step": 17664 }, { "epoch": 0.47, "learning_rate": 0.0011301018986883478, "loss": 2.2941, "step": 17665 }, { "epoch": 0.47, "learning_rate": 0.0011300155987805055, "loss": 2.8205, "step": 17666 }, { "epoch": 0.47, "learning_rate": 0.0011299292978876878, "loss": 2.618, "step": 17667 }, { "epoch": 0.47, "learning_rate": 0.0011298429960105493, "loss": 2.1807, "step": 17668 }, { "epoch": 0.47, "learning_rate": 0.0011297566931497435, "loss": 2.5766, "step": 17669 }, { "epoch": 0.47, "learning_rate": 0.0011296703893059245, "loss": 2.6172, "step": 17670 }, { "epoch": 0.47, "learning_rate": 0.001129584084479745, "loss": 2.7036, "step": 17671 }, { "epoch": 0.47, "learning_rate": 0.0011294977786718602, "loss": 2.5976, "step": 17672 }, { "epoch": 0.47, "learning_rate": 0.0011294114718829234, "loss": 2.3631, "step": 17673 }, { "epoch": 0.47, "learning_rate": 0.0011293251641135882, "loss": 2.5285, "step": 17674 }, { "epoch": 0.47, "learning_rate": 0.0011292388553645085, "loss": 2.4674, "step": 17675 }, { "epoch": 0.48, "learning_rate": 0.0011291525456363386, "loss": 2.4074, "step": 17676 }, { "epoch": 0.48, "learning_rate": 0.0011290662349297323, "loss": 2.8268, "step": 17677 }, { "epoch": 0.48, "learning_rate": 0.0011289799232453428, "loss": 2.4285, "step": 17678 }, { "epoch": 0.48, "learning_rate": 0.001128893610583825, "loss": 2.7259, "step": 17679 }, { "epoch": 0.48, "learning_rate": 0.001128807296945832, "loss": 2.157, "step": 17680 }, { "epoch": 0.48, "learning_rate": 0.001128720982332018, "loss": 2.5714, "step": 17681 }, { "epoch": 0.48, "learning_rate": 0.0011286346667430368, "loss": 2.1819, "step": 17682 }, { "epoch": 0.48, "learning_rate": 0.0011285483501795423, "loss": 2.51, "step": 17683 }, { "epoch": 0.48, "learning_rate": 0.0011284620326421884, "loss": 2.3068, "step": 17684 }, { "epoch": 0.48, "learning_rate": 0.0011283757141316295, "loss": 2.5232, "step": 17685 }, { "epoch": 0.48, "learning_rate": 0.001128289394648519, "loss": 2.6039, "step": 17686 }, { "epoch": 0.48, "learning_rate": 0.0011282030741935109, "loss": 2.9133, "step": 17687 }, { "epoch": 0.48, "learning_rate": 0.0011281167527672589, "loss": 2.2945, "step": 17688 }, { "epoch": 0.48, "learning_rate": 0.0011280304303704178, "loss": 3.0018, "step": 17689 }, { "epoch": 0.48, "learning_rate": 0.0011279441070036406, "loss": 2.7317, "step": 17690 }, { "epoch": 0.48, "learning_rate": 0.001127857782667582, "loss": 2.5972, "step": 17691 }, { "epoch": 0.48, "learning_rate": 0.0011277714573628957, "loss": 2.0535, "step": 17692 }, { "epoch": 0.48, "learning_rate": 0.001127685131090236, "loss": 2.2949, "step": 17693 }, { "epoch": 0.48, "learning_rate": 0.0011275988038502555, "loss": 2.2849, "step": 17694 }, { "epoch": 0.48, "learning_rate": 0.0011275124756436104, "loss": 3.0574, "step": 17695 }, { "epoch": 0.48, "learning_rate": 0.0011274261464709532, "loss": 2.6845, "step": 17696 }, { "epoch": 0.48, "learning_rate": 0.0011273398163329383, "loss": 2.4896, "step": 17697 }, { "epoch": 0.48, "learning_rate": 0.0011272534852302194, "loss": 2.5278, "step": 17698 }, { "epoch": 0.48, "learning_rate": 0.0011271671531634512, "loss": 2.5441, "step": 17699 }, { "epoch": 0.48, "learning_rate": 0.0011270808201332876, "loss": 2.9365, "step": 17700 }, { "epoch": 0.48, "learning_rate": 0.001126994486140382, "loss": 2.378, "step": 17701 }, { "epoch": 0.48, "learning_rate": 0.001126908151185389, "loss": 2.5692, "step": 17702 }, { "epoch": 0.48, "learning_rate": 0.0011268218152689627, "loss": 2.4886, "step": 17703 }, { "epoch": 0.48, "learning_rate": 0.0011267354783917568, "loss": 2.1179, "step": 17704 }, { "epoch": 0.48, "learning_rate": 0.0011266491405544255, "loss": 2.9031, "step": 17705 }, { "epoch": 0.48, "learning_rate": 0.001126562801757623, "loss": 2.6344, "step": 17706 }, { "epoch": 0.48, "learning_rate": 0.0011264764620020034, "loss": 2.5155, "step": 17707 }, { "epoch": 0.48, "learning_rate": 0.001126390121288221, "loss": 2.0807, "step": 17708 }, { "epoch": 0.48, "learning_rate": 0.0011263037796169293, "loss": 3.2802, "step": 17709 }, { "epoch": 0.48, "learning_rate": 0.0011262174369887827, "loss": 2.3537, "step": 17710 }, { "epoch": 0.48, "learning_rate": 0.0011261310934044355, "loss": 2.7503, "step": 17711 }, { "epoch": 0.48, "learning_rate": 0.0011260447488645419, "loss": 2.0632, "step": 17712 }, { "epoch": 0.48, "learning_rate": 0.0011259584033697554, "loss": 2.8093, "step": 17713 }, { "epoch": 0.48, "learning_rate": 0.0011258720569207307, "loss": 2.7076, "step": 17714 }, { "epoch": 0.48, "learning_rate": 0.001125785709518122, "loss": 2.5864, "step": 17715 }, { "epoch": 0.48, "learning_rate": 0.001125699361162583, "loss": 2.8303, "step": 17716 }, { "epoch": 0.48, "learning_rate": 0.0011256130118547682, "loss": 2.7784, "step": 17717 }, { "epoch": 0.48, "learning_rate": 0.0011255266615953319, "loss": 2.7027, "step": 17718 }, { "epoch": 0.48, "learning_rate": 0.0011254403103849277, "loss": 2.298, "step": 17719 }, { "epoch": 0.48, "learning_rate": 0.0011253539582242104, "loss": 2.408, "step": 17720 }, { "epoch": 0.48, "learning_rate": 0.0011252676051138337, "loss": 2.7484, "step": 17721 }, { "epoch": 0.48, "learning_rate": 0.0011251812510544525, "loss": 2.0826, "step": 17722 }, { "epoch": 0.48, "learning_rate": 0.00112509489604672, "loss": 2.7226, "step": 17723 }, { "epoch": 0.48, "learning_rate": 0.001125008540091291, "loss": 2.2223, "step": 17724 }, { "epoch": 0.48, "learning_rate": 0.0011249221831888196, "loss": 2.4202, "step": 17725 }, { "epoch": 0.48, "learning_rate": 0.0011248358253399605, "loss": 3.0537, "step": 17726 }, { "epoch": 0.48, "learning_rate": 0.001124749466545367, "loss": 2.5264, "step": 17727 }, { "epoch": 0.48, "learning_rate": 0.0011246631068056942, "loss": 2.6934, "step": 17728 }, { "epoch": 0.48, "learning_rate": 0.001124576746121596, "loss": 2.5079, "step": 17729 }, { "epoch": 0.48, "learning_rate": 0.0011244903844937265, "loss": 2.8345, "step": 17730 }, { "epoch": 0.48, "learning_rate": 0.00112440402192274, "loss": 2.5139, "step": 17731 }, { "epoch": 0.48, "learning_rate": 0.0011243176584092912, "loss": 2.4139, "step": 17732 }, { "epoch": 0.48, "learning_rate": 0.0011242312939540335, "loss": 2.6059, "step": 17733 }, { "epoch": 0.48, "learning_rate": 0.0011241449285576222, "loss": 2.2254, "step": 17734 }, { "epoch": 0.48, "learning_rate": 0.001124058562220711, "loss": 2.6407, "step": 17735 }, { "epoch": 0.48, "learning_rate": 0.0011239721949439542, "loss": 2.6252, "step": 17736 }, { "epoch": 0.48, "learning_rate": 0.0011238858267280062, "loss": 2.7959, "step": 17737 }, { "epoch": 0.48, "learning_rate": 0.0011237994575735216, "loss": 2.0249, "step": 17738 }, { "epoch": 0.48, "learning_rate": 0.0011237130874811544, "loss": 2.6173, "step": 17739 }, { "epoch": 0.48, "learning_rate": 0.0011236267164515586, "loss": 2.8066, "step": 17740 }, { "epoch": 0.48, "learning_rate": 0.0011235403444853891, "loss": 2.6915, "step": 17741 }, { "epoch": 0.48, "learning_rate": 0.0011234539715833, "loss": 2.7235, "step": 17742 }, { "epoch": 0.48, "learning_rate": 0.0011233675977459462, "loss": 2.4961, "step": 17743 }, { "epoch": 0.48, "learning_rate": 0.001123281222973981, "loss": 2.4805, "step": 17744 }, { "epoch": 0.48, "learning_rate": 0.0011231948472680592, "loss": 2.4889, "step": 17745 }, { "epoch": 0.48, "learning_rate": 0.0011231084706288354, "loss": 2.969, "step": 17746 }, { "epoch": 0.48, "learning_rate": 0.0011230220930569638, "loss": 2.1119, "step": 17747 }, { "epoch": 0.48, "learning_rate": 0.0011229357145530992, "loss": 2.2382, "step": 17748 }, { "epoch": 0.48, "learning_rate": 0.001122849335117895, "loss": 2.9524, "step": 17749 }, { "epoch": 0.48, "learning_rate": 0.0011227629547520064, "loss": 2.808, "step": 17750 }, { "epoch": 0.48, "learning_rate": 0.001122676573456088, "loss": 2.431, "step": 17751 }, { "epoch": 0.48, "learning_rate": 0.0011225901912307935, "loss": 2.5486, "step": 17752 }, { "epoch": 0.48, "learning_rate": 0.0011225038080767775, "loss": 2.7117, "step": 17753 }, { "epoch": 0.48, "learning_rate": 0.0011224174239946947, "loss": 2.6615, "step": 17754 }, { "epoch": 0.48, "learning_rate": 0.0011223310389851995, "loss": 2.7277, "step": 17755 }, { "epoch": 0.48, "learning_rate": 0.001122244653048946, "loss": 2.5541, "step": 17756 }, { "epoch": 0.48, "learning_rate": 0.001122158266186589, "loss": 2.4321, "step": 17757 }, { "epoch": 0.48, "learning_rate": 0.0011220718783987828, "loss": 2.294, "step": 17758 }, { "epoch": 0.48, "learning_rate": 0.0011219854896861818, "loss": 2.7132, "step": 17759 }, { "epoch": 0.48, "learning_rate": 0.0011218991000494405, "loss": 2.341, "step": 17760 }, { "epoch": 0.48, "learning_rate": 0.0011218127094892137, "loss": 2.2834, "step": 17761 }, { "epoch": 0.48, "learning_rate": 0.0011217263180061555, "loss": 3.0068, "step": 17762 }, { "epoch": 0.48, "learning_rate": 0.0011216399256009201, "loss": 2.7285, "step": 17763 }, { "epoch": 0.48, "learning_rate": 0.0011215535322741626, "loss": 2.6269, "step": 17764 }, { "epoch": 0.48, "learning_rate": 0.0011214671380265374, "loss": 2.3955, "step": 17765 }, { "epoch": 0.48, "learning_rate": 0.0011213807428586988, "loss": 2.7768, "step": 17766 }, { "epoch": 0.48, "learning_rate": 0.0011212943467713015, "loss": 2.0386, "step": 17767 }, { "epoch": 0.48, "learning_rate": 0.0011212079497649997, "loss": 2.6128, "step": 17768 }, { "epoch": 0.48, "learning_rate": 0.0011211215518404482, "loss": 2.2814, "step": 17769 }, { "epoch": 0.48, "learning_rate": 0.0011210351529983016, "loss": 2.4737, "step": 17770 }, { "epoch": 0.48, "learning_rate": 0.0011209487532392141, "loss": 2.3483, "step": 17771 }, { "epoch": 0.48, "learning_rate": 0.0011208623525638406, "loss": 2.3491, "step": 17772 }, { "epoch": 0.48, "learning_rate": 0.0011207759509728355, "loss": 2.3024, "step": 17773 }, { "epoch": 0.48, "learning_rate": 0.0011206895484668535, "loss": 2.5098, "step": 17774 }, { "epoch": 0.48, "learning_rate": 0.0011206031450465492, "loss": 2.7756, "step": 17775 }, { "epoch": 0.48, "learning_rate": 0.0011205167407125768, "loss": 2.1472, "step": 17776 }, { "epoch": 0.48, "learning_rate": 0.001120430335465591, "loss": 2.7946, "step": 17777 }, { "epoch": 0.48, "learning_rate": 0.0011203439293062467, "loss": 2.2127, "step": 17778 }, { "epoch": 0.48, "learning_rate": 0.0011202575222351984, "loss": 2.3859, "step": 17779 }, { "epoch": 0.48, "learning_rate": 0.0011201711142531001, "loss": 2.3809, "step": 17780 }, { "epoch": 0.48, "learning_rate": 0.0011200847053606073, "loss": 2.6557, "step": 17781 }, { "epoch": 0.48, "learning_rate": 0.0011199982955583745, "loss": 2.3008, "step": 17782 }, { "epoch": 0.48, "learning_rate": 0.0011199118848470558, "loss": 2.5593, "step": 17783 }, { "epoch": 0.48, "learning_rate": 0.001119825473227306, "loss": 2.4457, "step": 17784 }, { "epoch": 0.48, "learning_rate": 0.0011197390606997799, "loss": 2.735, "step": 17785 }, { "epoch": 0.48, "learning_rate": 0.001119652647265132, "loss": 2.7428, "step": 17786 }, { "epoch": 0.48, "learning_rate": 0.0011195662329240173, "loss": 2.5315, "step": 17787 }, { "epoch": 0.48, "learning_rate": 0.00111947981767709, "loss": 2.2645, "step": 17788 }, { "epoch": 0.48, "learning_rate": 0.001119393401525005, "loss": 2.7251, "step": 17789 }, { "epoch": 0.48, "learning_rate": 0.001119306984468417, "loss": 2.115, "step": 17790 }, { "epoch": 0.48, "learning_rate": 0.0011192205665079805, "loss": 2.1879, "step": 17791 }, { "epoch": 0.48, "learning_rate": 0.0011191341476443504, "loss": 2.7526, "step": 17792 }, { "epoch": 0.48, "learning_rate": 0.0011190477278781813, "loss": 2.3023, "step": 17793 }, { "epoch": 0.48, "learning_rate": 0.001118961307210128, "loss": 2.314, "step": 17794 }, { "epoch": 0.48, "learning_rate": 0.0011188748856408447, "loss": 2.5056, "step": 17795 }, { "epoch": 0.48, "learning_rate": 0.0011187884631709867, "loss": 2.4706, "step": 17796 }, { "epoch": 0.48, "learning_rate": 0.0011187020398012086, "loss": 2.5857, "step": 17797 }, { "epoch": 0.48, "learning_rate": 0.0011186156155321655, "loss": 2.7903, "step": 17798 }, { "epoch": 0.48, "learning_rate": 0.0011185291903645109, "loss": 2.517, "step": 17799 }, { "epoch": 0.48, "learning_rate": 0.0011184427642989007, "loss": 2.7095, "step": 17800 }, { "epoch": 0.48, "learning_rate": 0.0011183563373359895, "loss": 2.8631, "step": 17801 }, { "epoch": 0.48, "learning_rate": 0.0011182699094764317, "loss": 2.5182, "step": 17802 }, { "epoch": 0.48, "learning_rate": 0.001118183480720882, "loss": 2.7289, "step": 17803 }, { "epoch": 0.48, "learning_rate": 0.0011180970510699956, "loss": 2.2768, "step": 17804 }, { "epoch": 0.48, "learning_rate": 0.0011180106205244272, "loss": 2.4863, "step": 17805 }, { "epoch": 0.48, "learning_rate": 0.001117924189084831, "loss": 2.3841, "step": 17806 }, { "epoch": 0.48, "learning_rate": 0.0011178377567518626, "loss": 2.7721, "step": 17807 }, { "epoch": 0.48, "learning_rate": 0.0011177513235261765, "loss": 2.4815, "step": 17808 }, { "epoch": 0.48, "learning_rate": 0.001117664889408427, "loss": 2.0944, "step": 17809 }, { "epoch": 0.48, "learning_rate": 0.0011175784543992697, "loss": 2.6183, "step": 17810 }, { "epoch": 0.48, "learning_rate": 0.0011174920184993588, "loss": 2.7817, "step": 17811 }, { "epoch": 0.48, "learning_rate": 0.0011174055817093497, "loss": 2.6017, "step": 17812 }, { "epoch": 0.48, "learning_rate": 0.0011173191440298966, "loss": 2.7444, "step": 17813 }, { "epoch": 0.48, "learning_rate": 0.001117232705461655, "loss": 2.7006, "step": 17814 }, { "epoch": 0.48, "learning_rate": 0.0011171462660052789, "loss": 2.3993, "step": 17815 }, { "epoch": 0.48, "learning_rate": 0.0011170598256614237, "loss": 2.1894, "step": 17816 }, { "epoch": 0.48, "learning_rate": 0.0011169733844307445, "loss": 2.8032, "step": 17817 }, { "epoch": 0.48, "learning_rate": 0.0011168869423138956, "loss": 2.8025, "step": 17818 }, { "epoch": 0.48, "learning_rate": 0.0011168004993115323, "loss": 2.4475, "step": 17819 }, { "epoch": 0.48, "learning_rate": 0.0011167140554243092, "loss": 2.3841, "step": 17820 }, { "epoch": 0.48, "learning_rate": 0.0011166276106528812, "loss": 2.3305, "step": 17821 }, { "epoch": 0.48, "learning_rate": 0.0011165411649979036, "loss": 2.7185, "step": 17822 }, { "epoch": 0.48, "learning_rate": 0.0011164547184600304, "loss": 2.5849, "step": 17823 }, { "epoch": 0.48, "learning_rate": 0.0011163682710399175, "loss": 2.501, "step": 17824 }, { "epoch": 0.48, "learning_rate": 0.0011162818227382194, "loss": 1.9884, "step": 17825 }, { "epoch": 0.48, "learning_rate": 0.0011161953735555907, "loss": 2.7129, "step": 17826 }, { "epoch": 0.48, "learning_rate": 0.0011161089234926868, "loss": 2.4031, "step": 17827 }, { "epoch": 0.48, "learning_rate": 0.0011160224725501626, "loss": 2.7148, "step": 17828 }, { "epoch": 0.48, "learning_rate": 0.0011159360207286728, "loss": 2.4921, "step": 17829 }, { "epoch": 0.48, "learning_rate": 0.0011158495680288723, "loss": 2.3798, "step": 17830 }, { "epoch": 0.48, "learning_rate": 0.0011157631144514165, "loss": 2.3587, "step": 17831 }, { "epoch": 0.48, "learning_rate": 0.00111567665999696, "loss": 2.4995, "step": 17832 }, { "epoch": 0.48, "learning_rate": 0.0011155902046661571, "loss": 2.2953, "step": 17833 }, { "epoch": 0.48, "learning_rate": 0.0011155037484596641, "loss": 2.7474, "step": 17834 }, { "epoch": 0.48, "learning_rate": 0.0011154172913781352, "loss": 2.0919, "step": 17835 }, { "epoch": 0.48, "learning_rate": 0.0011153308334222256, "loss": 2.462, "step": 17836 }, { "epoch": 0.48, "learning_rate": 0.0011152443745925905, "loss": 2.7884, "step": 17837 }, { "epoch": 0.48, "learning_rate": 0.0011151579148898842, "loss": 2.6023, "step": 17838 }, { "epoch": 0.48, "learning_rate": 0.0011150714543147623, "loss": 2.0992, "step": 17839 }, { "epoch": 0.48, "learning_rate": 0.0011149849928678796, "loss": 2.5676, "step": 17840 }, { "epoch": 0.48, "learning_rate": 0.0011148985305498914, "loss": 2.8018, "step": 17841 }, { "epoch": 0.48, "learning_rate": 0.0011148120673614519, "loss": 2.4751, "step": 17842 }, { "epoch": 0.48, "learning_rate": 0.0011147256033032168, "loss": 3.0501, "step": 17843 }, { "epoch": 0.48, "learning_rate": 0.0011146391383758416, "loss": 2.6767, "step": 17844 }, { "epoch": 0.48, "learning_rate": 0.0011145526725799806, "loss": 2.3955, "step": 17845 }, { "epoch": 0.48, "learning_rate": 0.0011144662059162885, "loss": 2.1651, "step": 17846 }, { "epoch": 0.48, "learning_rate": 0.0011143797383854216, "loss": 2.7213, "step": 17847 }, { "epoch": 0.48, "learning_rate": 0.001114293269988034, "loss": 2.9216, "step": 17848 }, { "epoch": 0.48, "learning_rate": 0.0011142068007247807, "loss": 2.4757, "step": 17849 }, { "epoch": 0.48, "learning_rate": 0.0011141203305963172, "loss": 2.8197, "step": 17850 }, { "epoch": 0.48, "learning_rate": 0.0011140338596032989, "loss": 2.452, "step": 17851 }, { "epoch": 0.48, "learning_rate": 0.00111394738774638, "loss": 2.6506, "step": 17852 }, { "epoch": 0.48, "learning_rate": 0.0011138609150262164, "loss": 2.5007, "step": 17853 }, { "epoch": 0.48, "learning_rate": 0.0011137744414434626, "loss": 2.5743, "step": 17854 }, { "epoch": 0.48, "learning_rate": 0.0011136879669987742, "loss": 2.5862, "step": 17855 }, { "epoch": 0.48, "learning_rate": 0.001113601491692806, "loss": 2.8965, "step": 17856 }, { "epoch": 0.48, "learning_rate": 0.001113515015526213, "loss": 2.6234, "step": 17857 }, { "epoch": 0.48, "learning_rate": 0.0011134285384996508, "loss": 2.2003, "step": 17858 }, { "epoch": 0.48, "learning_rate": 0.001113342060613774, "loss": 2.7055, "step": 17859 }, { "epoch": 0.48, "learning_rate": 0.0011132555818692382, "loss": 2.4858, "step": 17860 }, { "epoch": 0.48, "learning_rate": 0.0011131691022666988, "loss": 2.8639, "step": 17861 }, { "epoch": 0.48, "learning_rate": 0.0011130826218068096, "loss": 3.0645, "step": 17862 }, { "epoch": 0.48, "learning_rate": 0.0011129961404902273, "loss": 2.8687, "step": 17863 }, { "epoch": 0.48, "learning_rate": 0.0011129096583176064, "loss": 2.5998, "step": 17864 }, { "epoch": 0.48, "learning_rate": 0.0011128231752896018, "loss": 2.6622, "step": 17865 }, { "epoch": 0.48, "learning_rate": 0.0011127366914068693, "loss": 2.7502, "step": 17866 }, { "epoch": 0.48, "learning_rate": 0.0011126502066700636, "loss": 2.4289, "step": 17867 }, { "epoch": 0.48, "learning_rate": 0.0011125637210798406, "loss": 2.4387, "step": 17868 }, { "epoch": 0.48, "learning_rate": 0.001112477234636854, "loss": 2.6728, "step": 17869 }, { "epoch": 0.48, "learning_rate": 0.0011123907473417607, "loss": 2.3646, "step": 17870 }, { "epoch": 0.48, "learning_rate": 0.0011123042591952151, "loss": 2.6119, "step": 17871 }, { "epoch": 0.48, "learning_rate": 0.0011122177701978723, "loss": 2.6374, "step": 17872 }, { "epoch": 0.48, "learning_rate": 0.0011121312803503878, "loss": 2.5645, "step": 17873 }, { "epoch": 0.48, "learning_rate": 0.0011120447896534168, "loss": 2.669, "step": 17874 }, { "epoch": 0.48, "learning_rate": 0.0011119582981076147, "loss": 2.3199, "step": 17875 }, { "epoch": 0.48, "learning_rate": 0.0011118718057136364, "loss": 2.7917, "step": 17876 }, { "epoch": 0.48, "learning_rate": 0.001111785312472137, "loss": 2.8094, "step": 17877 }, { "epoch": 0.48, "learning_rate": 0.0011116988183837724, "loss": 2.6731, "step": 17878 }, { "epoch": 0.48, "learning_rate": 0.0011116123234491974, "loss": 2.9266, "step": 17879 }, { "epoch": 0.48, "learning_rate": 0.0011115258276690675, "loss": 2.4685, "step": 17880 }, { "epoch": 0.48, "learning_rate": 0.0011114393310440378, "loss": 2.5977, "step": 17881 }, { "epoch": 0.48, "learning_rate": 0.0011113528335747636, "loss": 2.652, "step": 17882 }, { "epoch": 0.48, "learning_rate": 0.0011112663352619003, "loss": 2.5091, "step": 17883 }, { "epoch": 0.48, "learning_rate": 0.0011111798361061033, "loss": 2.5196, "step": 17884 }, { "epoch": 0.48, "learning_rate": 0.0011110933361080275, "loss": 2.4519, "step": 17885 }, { "epoch": 0.48, "learning_rate": 0.0011110068352683286, "loss": 2.4494, "step": 17886 }, { "epoch": 0.48, "learning_rate": 0.0011109203335876617, "loss": 2.4053, "step": 17887 }, { "epoch": 0.48, "learning_rate": 0.0011108338310666824, "loss": 2.9039, "step": 17888 }, { "epoch": 0.48, "learning_rate": 0.001110747327706045, "loss": 2.6939, "step": 17889 }, { "epoch": 0.48, "learning_rate": 0.0011106608235064064, "loss": 2.0932, "step": 17890 }, { "epoch": 0.48, "learning_rate": 0.0011105743184684211, "loss": 2.4526, "step": 17891 }, { "epoch": 0.48, "learning_rate": 0.0011104878125927445, "loss": 2.3166, "step": 17892 }, { "epoch": 0.48, "learning_rate": 0.0011104013058800318, "loss": 2.6446, "step": 17893 }, { "epoch": 0.48, "learning_rate": 0.0011103147983309387, "loss": 2.66, "step": 17894 }, { "epoch": 0.48, "learning_rate": 0.0011102282899461205, "loss": 2.4852, "step": 17895 }, { "epoch": 0.48, "learning_rate": 0.0011101417807262324, "loss": 2.5947, "step": 17896 }, { "epoch": 0.48, "learning_rate": 0.0011100552706719297, "loss": 2.5078, "step": 17897 }, { "epoch": 0.48, "learning_rate": 0.0011099687597838682, "loss": 2.7785, "step": 17898 }, { "epoch": 0.48, "learning_rate": 0.001109882248062703, "loss": 2.3817, "step": 17899 }, { "epoch": 0.48, "learning_rate": 0.0011097957355090894, "loss": 2.3518, "step": 17900 }, { "epoch": 0.48, "learning_rate": 0.001109709222123683, "loss": 2.4111, "step": 17901 }, { "epoch": 0.48, "learning_rate": 0.001109622707907139, "loss": 2.3275, "step": 17902 }, { "epoch": 0.48, "learning_rate": 0.001109536192860113, "loss": 2.1023, "step": 17903 }, { "epoch": 0.48, "learning_rate": 0.0011094496769832604, "loss": 2.441, "step": 17904 }, { "epoch": 0.48, "learning_rate": 0.001109363160277237, "loss": 2.1769, "step": 17905 }, { "epoch": 0.48, "learning_rate": 0.0011092766427426974, "loss": 2.721, "step": 17906 }, { "epoch": 0.48, "learning_rate": 0.0011091901243802979, "loss": 2.3285, "step": 17907 }, { "epoch": 0.48, "learning_rate": 0.001109103605190693, "loss": 2.5304, "step": 17908 }, { "epoch": 0.48, "learning_rate": 0.001109017085174539, "loss": 2.4836, "step": 17909 }, { "epoch": 0.48, "learning_rate": 0.001108930564332491, "loss": 2.8377, "step": 17910 }, { "epoch": 0.48, "learning_rate": 0.0011088440426652046, "loss": 2.2032, "step": 17911 }, { "epoch": 0.48, "learning_rate": 0.0011087575201733349, "loss": 2.4816, "step": 17912 }, { "epoch": 0.48, "learning_rate": 0.0011086709968575379, "loss": 2.5056, "step": 17913 }, { "epoch": 0.48, "learning_rate": 0.001108584472718469, "loss": 2.5373, "step": 17914 }, { "epoch": 0.48, "learning_rate": 0.0011084979477567834, "loss": 2.9405, "step": 17915 }, { "epoch": 0.48, "learning_rate": 0.0011084114219731367, "loss": 2.5863, "step": 17916 }, { "epoch": 0.48, "learning_rate": 0.0011083248953681847, "loss": 2.1974, "step": 17917 }, { "epoch": 0.48, "learning_rate": 0.0011082383679425823, "loss": 2.728, "step": 17918 }, { "epoch": 0.48, "learning_rate": 0.0011081518396969857, "loss": 2.4301, "step": 17919 }, { "epoch": 0.48, "learning_rate": 0.0011080653106320497, "loss": 2.6283, "step": 17920 }, { "epoch": 0.48, "learning_rate": 0.0011079787807484307, "loss": 2.5321, "step": 17921 }, { "epoch": 0.48, "learning_rate": 0.0011078922500467835, "loss": 2.5469, "step": 17922 }, { "epoch": 0.48, "learning_rate": 0.0011078057185277639, "loss": 2.4974, "step": 17923 }, { "epoch": 0.48, "learning_rate": 0.0011077191861920276, "loss": 2.9072, "step": 17924 }, { "epoch": 0.48, "learning_rate": 0.0011076326530402296, "loss": 2.7089, "step": 17925 }, { "epoch": 0.48, "learning_rate": 0.0011075461190730262, "loss": 2.7284, "step": 17926 }, { "epoch": 0.48, "learning_rate": 0.0011074595842910729, "loss": 2.2796, "step": 17927 }, { "epoch": 0.48, "learning_rate": 0.0011073730486950244, "loss": 2.3757, "step": 17928 }, { "epoch": 0.48, "learning_rate": 0.0011072865122855372, "loss": 2.606, "step": 17929 }, { "epoch": 0.48, "learning_rate": 0.0011071999750632664, "loss": 2.5825, "step": 17930 }, { "epoch": 0.48, "learning_rate": 0.0011071134370288678, "loss": 2.7487, "step": 17931 }, { "epoch": 0.48, "learning_rate": 0.001107026898182997, "loss": 2.7934, "step": 17932 }, { "epoch": 0.48, "learning_rate": 0.0011069403585263098, "loss": 2.4584, "step": 17933 }, { "epoch": 0.48, "learning_rate": 0.0011068538180594614, "loss": 2.6959, "step": 17934 }, { "epoch": 0.48, "learning_rate": 0.0011067672767831073, "loss": 2.5458, "step": 17935 }, { "epoch": 0.48, "learning_rate": 0.0011066807346979035, "loss": 2.2481, "step": 17936 }, { "epoch": 0.48, "learning_rate": 0.001106594191804506, "loss": 2.4792, "step": 17937 }, { "epoch": 0.48, "learning_rate": 0.0011065076481035694, "loss": 2.6825, "step": 17938 }, { "epoch": 0.48, "learning_rate": 0.00110642110359575, "loss": 2.268, "step": 17939 }, { "epoch": 0.48, "learning_rate": 0.0011063345582817035, "loss": 2.5069, "step": 17940 }, { "epoch": 0.48, "learning_rate": 0.0011062480121620856, "loss": 2.3871, "step": 17941 }, { "epoch": 0.48, "learning_rate": 0.0011061614652375514, "loss": 2.6092, "step": 17942 }, { "epoch": 0.48, "learning_rate": 0.001106074917508757, "loss": 2.5851, "step": 17943 }, { "epoch": 0.48, "learning_rate": 0.001105988368976358, "loss": 2.5877, "step": 17944 }, { "epoch": 0.48, "learning_rate": 0.00110590181964101, "loss": 2.4763, "step": 17945 }, { "epoch": 0.48, "learning_rate": 0.001105815269503369, "loss": 2.7502, "step": 17946 }, { "epoch": 0.48, "learning_rate": 0.00110572871856409, "loss": 2.4686, "step": 17947 }, { "epoch": 0.48, "learning_rate": 0.0011056421668238295, "loss": 2.5701, "step": 17948 }, { "epoch": 0.48, "learning_rate": 0.0011055556142832428, "loss": 2.6243, "step": 17949 }, { "epoch": 0.48, "learning_rate": 0.0011054690609429857, "loss": 2.3517, "step": 17950 }, { "epoch": 0.48, "learning_rate": 0.0011053825068037136, "loss": 2.5497, "step": 17951 }, { "epoch": 0.48, "learning_rate": 0.0011052959518660823, "loss": 2.6973, "step": 17952 }, { "epoch": 0.48, "learning_rate": 0.001105209396130748, "loss": 2.8239, "step": 17953 }, { "epoch": 0.48, "learning_rate": 0.0011051228395983664, "loss": 2.9068, "step": 17954 }, { "epoch": 0.48, "learning_rate": 0.0011050362822695922, "loss": 2.5289, "step": 17955 }, { "epoch": 0.48, "learning_rate": 0.0011049497241450827, "loss": 2.4885, "step": 17956 }, { "epoch": 0.48, "learning_rate": 0.0011048631652254926, "loss": 2.3867, "step": 17957 }, { "epoch": 0.48, "learning_rate": 0.0011047766055114778, "loss": 2.3428, "step": 17958 }, { "epoch": 0.48, "learning_rate": 0.001104690045003694, "loss": 2.1343, "step": 17959 }, { "epoch": 0.48, "learning_rate": 0.0011046034837027974, "loss": 2.7939, "step": 17960 }, { "epoch": 0.48, "learning_rate": 0.0011045169216094435, "loss": 2.1574, "step": 17961 }, { "epoch": 0.48, "learning_rate": 0.0011044303587242881, "loss": 2.7768, "step": 17962 }, { "epoch": 0.48, "learning_rate": 0.001104343795047987, "loss": 2.8994, "step": 17963 }, { "epoch": 0.48, "learning_rate": 0.0011042572305811958, "loss": 2.5973, "step": 17964 }, { "epoch": 0.48, "learning_rate": 0.0011041706653245704, "loss": 2.203, "step": 17965 }, { "epoch": 0.48, "learning_rate": 0.0011040840992787668, "loss": 2.4232, "step": 17966 }, { "epoch": 0.48, "learning_rate": 0.0011039975324444408, "loss": 2.4914, "step": 17967 }, { "epoch": 0.48, "learning_rate": 0.0011039109648222478, "loss": 2.5043, "step": 17968 }, { "epoch": 0.48, "learning_rate": 0.001103824396412844, "loss": 2.4401, "step": 17969 }, { "epoch": 0.48, "learning_rate": 0.0011037378272168855, "loss": 2.4437, "step": 17970 }, { "epoch": 0.48, "learning_rate": 0.0011036512572350273, "loss": 2.9121, "step": 17971 }, { "epoch": 0.48, "learning_rate": 0.0011035646864679257, "loss": 2.2194, "step": 17972 }, { "epoch": 0.48, "learning_rate": 0.0011034781149162369, "loss": 2.3611, "step": 17973 }, { "epoch": 0.48, "learning_rate": 0.001103391542580616, "loss": 2.5471, "step": 17974 }, { "epoch": 0.48, "learning_rate": 0.0011033049694617195, "loss": 2.5058, "step": 17975 }, { "epoch": 0.48, "learning_rate": 0.001103218395560203, "loss": 2.3623, "step": 17976 }, { "epoch": 0.48, "learning_rate": 0.0011031318208767227, "loss": 2.336, "step": 17977 }, { "epoch": 0.48, "learning_rate": 0.0011030452454119336, "loss": 2.3157, "step": 17978 }, { "epoch": 0.48, "learning_rate": 0.0011029586691664924, "loss": 2.7327, "step": 17979 }, { "epoch": 0.48, "learning_rate": 0.001102872092141055, "loss": 1.9975, "step": 17980 }, { "epoch": 0.48, "learning_rate": 0.0011027855143362765, "loss": 2.2511, "step": 17981 }, { "epoch": 0.48, "learning_rate": 0.0011026989357528134, "loss": 2.4783, "step": 17982 }, { "epoch": 0.48, "learning_rate": 0.0011026123563913218, "loss": 2.4036, "step": 17983 }, { "epoch": 0.48, "learning_rate": 0.0011025257762524575, "loss": 2.1277, "step": 17984 }, { "epoch": 0.48, "learning_rate": 0.0011024391953368758, "loss": 2.5785, "step": 17985 }, { "epoch": 0.48, "learning_rate": 0.0011023526136452332, "loss": 2.5344, "step": 17986 }, { "epoch": 0.48, "learning_rate": 0.0011022660311781857, "loss": 2.7093, "step": 17987 }, { "epoch": 0.48, "learning_rate": 0.0011021794479363885, "loss": 2.2885, "step": 17988 }, { "epoch": 0.48, "learning_rate": 0.0011020928639204986, "loss": 2.5126, "step": 17989 }, { "epoch": 0.48, "learning_rate": 0.001102006279131171, "loss": 2.6738, "step": 17990 }, { "epoch": 0.48, "learning_rate": 0.0011019196935690625, "loss": 2.967, "step": 17991 }, { "epoch": 0.48, "learning_rate": 0.0011018331072348284, "loss": 2.3395, "step": 17992 }, { "epoch": 0.48, "learning_rate": 0.0011017465201291253, "loss": 2.6402, "step": 17993 }, { "epoch": 0.48, "learning_rate": 0.0011016599322526083, "loss": 2.5602, "step": 17994 }, { "epoch": 0.48, "learning_rate": 0.0011015733436059336, "loss": 2.5561, "step": 17995 }, { "epoch": 0.48, "learning_rate": 0.001101486754189758, "loss": 2.2256, "step": 17996 }, { "epoch": 0.48, "learning_rate": 0.0011014001640047364, "loss": 2.803, "step": 17997 }, { "epoch": 0.48, "learning_rate": 0.0011013135730515253, "loss": 2.3235, "step": 17998 }, { "epoch": 0.48, "learning_rate": 0.0011012269813307812, "loss": 2.715, "step": 17999 }, { "epoch": 0.48, "learning_rate": 0.0011011403888431593, "loss": 2.572, "step": 18000 }, { "epoch": 0.48, "learning_rate": 0.0011010537955893158, "loss": 2.8497, "step": 18001 }, { "epoch": 0.48, "learning_rate": 0.0011009672015699068, "loss": 2.3228, "step": 18002 }, { "epoch": 0.48, "learning_rate": 0.0011008806067855886, "loss": 2.65, "step": 18003 }, { "epoch": 0.48, "learning_rate": 0.0011007940112370165, "loss": 2.3506, "step": 18004 }, { "epoch": 0.48, "learning_rate": 0.0011007074149248475, "loss": 2.708, "step": 18005 }, { "epoch": 0.48, "learning_rate": 0.0011006208178497368, "loss": 2.2433, "step": 18006 }, { "epoch": 0.48, "learning_rate": 0.0011005342200123408, "loss": 2.4219, "step": 18007 }, { "epoch": 0.48, "learning_rate": 0.0011004476214133156, "loss": 2.4882, "step": 18008 }, { "epoch": 0.48, "learning_rate": 0.0011003610220533173, "loss": 2.6118, "step": 18009 }, { "epoch": 0.48, "learning_rate": 0.0011002744219330016, "loss": 2.5706, "step": 18010 }, { "epoch": 0.48, "learning_rate": 0.0011001878210530247, "loss": 2.5564, "step": 18011 }, { "epoch": 0.48, "learning_rate": 0.0011001012194140432, "loss": 2.4887, "step": 18012 }, { "epoch": 0.48, "learning_rate": 0.0011000146170167125, "loss": 2.0065, "step": 18013 }, { "epoch": 0.48, "learning_rate": 0.001099928013861689, "loss": 2.6985, "step": 18014 }, { "epoch": 0.48, "learning_rate": 0.0010998414099496288, "loss": 2.7701, "step": 18015 }, { "epoch": 0.48, "learning_rate": 0.001099754805281188, "loss": 3.0419, "step": 18016 }, { "epoch": 0.48, "learning_rate": 0.0010996681998570225, "loss": 2.5582, "step": 18017 }, { "epoch": 0.48, "learning_rate": 0.0010995815936777882, "loss": 2.5765, "step": 18018 }, { "epoch": 0.48, "learning_rate": 0.001099494986744142, "loss": 2.81, "step": 18019 }, { "epoch": 0.48, "learning_rate": 0.0010994083790567394, "loss": 3.2125, "step": 18020 }, { "epoch": 0.48, "learning_rate": 0.0010993217706162365, "loss": 2.5036, "step": 18021 }, { "epoch": 0.48, "learning_rate": 0.0010992351614232902, "loss": 2.512, "step": 18022 }, { "epoch": 0.48, "learning_rate": 0.0010991485514785558, "loss": 2.7115, "step": 18023 }, { "epoch": 0.48, "learning_rate": 0.0010990619407826893, "loss": 2.7013, "step": 18024 }, { "epoch": 0.48, "learning_rate": 0.0010989753293363476, "loss": 2.324, "step": 18025 }, { "epoch": 0.48, "learning_rate": 0.0010988887171401865, "loss": 2.4344, "step": 18026 }, { "epoch": 0.48, "learning_rate": 0.0010988021041948622, "loss": 2.2236, "step": 18027 }, { "epoch": 0.48, "learning_rate": 0.0010987154905010307, "loss": 2.3734, "step": 18028 }, { "epoch": 0.48, "learning_rate": 0.001098628876059348, "loss": 2.3427, "step": 18029 }, { "epoch": 0.48, "learning_rate": 0.0010985422608704712, "loss": 2.1962, "step": 18030 }, { "epoch": 0.48, "learning_rate": 0.0010984556449350556, "loss": 2.5124, "step": 18031 }, { "epoch": 0.48, "learning_rate": 0.0010983690282537575, "loss": 2.5924, "step": 18032 }, { "epoch": 0.48, "learning_rate": 0.0010982824108272332, "loss": 2.6551, "step": 18033 }, { "epoch": 0.48, "learning_rate": 0.001098195792656139, "loss": 2.648, "step": 18034 }, { "epoch": 0.48, "learning_rate": 0.0010981091737411312, "loss": 2.8386, "step": 18035 }, { "epoch": 0.48, "learning_rate": 0.0010980225540828659, "loss": 2.6347, "step": 18036 }, { "epoch": 0.48, "learning_rate": 0.0010979359336819989, "loss": 3.0201, "step": 18037 }, { "epoch": 0.48, "learning_rate": 0.001097849312539187, "loss": 2.5985, "step": 18038 }, { "epoch": 0.48, "learning_rate": 0.0010977626906550862, "loss": 2.3525, "step": 18039 }, { "epoch": 0.48, "learning_rate": 0.0010976760680303525, "loss": 2.1198, "step": 18040 }, { "epoch": 0.48, "learning_rate": 0.0010975894446656426, "loss": 2.1019, "step": 18041 }, { "epoch": 0.48, "learning_rate": 0.0010975028205616123, "loss": 2.1579, "step": 18042 }, { "epoch": 0.48, "learning_rate": 0.0010974161957189186, "loss": 2.687, "step": 18043 }, { "epoch": 0.48, "learning_rate": 0.0010973295701382166, "loss": 2.6126, "step": 18044 }, { "epoch": 0.48, "learning_rate": 0.0010972429438201635, "loss": 2.4274, "step": 18045 }, { "epoch": 0.48, "learning_rate": 0.0010971563167654153, "loss": 2.2699, "step": 18046 }, { "epoch": 0.48, "learning_rate": 0.001097069688974628, "loss": 2.1777, "step": 18047 }, { "epoch": 0.49, "learning_rate": 0.001096983060448458, "loss": 2.9669, "step": 18048 }, { "epoch": 0.49, "learning_rate": 0.001096896431187562, "loss": 2.2885, "step": 18049 }, { "epoch": 0.49, "learning_rate": 0.0010968098011925958, "loss": 2.6049, "step": 18050 }, { "epoch": 0.49, "learning_rate": 0.0010967231704642158, "loss": 2.4747, "step": 18051 }, { "epoch": 0.49, "learning_rate": 0.0010966365390030783, "loss": 2.6313, "step": 18052 }, { "epoch": 0.49, "learning_rate": 0.00109654990680984, "loss": 2.5402, "step": 18053 }, { "epoch": 0.49, "learning_rate": 0.0010964632738851565, "loss": 2.7923, "step": 18054 }, { "epoch": 0.49, "learning_rate": 0.0010963766402296846, "loss": 2.4942, "step": 18055 }, { "epoch": 0.49, "learning_rate": 0.0010962900058440806, "loss": 3.1168, "step": 18056 }, { "epoch": 0.49, "learning_rate": 0.0010962033707290005, "loss": 2.232, "step": 18057 }, { "epoch": 0.49, "learning_rate": 0.0010961167348851012, "loss": 2.2626, "step": 18058 }, { "epoch": 0.49, "learning_rate": 0.0010960300983130387, "loss": 2.4161, "step": 18059 }, { "epoch": 0.49, "learning_rate": 0.0010959434610134688, "loss": 2.8082, "step": 18060 }, { "epoch": 0.49, "learning_rate": 0.0010958568229870488, "loss": 2.4929, "step": 18061 }, { "epoch": 0.49, "learning_rate": 0.0010957701842344348, "loss": 2.7569, "step": 18062 }, { "epoch": 0.49, "learning_rate": 0.001095683544756283, "loss": 2.309, "step": 18063 }, { "epoch": 0.49, "learning_rate": 0.0010955969045532493, "loss": 2.3344, "step": 18064 }, { "epoch": 0.49, "learning_rate": 0.0010955102636259909, "loss": 2.4688, "step": 18065 }, { "epoch": 0.49, "learning_rate": 0.0010954236219751637, "loss": 2.5312, "step": 18066 }, { "epoch": 0.49, "learning_rate": 0.001095336979601424, "loss": 2.7815, "step": 18067 }, { "epoch": 0.49, "learning_rate": 0.0010952503365054286, "loss": 2.3379, "step": 18068 }, { "epoch": 0.49, "learning_rate": 0.0010951636926878339, "loss": 2.8285, "step": 18069 }, { "epoch": 0.49, "learning_rate": 0.0010950770481492958, "loss": 2.6858, "step": 18070 }, { "epoch": 0.49, "learning_rate": 0.001094990402890471, "loss": 2.4881, "step": 18071 }, { "epoch": 0.49, "learning_rate": 0.001094903756912016, "loss": 1.972, "step": 18072 }, { "epoch": 0.49, "learning_rate": 0.0010948171102145871, "loss": 2.4768, "step": 18073 }, { "epoch": 0.49, "learning_rate": 0.0010947304627988408, "loss": 2.1493, "step": 18074 }, { "epoch": 0.49, "learning_rate": 0.0010946438146654334, "loss": 2.7782, "step": 18075 }, { "epoch": 0.49, "learning_rate": 0.0010945571658150213, "loss": 2.3699, "step": 18076 }, { "epoch": 0.49, "learning_rate": 0.0010944705162482609, "loss": 2.8286, "step": 18077 }, { "epoch": 0.49, "learning_rate": 0.001094383865965809, "loss": 2.3041, "step": 18078 }, { "epoch": 0.49, "learning_rate": 0.001094297214968322, "loss": 2.5795, "step": 18079 }, { "epoch": 0.49, "learning_rate": 0.0010942105632564553, "loss": 2.1398, "step": 18080 }, { "epoch": 0.49, "learning_rate": 0.001094123910830867, "loss": 2.478, "step": 18081 }, { "epoch": 0.49, "learning_rate": 0.0010940372576922126, "loss": 2.3463, "step": 18082 }, { "epoch": 0.49, "learning_rate": 0.0010939506038411487, "loss": 2.9084, "step": 18083 }, { "epoch": 0.49, "learning_rate": 0.0010938639492783318, "loss": 2.7875, "step": 18084 }, { "epoch": 0.49, "learning_rate": 0.0010937772940044185, "loss": 2.3511, "step": 18085 }, { "epoch": 0.49, "learning_rate": 0.001093690638020065, "loss": 2.4969, "step": 18086 }, { "epoch": 0.49, "learning_rate": 0.001093603981325928, "loss": 2.3571, "step": 18087 }, { "epoch": 0.49, "learning_rate": 0.001093517323922664, "loss": 2.7315, "step": 18088 }, { "epoch": 0.49, "learning_rate": 0.0010934306658109297, "loss": 2.5994, "step": 18089 }, { "epoch": 0.49, "learning_rate": 0.0010933440069913812, "loss": 2.3935, "step": 18090 }, { "epoch": 0.49, "learning_rate": 0.001093257347464675, "loss": 2.8266, "step": 18091 }, { "epoch": 0.49, "learning_rate": 0.0010931706872314682, "loss": 2.4936, "step": 18092 }, { "epoch": 0.49, "learning_rate": 0.0010930840262924166, "loss": 2.8671, "step": 18093 }, { "epoch": 0.49, "learning_rate": 0.0010929973646481774, "loss": 2.4593, "step": 18094 }, { "epoch": 0.49, "learning_rate": 0.0010929107022994065, "loss": 2.4165, "step": 18095 }, { "epoch": 0.49, "learning_rate": 0.001092824039246761, "loss": 2.4143, "step": 18096 }, { "epoch": 0.49, "learning_rate": 0.001092737375490897, "loss": 2.4522, "step": 18097 }, { "epoch": 0.49, "learning_rate": 0.001092650711032471, "loss": 2.4275, "step": 18098 }, { "epoch": 0.49, "learning_rate": 0.00109256404587214, "loss": 2.9312, "step": 18099 }, { "epoch": 0.49, "learning_rate": 0.0010924773800105602, "loss": 2.5118, "step": 18100 }, { "epoch": 0.49, "learning_rate": 0.0010923907134483886, "loss": 2.3735, "step": 18101 }, { "epoch": 0.49, "learning_rate": 0.0010923040461862815, "loss": 2.5689, "step": 18102 }, { "epoch": 0.49, "learning_rate": 0.0010922173782248951, "loss": 2.5714, "step": 18103 }, { "epoch": 0.49, "learning_rate": 0.0010921307095648864, "loss": 2.3204, "step": 18104 }, { "epoch": 0.49, "learning_rate": 0.0010920440402069121, "loss": 2.3407, "step": 18105 }, { "epoch": 0.49, "learning_rate": 0.0010919573701516285, "loss": 2.3576, "step": 18106 }, { "epoch": 0.49, "learning_rate": 0.0010918706993996922, "loss": 2.6356, "step": 18107 }, { "epoch": 0.49, "learning_rate": 0.0010917840279517602, "loss": 2.697, "step": 18108 }, { "epoch": 0.49, "learning_rate": 0.0010916973558084886, "loss": 2.8138, "step": 18109 }, { "epoch": 0.49, "learning_rate": 0.0010916106829705343, "loss": 2.4516, "step": 18110 }, { "epoch": 0.49, "learning_rate": 0.0010915240094385536, "loss": 2.269, "step": 18111 }, { "epoch": 0.49, "learning_rate": 0.0010914373352132038, "loss": 2.71, "step": 18112 }, { "epoch": 0.49, "learning_rate": 0.0010913506602951409, "loss": 2.2693, "step": 18113 }, { "epoch": 0.49, "learning_rate": 0.0010912639846850215, "loss": 2.6231, "step": 18114 }, { "epoch": 0.49, "learning_rate": 0.0010911773083835028, "loss": 2.5865, "step": 18115 }, { "epoch": 0.49, "learning_rate": 0.001091090631391241, "loss": 2.5964, "step": 18116 }, { "epoch": 0.49, "learning_rate": 0.0010910039537088928, "loss": 2.6481, "step": 18117 }, { "epoch": 0.49, "learning_rate": 0.0010909172753371151, "loss": 2.2661, "step": 18118 }, { "epoch": 0.49, "learning_rate": 0.001090830596276564, "loss": 2.4532, "step": 18119 }, { "epoch": 0.49, "learning_rate": 0.0010907439165278967, "loss": 2.1849, "step": 18120 }, { "epoch": 0.49, "learning_rate": 0.00109065723609177, "loss": 2.4397, "step": 18121 }, { "epoch": 0.49, "learning_rate": 0.0010905705549688403, "loss": 2.7863, "step": 18122 }, { "epoch": 0.49, "learning_rate": 0.0010904838731597636, "loss": 2.6513, "step": 18123 }, { "epoch": 0.49, "learning_rate": 0.001090397190665198, "loss": 2.5166, "step": 18124 }, { "epoch": 0.49, "learning_rate": 0.001090310507485799, "loss": 2.7846, "step": 18125 }, { "epoch": 0.49, "learning_rate": 0.001090223823622224, "loss": 2.6504, "step": 18126 }, { "epoch": 0.49, "learning_rate": 0.0010901371390751292, "loss": 2.7213, "step": 18127 }, { "epoch": 0.49, "learning_rate": 0.0010900504538451717, "loss": 2.3336, "step": 18128 }, { "epoch": 0.49, "learning_rate": 0.0010899637679330084, "loss": 2.4214, "step": 18129 }, { "epoch": 0.49, "learning_rate": 0.0010898770813392948, "loss": 2.6971, "step": 18130 }, { "epoch": 0.49, "learning_rate": 0.001089790394064689, "loss": 2.6931, "step": 18131 }, { "epoch": 0.49, "learning_rate": 0.0010897037061098475, "loss": 3.1359, "step": 18132 }, { "epoch": 0.49, "learning_rate": 0.0010896170174754265, "loss": 2.3997, "step": 18133 }, { "epoch": 0.49, "learning_rate": 0.0010895303281620828, "loss": 2.372, "step": 18134 }, { "epoch": 0.49, "learning_rate": 0.0010894436381704738, "loss": 2.1442, "step": 18135 }, { "epoch": 0.49, "learning_rate": 0.0010893569475012553, "loss": 2.4355, "step": 18136 }, { "epoch": 0.49, "learning_rate": 0.0010892702561550848, "loss": 2.6988, "step": 18137 }, { "epoch": 0.49, "learning_rate": 0.001089183564132619, "loss": 2.0275, "step": 18138 }, { "epoch": 0.49, "learning_rate": 0.0010890968714345143, "loss": 2.8445, "step": 18139 }, { "epoch": 0.49, "learning_rate": 0.0010890101780614274, "loss": 2.4063, "step": 18140 }, { "epoch": 0.49, "learning_rate": 0.0010889234840140154, "loss": 2.6396, "step": 18141 }, { "epoch": 0.49, "learning_rate": 0.0010888367892929352, "loss": 2.5186, "step": 18142 }, { "epoch": 0.49, "learning_rate": 0.001088750093898843, "loss": 3.0067, "step": 18143 }, { "epoch": 0.49, "learning_rate": 0.0010886633978323963, "loss": 2.4926, "step": 18144 }, { "epoch": 0.49, "learning_rate": 0.0010885767010942516, "loss": 2.5121, "step": 18145 }, { "epoch": 0.49, "learning_rate": 0.0010884900036850654, "loss": 2.9278, "step": 18146 }, { "epoch": 0.49, "learning_rate": 0.0010884033056054946, "loss": 2.5095, "step": 18147 }, { "epoch": 0.49, "learning_rate": 0.0010883166068561966, "loss": 2.3521, "step": 18148 }, { "epoch": 0.49, "learning_rate": 0.0010882299074378274, "loss": 2.6384, "step": 18149 }, { "epoch": 0.49, "learning_rate": 0.0010881432073510443, "loss": 2.474, "step": 18150 }, { "epoch": 0.49, "learning_rate": 0.0010880565065965043, "loss": 2.2459, "step": 18151 }, { "epoch": 0.49, "learning_rate": 0.0010879698051748637, "loss": 3.0087, "step": 18152 }, { "epoch": 0.49, "learning_rate": 0.0010878831030867796, "loss": 2.628, "step": 18153 }, { "epoch": 0.49, "learning_rate": 0.0010877964003329086, "loss": 2.8704, "step": 18154 }, { "epoch": 0.49, "learning_rate": 0.0010877096969139082, "loss": 2.3192, "step": 18155 }, { "epoch": 0.49, "learning_rate": 0.0010876229928304347, "loss": 2.6548, "step": 18156 }, { "epoch": 0.49, "learning_rate": 0.001087536288083145, "loss": 2.7597, "step": 18157 }, { "epoch": 0.49, "learning_rate": 0.0010874495826726958, "loss": 2.3786, "step": 18158 }, { "epoch": 0.49, "learning_rate": 0.0010873628765997445, "loss": 2.2116, "step": 18159 }, { "epoch": 0.49, "learning_rate": 0.0010872761698649475, "loss": 2.5894, "step": 18160 }, { "epoch": 0.49, "learning_rate": 0.001087189462468962, "loss": 2.4517, "step": 18161 }, { "epoch": 0.49, "learning_rate": 0.0010871027544124448, "loss": 2.4493, "step": 18162 }, { "epoch": 0.49, "learning_rate": 0.0010870160456960523, "loss": 2.3979, "step": 18163 }, { "epoch": 0.49, "learning_rate": 0.0010869293363204421, "loss": 2.4355, "step": 18164 }, { "epoch": 0.49, "learning_rate": 0.0010868426262862706, "loss": 2.0479, "step": 18165 }, { "epoch": 0.49, "learning_rate": 0.001086755915594195, "loss": 2.7797, "step": 18166 }, { "epoch": 0.49, "learning_rate": 0.0010866692042448723, "loss": 2.9846, "step": 18167 }, { "epoch": 0.49, "learning_rate": 0.001086582492238959, "loss": 2.3558, "step": 18168 }, { "epoch": 0.49, "learning_rate": 0.0010864957795771125, "loss": 2.4851, "step": 18169 }, { "epoch": 0.49, "learning_rate": 0.0010864090662599888, "loss": 2.2577, "step": 18170 }, { "epoch": 0.49, "learning_rate": 0.0010863223522882461, "loss": 2.8626, "step": 18171 }, { "epoch": 0.49, "learning_rate": 0.0010862356376625405, "loss": 2.5445, "step": 18172 }, { "epoch": 0.49, "learning_rate": 0.0010861489223835288, "loss": 2.8062, "step": 18173 }, { "epoch": 0.49, "learning_rate": 0.0010860622064518687, "loss": 2.9575, "step": 18174 }, { "epoch": 0.49, "learning_rate": 0.0010859754898682166, "loss": 2.8692, "step": 18175 }, { "epoch": 0.49, "learning_rate": 0.0010858887726332294, "loss": 2.7054, "step": 18176 }, { "epoch": 0.49, "learning_rate": 0.0010858020547475642, "loss": 2.5788, "step": 18177 }, { "epoch": 0.49, "learning_rate": 0.0010857153362118781, "loss": 2.4119, "step": 18178 }, { "epoch": 0.49, "learning_rate": 0.001085628617026828, "loss": 2.541, "step": 18179 }, { "epoch": 0.49, "learning_rate": 0.001085541897193071, "loss": 2.1584, "step": 18180 }, { "epoch": 0.49, "learning_rate": 0.0010854551767112632, "loss": 2.524, "step": 18181 }, { "epoch": 0.49, "learning_rate": 0.001085368455582063, "loss": 2.3255, "step": 18182 }, { "epoch": 0.49, "learning_rate": 0.0010852817338061261, "loss": 2.2863, "step": 18183 }, { "epoch": 0.49, "learning_rate": 0.0010851950113841102, "loss": 3.1414, "step": 18184 }, { "epoch": 0.49, "learning_rate": 0.0010851082883166724, "loss": 2.7683, "step": 18185 }, { "epoch": 0.49, "learning_rate": 0.001085021564604469, "loss": 2.2991, "step": 18186 }, { "epoch": 0.49, "learning_rate": 0.0010849348402481576, "loss": 2.7283, "step": 18187 }, { "epoch": 0.49, "learning_rate": 0.0010848481152483953, "loss": 2.5751, "step": 18188 }, { "epoch": 0.49, "learning_rate": 0.001084761389605838, "loss": 2.8257, "step": 18189 }, { "epoch": 0.49, "learning_rate": 0.0010846746633211444, "loss": 2.2528, "step": 18190 }, { "epoch": 0.49, "learning_rate": 0.0010845879363949706, "loss": 2.8866, "step": 18191 }, { "epoch": 0.49, "learning_rate": 0.0010845012088279734, "loss": 2.5678, "step": 18192 }, { "epoch": 0.49, "learning_rate": 0.0010844144806208102, "loss": 2.7917, "step": 18193 }, { "epoch": 0.49, "learning_rate": 0.0010843277517741383, "loss": 2.2997, "step": 18194 }, { "epoch": 0.49, "learning_rate": 0.0010842410222886146, "loss": 2.5403, "step": 18195 }, { "epoch": 0.49, "learning_rate": 0.0010841542921648953, "loss": 2.7419, "step": 18196 }, { "epoch": 0.49, "learning_rate": 0.0010840675614036384, "loss": 2.3746, "step": 18197 }, { "epoch": 0.49, "learning_rate": 0.001083980830005501, "loss": 2.8842, "step": 18198 }, { "epoch": 0.49, "learning_rate": 0.0010838940979711394, "loss": 3.1095, "step": 18199 }, { "epoch": 0.49, "learning_rate": 0.001083807365301211, "loss": 2.6291, "step": 18200 }, { "epoch": 0.49, "learning_rate": 0.0010837206319963735, "loss": 2.3588, "step": 18201 }, { "epoch": 0.49, "learning_rate": 0.0010836338980572831, "loss": 2.3372, "step": 18202 }, { "epoch": 0.49, "learning_rate": 0.0010835471634845974, "loss": 2.542, "step": 18203 }, { "epoch": 0.49, "learning_rate": 0.0010834604282789733, "loss": 2.4714, "step": 18204 }, { "epoch": 0.49, "learning_rate": 0.001083373692441068, "loss": 2.6864, "step": 18205 }, { "epoch": 0.49, "learning_rate": 0.0010832869559715384, "loss": 2.6061, "step": 18206 }, { "epoch": 0.49, "learning_rate": 0.0010832002188710418, "loss": 2.0994, "step": 18207 }, { "epoch": 0.49, "learning_rate": 0.0010831134811402352, "loss": 2.2855, "step": 18208 }, { "epoch": 0.49, "learning_rate": 0.0010830267427797756, "loss": 2.3084, "step": 18209 }, { "epoch": 0.49, "learning_rate": 0.0010829400037903204, "loss": 2.9761, "step": 18210 }, { "epoch": 0.49, "learning_rate": 0.0010828532641725267, "loss": 2.5068, "step": 18211 }, { "epoch": 0.49, "learning_rate": 0.001082766523927051, "loss": 2.3438, "step": 18212 }, { "epoch": 0.49, "learning_rate": 0.0010826797830545511, "loss": 3.0982, "step": 18213 }, { "epoch": 0.49, "learning_rate": 0.0010825930415556842, "loss": 3.1889, "step": 18214 }, { "epoch": 0.49, "learning_rate": 0.0010825062994311069, "loss": 2.3073, "step": 18215 }, { "epoch": 0.49, "learning_rate": 0.0010824195566814766, "loss": 2.7603, "step": 18216 }, { "epoch": 0.49, "learning_rate": 0.0010823328133074506, "loss": 2.6572, "step": 18217 }, { "epoch": 0.49, "learning_rate": 0.001082246069309686, "loss": 2.2432, "step": 18218 }, { "epoch": 0.49, "learning_rate": 0.00108215932468884, "loss": 1.9025, "step": 18219 }, { "epoch": 0.49, "learning_rate": 0.0010820725794455693, "loss": 2.5285, "step": 18220 }, { "epoch": 0.49, "learning_rate": 0.0010819858335805318, "loss": 2.9949, "step": 18221 }, { "epoch": 0.49, "learning_rate": 0.0010818990870943837, "loss": 2.3326, "step": 18222 }, { "epoch": 0.49, "learning_rate": 0.0010818123399877833, "loss": 2.7957, "step": 18223 }, { "epoch": 0.49, "learning_rate": 0.0010817255922613868, "loss": 2.7914, "step": 18224 }, { "epoch": 0.49, "learning_rate": 0.0010816388439158521, "loss": 2.5004, "step": 18225 }, { "epoch": 0.49, "learning_rate": 0.0010815520949518363, "loss": 2.4745, "step": 18226 }, { "epoch": 0.49, "learning_rate": 0.0010814653453699963, "loss": 2.4979, "step": 18227 }, { "epoch": 0.49, "learning_rate": 0.0010813785951709891, "loss": 2.6341, "step": 18228 }, { "epoch": 0.49, "learning_rate": 0.0010812918443554725, "loss": 2.5428, "step": 18229 }, { "epoch": 0.49, "learning_rate": 0.0010812050929241033, "loss": 2.871, "step": 18230 }, { "epoch": 0.49, "learning_rate": 0.001081118340877539, "loss": 2.3126, "step": 18231 }, { "epoch": 0.49, "learning_rate": 0.0010810315882164364, "loss": 2.2036, "step": 18232 }, { "epoch": 0.49, "learning_rate": 0.001080944834941453, "loss": 2.83, "step": 18233 }, { "epoch": 0.49, "learning_rate": 0.0010808580810532462, "loss": 2.7534, "step": 18234 }, { "epoch": 0.49, "learning_rate": 0.0010807713265524727, "loss": 2.7555, "step": 18235 }, { "epoch": 0.49, "learning_rate": 0.0010806845714397904, "loss": 2.4581, "step": 18236 }, { "epoch": 0.49, "learning_rate": 0.0010805978157158562, "loss": 2.1164, "step": 18237 }, { "epoch": 0.49, "learning_rate": 0.0010805110593813275, "loss": 2.2262, "step": 18238 }, { "epoch": 0.49, "learning_rate": 0.0010804243024368607, "loss": 2.7806, "step": 18239 }, { "epoch": 0.49, "learning_rate": 0.0010803375448831145, "loss": 2.8238, "step": 18240 }, { "epoch": 0.49, "learning_rate": 0.0010802507867207452, "loss": 2.5036, "step": 18241 }, { "epoch": 0.49, "learning_rate": 0.0010801640279504102, "loss": 2.7647, "step": 18242 }, { "epoch": 0.49, "learning_rate": 0.001080077268572767, "loss": 2.3921, "step": 18243 }, { "epoch": 0.49, "learning_rate": 0.0010799905085884726, "loss": 2.7857, "step": 18244 }, { "epoch": 0.49, "learning_rate": 0.0010799037479981843, "loss": 2.4897, "step": 18245 }, { "epoch": 0.49, "learning_rate": 0.0010798169868025597, "loss": 2.5977, "step": 18246 }, { "epoch": 0.49, "learning_rate": 0.0010797302250022559, "loss": 2.3256, "step": 18247 }, { "epoch": 0.49, "learning_rate": 0.0010796434625979302, "loss": 2.4386, "step": 18248 }, { "epoch": 0.49, "learning_rate": 0.0010795566995902394, "loss": 2.0423, "step": 18249 }, { "epoch": 0.49, "learning_rate": 0.0010794699359798418, "loss": 2.453, "step": 18250 }, { "epoch": 0.49, "learning_rate": 0.001079383171767394, "loss": 3.0143, "step": 18251 }, { "epoch": 0.49, "learning_rate": 0.0010792964069535533, "loss": 2.4956, "step": 18252 }, { "epoch": 0.49, "learning_rate": 0.0010792096415389776, "loss": 2.6403, "step": 18253 }, { "epoch": 0.49, "learning_rate": 0.0010791228755243237, "loss": 2.4814, "step": 18254 }, { "epoch": 0.49, "learning_rate": 0.0010790361089102487, "loss": 2.9903, "step": 18255 }, { "epoch": 0.49, "learning_rate": 0.0010789493416974107, "loss": 2.2297, "step": 18256 }, { "epoch": 0.49, "learning_rate": 0.0010788625738864664, "loss": 2.3699, "step": 18257 }, { "epoch": 0.49, "learning_rate": 0.0010787758054780733, "loss": 2.4782, "step": 18258 }, { "epoch": 0.49, "learning_rate": 0.0010786890364728888, "loss": 2.4262, "step": 18259 }, { "epoch": 0.49, "learning_rate": 0.0010786022668715703, "loss": 2.4444, "step": 18260 }, { "epoch": 0.49, "learning_rate": 0.001078515496674775, "loss": 2.5596, "step": 18261 }, { "epoch": 0.49, "learning_rate": 0.0010784287258831604, "loss": 2.4597, "step": 18262 }, { "epoch": 0.49, "learning_rate": 0.0010783419544973835, "loss": 2.126, "step": 18263 }, { "epoch": 0.49, "learning_rate": 0.0010782551825181024, "loss": 2.471, "step": 18264 }, { "epoch": 0.49, "learning_rate": 0.0010781684099459739, "loss": 2.362, "step": 18265 }, { "epoch": 0.49, "learning_rate": 0.0010780816367816554, "loss": 2.5548, "step": 18266 }, { "epoch": 0.49, "learning_rate": 0.0010779948630258046, "loss": 2.3156, "step": 18267 }, { "epoch": 0.49, "learning_rate": 0.0010779080886790782, "loss": 2.672, "step": 18268 }, { "epoch": 0.49, "learning_rate": 0.0010778213137421343, "loss": 2.7085, "step": 18269 }, { "epoch": 0.49, "learning_rate": 0.0010777345382156304, "loss": 2.3808, "step": 18270 }, { "epoch": 0.49, "learning_rate": 0.0010776477621002231, "loss": 2.3692, "step": 18271 }, { "epoch": 0.49, "learning_rate": 0.0010775609853965703, "loss": 2.654, "step": 18272 }, { "epoch": 0.49, "learning_rate": 0.0010774742081053295, "loss": 2.4726, "step": 18273 }, { "epoch": 0.49, "learning_rate": 0.001077387430227158, "loss": 2.3181, "step": 18274 }, { "epoch": 0.49, "learning_rate": 0.0010773006517627126, "loss": 2.1585, "step": 18275 }, { "epoch": 0.49, "learning_rate": 0.001077213872712652, "loss": 2.5404, "step": 18276 }, { "epoch": 0.49, "learning_rate": 0.0010771270930776324, "loss": 2.7823, "step": 18277 }, { "epoch": 0.49, "learning_rate": 0.001077040312858312, "loss": 2.5256, "step": 18278 }, { "epoch": 0.49, "learning_rate": 0.0010769535320553478, "loss": 2.7406, "step": 18279 }, { "epoch": 0.49, "learning_rate": 0.0010768667506693976, "loss": 2.6288, "step": 18280 }, { "epoch": 0.49, "learning_rate": 0.0010767799687011184, "loss": 2.535, "step": 18281 }, { "epoch": 0.49, "learning_rate": 0.001076693186151168, "loss": 2.3764, "step": 18282 }, { "epoch": 0.49, "learning_rate": 0.001076606403020204, "loss": 2.3892, "step": 18283 }, { "epoch": 0.49, "learning_rate": 0.0010765196193088832, "loss": 2.7118, "step": 18284 }, { "epoch": 0.49, "learning_rate": 0.0010764328350178637, "loss": 2.171, "step": 18285 }, { "epoch": 0.49, "learning_rate": 0.0010763460501478023, "loss": 2.6964, "step": 18286 }, { "epoch": 0.49, "learning_rate": 0.0010762592646993575, "loss": 2.572, "step": 18287 }, { "epoch": 0.49, "learning_rate": 0.0010761724786731855, "loss": 2.2788, "step": 18288 }, { "epoch": 0.49, "learning_rate": 0.0010760856920699448, "loss": 2.2823, "step": 18289 }, { "epoch": 0.49, "learning_rate": 0.0010759989048902924, "loss": 2.3551, "step": 18290 }, { "epoch": 0.49, "learning_rate": 0.001075912117134886, "loss": 2.6398, "step": 18291 }, { "epoch": 0.49, "learning_rate": 0.001075825328804383, "loss": 2.6334, "step": 18292 }, { "epoch": 0.49, "learning_rate": 0.0010757385398994406, "loss": 2.1861, "step": 18293 }, { "epoch": 0.49, "learning_rate": 0.0010756517504207166, "loss": 2.5557, "step": 18294 }, { "epoch": 0.49, "learning_rate": 0.0010755649603688686, "loss": 2.68, "step": 18295 }, { "epoch": 0.49, "learning_rate": 0.0010754781697445539, "loss": 2.8905, "step": 18296 }, { "epoch": 0.49, "learning_rate": 0.0010753913785484304, "loss": 2.7124, "step": 18297 }, { "epoch": 0.49, "learning_rate": 0.0010753045867811547, "loss": 2.9208, "step": 18298 }, { "epoch": 0.49, "learning_rate": 0.0010752177944433853, "loss": 2.5604, "step": 18299 }, { "epoch": 0.49, "learning_rate": 0.0010751310015357793, "loss": 2.5389, "step": 18300 }, { "epoch": 0.49, "learning_rate": 0.0010750442080589941, "loss": 2.6111, "step": 18301 }, { "epoch": 0.49, "learning_rate": 0.0010749574140136876, "loss": 2.3525, "step": 18302 }, { "epoch": 0.49, "learning_rate": 0.0010748706194005171, "loss": 2.6581, "step": 18303 }, { "epoch": 0.49, "learning_rate": 0.0010747838242201402, "loss": 2.7841, "step": 18304 }, { "epoch": 0.49, "learning_rate": 0.0010746970284732143, "loss": 2.6466, "step": 18305 }, { "epoch": 0.49, "learning_rate": 0.001074610232160397, "loss": 2.4725, "step": 18306 }, { "epoch": 0.49, "learning_rate": 0.0010745234352823464, "loss": 2.692, "step": 18307 }, { "epoch": 0.49, "learning_rate": 0.001074436637839719, "loss": 2.8415, "step": 18308 }, { "epoch": 0.49, "learning_rate": 0.001074349839833173, "loss": 2.8059, "step": 18309 }, { "epoch": 0.49, "learning_rate": 0.0010742630412633662, "loss": 2.4261, "step": 18310 }, { "epoch": 0.49, "learning_rate": 0.0010741762421309555, "loss": 2.0518, "step": 18311 }, { "epoch": 0.49, "learning_rate": 0.0010740894424365992, "loss": 2.6586, "step": 18312 }, { "epoch": 0.49, "learning_rate": 0.0010740026421809544, "loss": 2.3622, "step": 18313 }, { "epoch": 0.49, "learning_rate": 0.001073915841364679, "loss": 2.3267, "step": 18314 }, { "epoch": 0.49, "learning_rate": 0.00107382903998843, "loss": 2.2894, "step": 18315 }, { "epoch": 0.49, "learning_rate": 0.0010737422380528658, "loss": 2.6949, "step": 18316 }, { "epoch": 0.49, "learning_rate": 0.0010736554355586434, "loss": 2.283, "step": 18317 }, { "epoch": 0.49, "learning_rate": 0.0010735686325064205, "loss": 2.3036, "step": 18318 }, { "epoch": 0.49, "learning_rate": 0.001073481828896855, "loss": 2.7401, "step": 18319 }, { "epoch": 0.49, "learning_rate": 0.0010733950247306043, "loss": 2.5622, "step": 18320 }, { "epoch": 0.49, "learning_rate": 0.0010733082200083258, "loss": 2.4721, "step": 18321 }, { "epoch": 0.49, "learning_rate": 0.0010732214147306774, "loss": 2.298, "step": 18322 }, { "epoch": 0.49, "learning_rate": 0.0010731346088983166, "loss": 2.6644, "step": 18323 }, { "epoch": 0.49, "learning_rate": 0.0010730478025119013, "loss": 2.854, "step": 18324 }, { "epoch": 0.49, "learning_rate": 0.0010729609955720887, "loss": 2.6605, "step": 18325 }, { "epoch": 0.49, "learning_rate": 0.0010728741880795367, "loss": 2.3466, "step": 18326 }, { "epoch": 0.49, "learning_rate": 0.001072787380034903, "loss": 2.3527, "step": 18327 }, { "epoch": 0.49, "learning_rate": 0.0010727005714388452, "loss": 2.3162, "step": 18328 }, { "epoch": 0.49, "learning_rate": 0.0010726137622920206, "loss": 2.2102, "step": 18329 }, { "epoch": 0.49, "learning_rate": 0.001072526952595087, "loss": 2.2944, "step": 18330 }, { "epoch": 0.49, "learning_rate": 0.0010724401423487025, "loss": 2.6456, "step": 18331 }, { "epoch": 0.49, "learning_rate": 0.0010723533315535243, "loss": 2.5673, "step": 18332 }, { "epoch": 0.49, "learning_rate": 0.0010722665202102103, "loss": 2.7177, "step": 18333 }, { "epoch": 0.49, "learning_rate": 0.0010721797083194178, "loss": 2.4547, "step": 18334 }, { "epoch": 0.49, "learning_rate": 0.0010720928958818051, "loss": 2.6379, "step": 18335 }, { "epoch": 0.49, "learning_rate": 0.0010720060828980293, "loss": 2.8376, "step": 18336 }, { "epoch": 0.49, "learning_rate": 0.0010719192693687482, "loss": 2.5309, "step": 18337 }, { "epoch": 0.49, "learning_rate": 0.0010718324552946197, "loss": 2.1136, "step": 18338 }, { "epoch": 0.49, "learning_rate": 0.0010717456406763015, "loss": 2.6937, "step": 18339 }, { "epoch": 0.49, "learning_rate": 0.0010716588255144511, "loss": 2.7918, "step": 18340 }, { "epoch": 0.49, "learning_rate": 0.001071572009809726, "loss": 2.8965, "step": 18341 }, { "epoch": 0.49, "learning_rate": 0.0010714851935627843, "loss": 2.9357, "step": 18342 }, { "epoch": 0.49, "learning_rate": 0.0010713983767742837, "loss": 2.8074, "step": 18343 }, { "epoch": 0.49, "learning_rate": 0.0010713115594448814, "loss": 2.2542, "step": 18344 }, { "epoch": 0.49, "learning_rate": 0.0010712247415752356, "loss": 2.9479, "step": 18345 }, { "epoch": 0.49, "learning_rate": 0.0010711379231660041, "loss": 2.1791, "step": 18346 }, { "epoch": 0.49, "learning_rate": 0.0010710511042178442, "loss": 2.5917, "step": 18347 }, { "epoch": 0.49, "learning_rate": 0.0010709642847314138, "loss": 2.8034, "step": 18348 }, { "epoch": 0.49, "learning_rate": 0.001070877464707371, "loss": 2.4633, "step": 18349 }, { "epoch": 0.49, "learning_rate": 0.001070790644146373, "loss": 2.642, "step": 18350 }, { "epoch": 0.49, "learning_rate": 0.0010707038230490778, "loss": 2.4278, "step": 18351 }, { "epoch": 0.49, "learning_rate": 0.0010706170014161429, "loss": 2.7428, "step": 18352 }, { "epoch": 0.49, "learning_rate": 0.0010705301792482262, "loss": 2.4636, "step": 18353 }, { "epoch": 0.49, "learning_rate": 0.0010704433565459856, "loss": 2.5943, "step": 18354 }, { "epoch": 0.49, "learning_rate": 0.0010703565333100788, "loss": 2.3684, "step": 18355 }, { "epoch": 0.49, "learning_rate": 0.0010702697095411634, "loss": 2.6073, "step": 18356 }, { "epoch": 0.49, "learning_rate": 0.0010701828852398975, "loss": 1.8928, "step": 18357 }, { "epoch": 0.49, "learning_rate": 0.0010700960604069381, "loss": 2.7153, "step": 18358 }, { "epoch": 0.49, "learning_rate": 0.0010700092350429441, "loss": 2.1936, "step": 18359 }, { "epoch": 0.49, "learning_rate": 0.001069922409148572, "loss": 2.6827, "step": 18360 }, { "epoch": 0.49, "learning_rate": 0.0010698355827244805, "loss": 2.4605, "step": 18361 }, { "epoch": 0.49, "learning_rate": 0.0010697487557713272, "loss": 2.0054, "step": 18362 }, { "epoch": 0.49, "learning_rate": 0.0010696619282897699, "loss": 2.4382, "step": 18363 }, { "epoch": 0.49, "learning_rate": 0.0010695751002804657, "loss": 2.3869, "step": 18364 }, { "epoch": 0.49, "learning_rate": 0.0010694882717440736, "loss": 2.7329, "step": 18365 }, { "epoch": 0.49, "learning_rate": 0.0010694014426812506, "loss": 2.4052, "step": 18366 }, { "epoch": 0.49, "learning_rate": 0.0010693146130926546, "loss": 2.6404, "step": 18367 }, { "epoch": 0.49, "learning_rate": 0.0010692277829789435, "loss": 2.8298, "step": 18368 }, { "epoch": 0.49, "learning_rate": 0.0010691409523407751, "loss": 2.5228, "step": 18369 }, { "epoch": 0.49, "learning_rate": 0.0010690541211788075, "loss": 3.2177, "step": 18370 }, { "epoch": 0.49, "learning_rate": 0.0010689672894936978, "loss": 2.4691, "step": 18371 }, { "epoch": 0.49, "learning_rate": 0.0010688804572861043, "loss": 2.7011, "step": 18372 }, { "epoch": 0.49, "learning_rate": 0.001068793624556685, "loss": 2.8184, "step": 18373 }, { "epoch": 0.49, "learning_rate": 0.0010687067913060972, "loss": 2.8664, "step": 18374 }, { "epoch": 0.49, "learning_rate": 0.0010686199575349992, "loss": 2.3276, "step": 18375 }, { "epoch": 0.49, "learning_rate": 0.0010685331232440486, "loss": 3.156, "step": 18376 }, { "epoch": 0.49, "learning_rate": 0.0010684462884339035, "loss": 2.9461, "step": 18377 }, { "epoch": 0.49, "learning_rate": 0.0010683594531052214, "loss": 2.4642, "step": 18378 }, { "epoch": 0.49, "learning_rate": 0.0010682726172586605, "loss": 2.4493, "step": 18379 }, { "epoch": 0.49, "learning_rate": 0.0010681857808948782, "loss": 2.6093, "step": 18380 }, { "epoch": 0.49, "learning_rate": 0.0010680989440145327, "loss": 2.4345, "step": 18381 }, { "epoch": 0.49, "learning_rate": 0.001068012106618282, "loss": 2.5542, "step": 18382 }, { "epoch": 0.49, "learning_rate": 0.0010679252687067833, "loss": 2.5212, "step": 18383 }, { "epoch": 0.49, "learning_rate": 0.0010678384302806952, "loss": 2.566, "step": 18384 }, { "epoch": 0.49, "learning_rate": 0.0010677515913406752, "loss": 2.607, "step": 18385 }, { "epoch": 0.49, "learning_rate": 0.0010676647518873814, "loss": 2.3659, "step": 18386 }, { "epoch": 0.49, "learning_rate": 0.0010675779119214712, "loss": 2.5515, "step": 18387 }, { "epoch": 0.49, "learning_rate": 0.001067491071443603, "loss": 2.8372, "step": 18388 }, { "epoch": 0.49, "learning_rate": 0.0010674042304544347, "loss": 2.4904, "step": 18389 }, { "epoch": 0.49, "learning_rate": 0.0010673173889546236, "loss": 2.674, "step": 18390 }, { "epoch": 0.49, "learning_rate": 0.0010672305469448281, "loss": 2.9309, "step": 18391 }, { "epoch": 0.49, "learning_rate": 0.0010671437044257063, "loss": 2.6654, "step": 18392 }, { "epoch": 0.49, "learning_rate": 0.001067056861397916, "loss": 2.7464, "step": 18393 }, { "epoch": 0.49, "learning_rate": 0.0010669700178621145, "loss": 2.4539, "step": 18394 }, { "epoch": 0.49, "learning_rate": 0.00106688317381896, "loss": 2.7355, "step": 18395 }, { "epoch": 0.49, "learning_rate": 0.0010667963292691107, "loss": 2.308, "step": 18396 }, { "epoch": 0.49, "learning_rate": 0.0010667094842132243, "loss": 2.4813, "step": 18397 }, { "epoch": 0.49, "learning_rate": 0.0010666226386519592, "loss": 2.2542, "step": 18398 }, { "epoch": 0.49, "learning_rate": 0.0010665357925859723, "loss": 2.6537, "step": 18399 }, { "epoch": 0.49, "learning_rate": 0.0010664489460159223, "loss": 2.4806, "step": 18400 }, { "epoch": 0.49, "learning_rate": 0.001066362098942467, "loss": 2.6656, "step": 18401 }, { "epoch": 0.49, "learning_rate": 0.0010662752513662644, "loss": 2.6698, "step": 18402 }, { "epoch": 0.49, "learning_rate": 0.0010661884032879723, "loss": 2.554, "step": 18403 }, { "epoch": 0.49, "learning_rate": 0.0010661015547082484, "loss": 2.6985, "step": 18404 }, { "epoch": 0.49, "learning_rate": 0.0010660147056277514, "loss": 2.3827, "step": 18405 }, { "epoch": 0.49, "learning_rate": 0.0010659278560471387, "loss": 2.4012, "step": 18406 }, { "epoch": 0.49, "learning_rate": 0.0010658410059670679, "loss": 2.4722, "step": 18407 }, { "epoch": 0.49, "learning_rate": 0.0010657541553881977, "loss": 2.5496, "step": 18408 }, { "epoch": 0.49, "learning_rate": 0.001065667304311186, "loss": 2.3738, "step": 18409 }, { "epoch": 0.49, "learning_rate": 0.0010655804527366904, "loss": 2.768, "step": 18410 }, { "epoch": 0.49, "learning_rate": 0.0010654936006653688, "loss": 2.5703, "step": 18411 }, { "epoch": 0.49, "learning_rate": 0.0010654067480978797, "loss": 2.4657, "step": 18412 }, { "epoch": 0.49, "learning_rate": 0.0010653198950348805, "loss": 2.4513, "step": 18413 }, { "epoch": 0.49, "learning_rate": 0.0010652330414770298, "loss": 2.4205, "step": 18414 }, { "epoch": 0.49, "learning_rate": 0.0010651461874249847, "loss": 2.9083, "step": 18415 }, { "epoch": 0.49, "learning_rate": 0.0010650593328794043, "loss": 2.3335, "step": 18416 }, { "epoch": 0.49, "learning_rate": 0.0010649724778409458, "loss": 2.5072, "step": 18417 }, { "epoch": 0.49, "learning_rate": 0.0010648856223102673, "loss": 2.4434, "step": 18418 }, { "epoch": 0.49, "learning_rate": 0.0010647987662880272, "loss": 1.9283, "step": 18419 }, { "epoch": 0.5, "learning_rate": 0.001064711909774883, "loss": 2.7489, "step": 18420 }, { "epoch": 0.5, "learning_rate": 0.0010646250527714932, "loss": 2.7392, "step": 18421 }, { "epoch": 0.5, "learning_rate": 0.0010645381952785152, "loss": 2.2303, "step": 18422 }, { "epoch": 0.5, "learning_rate": 0.0010644513372966076, "loss": 2.3484, "step": 18423 }, { "epoch": 0.5, "learning_rate": 0.0010643644788264279, "loss": 2.2765, "step": 18424 }, { "epoch": 0.5, "learning_rate": 0.001064277619868635, "loss": 2.6064, "step": 18425 }, { "epoch": 0.5, "learning_rate": 0.0010641907604238855, "loss": 2.2599, "step": 18426 }, { "epoch": 0.5, "learning_rate": 0.0010641039004928388, "loss": 2.6982, "step": 18427 }, { "epoch": 0.5, "learning_rate": 0.0010640170400761527, "loss": 2.4426, "step": 18428 }, { "epoch": 0.5, "learning_rate": 0.0010639301791744848, "loss": 2.3522, "step": 18429 }, { "epoch": 0.5, "learning_rate": 0.0010638433177884924, "loss": 2.6003, "step": 18430 }, { "epoch": 0.5, "learning_rate": 0.0010637564559188356, "loss": 2.5421, "step": 18431 }, { "epoch": 0.5, "learning_rate": 0.001063669593566171, "loss": 2.6734, "step": 18432 }, { "epoch": 0.5, "learning_rate": 0.0010635827307311566, "loss": 2.6616, "step": 18433 }, { "epoch": 0.5, "learning_rate": 0.0010634958674144508, "loss": 3.0095, "step": 18434 }, { "epoch": 0.5, "learning_rate": 0.001063409003616712, "loss": 2.6271, "step": 18435 }, { "epoch": 0.5, "learning_rate": 0.001063322139338598, "loss": 2.703, "step": 18436 }, { "epoch": 0.5, "learning_rate": 0.0010632352745807664, "loss": 2.7801, "step": 18437 }, { "epoch": 0.5, "learning_rate": 0.0010631484093438757, "loss": 2.7385, "step": 18438 }, { "epoch": 0.5, "learning_rate": 0.0010630615436285841, "loss": 2.7136, "step": 18439 }, { "epoch": 0.5, "learning_rate": 0.0010629746774355494, "loss": 2.7816, "step": 18440 }, { "epoch": 0.5, "learning_rate": 0.00106288781076543, "loss": 2.8852, "step": 18441 }, { "epoch": 0.5, "learning_rate": 0.0010628009436188836, "loss": 2.4721, "step": 18442 }, { "epoch": 0.5, "learning_rate": 0.0010627140759965686, "loss": 2.5835, "step": 18443 }, { "epoch": 0.5, "learning_rate": 0.001062627207899143, "loss": 2.7159, "step": 18444 }, { "epoch": 0.5, "learning_rate": 0.0010625403393272647, "loss": 2.5359, "step": 18445 }, { "epoch": 0.5, "learning_rate": 0.0010624534702815922, "loss": 2.4583, "step": 18446 }, { "epoch": 0.5, "learning_rate": 0.001062366600762783, "loss": 2.863, "step": 18447 }, { "epoch": 0.5, "learning_rate": 0.001062279730771496, "loss": 2.1999, "step": 18448 }, { "epoch": 0.5, "learning_rate": 0.0010621928603083888, "loss": 2.327, "step": 18449 }, { "epoch": 0.5, "learning_rate": 0.0010621059893741191, "loss": 2.5081, "step": 18450 }, { "epoch": 0.5, "learning_rate": 0.001062019117969346, "loss": 2.2108, "step": 18451 }, { "epoch": 0.5, "learning_rate": 0.0010619322460947273, "loss": 2.3302, "step": 18452 }, { "epoch": 0.5, "learning_rate": 0.001061845373750921, "loss": 2.2919, "step": 18453 }, { "epoch": 0.5, "learning_rate": 0.0010617585009385848, "loss": 2.6858, "step": 18454 }, { "epoch": 0.5, "learning_rate": 0.0010616716276583775, "loss": 2.1123, "step": 18455 }, { "epoch": 0.5, "learning_rate": 0.0010615847539109568, "loss": 2.427, "step": 18456 }, { "epoch": 0.5, "learning_rate": 0.0010614978796969813, "loss": 2.7125, "step": 18457 }, { "epoch": 0.5, "learning_rate": 0.0010614110050171086, "loss": 2.3067, "step": 18458 }, { "epoch": 0.5, "learning_rate": 0.0010613241298719973, "loss": 2.2283, "step": 18459 }, { "epoch": 0.5, "learning_rate": 0.001061237254262305, "loss": 2.5809, "step": 18460 }, { "epoch": 0.5, "learning_rate": 0.0010611503781886905, "loss": 2.7123, "step": 18461 }, { "epoch": 0.5, "learning_rate": 0.0010610635016518118, "loss": 2.4174, "step": 18462 }, { "epoch": 0.5, "learning_rate": 0.0010609766246523265, "loss": 2.3197, "step": 18463 }, { "epoch": 0.5, "learning_rate": 0.0010608897471908935, "loss": 2.6022, "step": 18464 }, { "epoch": 0.5, "learning_rate": 0.0010608028692681707, "loss": 2.2585, "step": 18465 }, { "epoch": 0.5, "learning_rate": 0.001060715990884816, "loss": 2.3625, "step": 18466 }, { "epoch": 0.5, "learning_rate": 0.0010606291120414878, "loss": 2.7836, "step": 18467 }, { "epoch": 0.5, "learning_rate": 0.0010605422327388447, "loss": 2.0806, "step": 18468 }, { "epoch": 0.5, "learning_rate": 0.001060455352977544, "loss": 2.5117, "step": 18469 }, { "epoch": 0.5, "learning_rate": 0.0010603684727582446, "loss": 2.8498, "step": 18470 }, { "epoch": 0.5, "learning_rate": 0.0010602815920816044, "loss": 2.8488, "step": 18471 }, { "epoch": 0.5, "learning_rate": 0.001060194710948282, "loss": 2.465, "step": 18472 }, { "epoch": 0.5, "learning_rate": 0.0010601078293589344, "loss": 2.757, "step": 18473 }, { "epoch": 0.5, "learning_rate": 0.001060020947314221, "loss": 2.036, "step": 18474 }, { "epoch": 0.5, "learning_rate": 0.0010599340648148, "loss": 2.2841, "step": 18475 }, { "epoch": 0.5, "learning_rate": 0.001059847181861329, "loss": 2.2511, "step": 18476 }, { "epoch": 0.5, "learning_rate": 0.001059760298454466, "loss": 2.3321, "step": 18477 }, { "epoch": 0.5, "learning_rate": 0.0010596734145948703, "loss": 2.3275, "step": 18478 }, { "epoch": 0.5, "learning_rate": 0.0010595865302831995, "loss": 2.3228, "step": 18479 }, { "epoch": 0.5, "learning_rate": 0.0010594996455201113, "loss": 2.3698, "step": 18480 }, { "epoch": 0.5, "learning_rate": 0.0010594127603062646, "loss": 2.6086, "step": 18481 }, { "epoch": 0.5, "learning_rate": 0.0010593258746423178, "loss": 2.6143, "step": 18482 }, { "epoch": 0.5, "learning_rate": 0.0010592389885289283, "loss": 2.5109, "step": 18483 }, { "epoch": 0.5, "learning_rate": 0.0010591521019667552, "loss": 2.4699, "step": 18484 }, { "epoch": 0.5, "learning_rate": 0.0010590652149564562, "loss": 2.7193, "step": 18485 }, { "epoch": 0.5, "learning_rate": 0.0010589783274986895, "loss": 2.0874, "step": 18486 }, { "epoch": 0.5, "learning_rate": 0.0010588914395941139, "loss": 2.8947, "step": 18487 }, { "epoch": 0.5, "learning_rate": 0.001058804551243387, "loss": 2.333, "step": 18488 }, { "epoch": 0.5, "learning_rate": 0.0010587176624471673, "loss": 2.4766, "step": 18489 }, { "epoch": 0.5, "learning_rate": 0.0010586307732061131, "loss": 2.6276, "step": 18490 }, { "epoch": 0.5, "learning_rate": 0.0010585438835208829, "loss": 2.3034, "step": 18491 }, { "epoch": 0.5, "learning_rate": 0.0010584569933921345, "loss": 2.5943, "step": 18492 }, { "epoch": 0.5, "learning_rate": 0.0010583701028205263, "loss": 2.636, "step": 18493 }, { "epoch": 0.5, "learning_rate": 0.0010582832118067168, "loss": 2.473, "step": 18494 }, { "epoch": 0.5, "learning_rate": 0.0010581963203513643, "loss": 2.4606, "step": 18495 }, { "epoch": 0.5, "learning_rate": 0.0010581094284551262, "loss": 2.3952, "step": 18496 }, { "epoch": 0.5, "learning_rate": 0.001058022536118662, "loss": 2.3604, "step": 18497 }, { "epoch": 0.5, "learning_rate": 0.0010579356433426297, "loss": 2.4693, "step": 18498 }, { "epoch": 0.5, "learning_rate": 0.0010578487501276869, "loss": 2.7787, "step": 18499 }, { "epoch": 0.5, "learning_rate": 0.0010577618564744922, "loss": 2.7334, "step": 18500 }, { "epoch": 0.5, "learning_rate": 0.0010576749623837044, "loss": 2.5829, "step": 18501 }, { "epoch": 0.5, "learning_rate": 0.0010575880678559812, "loss": 2.413, "step": 18502 }, { "epoch": 0.5, "learning_rate": 0.001057501172891981, "loss": 2.8325, "step": 18503 }, { "epoch": 0.5, "learning_rate": 0.001057414277492362, "loss": 2.1843, "step": 18504 }, { "epoch": 0.5, "learning_rate": 0.0010573273816577833, "loss": 2.6409, "step": 18505 }, { "epoch": 0.5, "learning_rate": 0.0010572404853889021, "loss": 1.965, "step": 18506 }, { "epoch": 0.5, "learning_rate": 0.0010571535886863776, "loss": 2.6682, "step": 18507 }, { "epoch": 0.5, "learning_rate": 0.0010570666915508673, "loss": 2.7161, "step": 18508 }, { "epoch": 0.5, "learning_rate": 0.0010569797939830301, "loss": 2.7998, "step": 18509 }, { "epoch": 0.5, "learning_rate": 0.0010568928959835244, "loss": 2.6342, "step": 18510 }, { "epoch": 0.5, "learning_rate": 0.0010568059975530082, "loss": 2.1619, "step": 18511 }, { "epoch": 0.5, "learning_rate": 0.0010567190986921398, "loss": 2.5027, "step": 18512 }, { "epoch": 0.5, "learning_rate": 0.0010566321994015776, "loss": 2.4866, "step": 18513 }, { "epoch": 0.5, "learning_rate": 0.0010565452996819803, "loss": 2.3784, "step": 18514 }, { "epoch": 0.5, "learning_rate": 0.0010564583995340056, "loss": 2.3608, "step": 18515 }, { "epoch": 0.5, "learning_rate": 0.001056371498958312, "loss": 2.4748, "step": 18516 }, { "epoch": 0.5, "learning_rate": 0.0010562845979555583, "loss": 2.5975, "step": 18517 }, { "epoch": 0.5, "learning_rate": 0.0010561976965264026, "loss": 2.5969, "step": 18518 }, { "epoch": 0.5, "learning_rate": 0.0010561107946715032, "loss": 2.9347, "step": 18519 }, { "epoch": 0.5, "learning_rate": 0.0010560238923915182, "loss": 2.4376, "step": 18520 }, { "epoch": 0.5, "learning_rate": 0.0010559369896871065, "loss": 2.4153, "step": 18521 }, { "epoch": 0.5, "learning_rate": 0.0010558500865589257, "loss": 2.6688, "step": 18522 }, { "epoch": 0.5, "learning_rate": 0.0010557631830076352, "loss": 2.9674, "step": 18523 }, { "epoch": 0.5, "learning_rate": 0.0010556762790338925, "loss": 2.7164, "step": 18524 }, { "epoch": 0.5, "learning_rate": 0.0010555893746383564, "loss": 2.4714, "step": 18525 }, { "epoch": 0.5, "learning_rate": 0.001055502469821685, "loss": 2.3119, "step": 18526 }, { "epoch": 0.5, "learning_rate": 0.001055415564584537, "loss": 2.1711, "step": 18527 }, { "epoch": 0.5, "learning_rate": 0.0010553286589275704, "loss": 2.4291, "step": 18528 }, { "epoch": 0.5, "learning_rate": 0.0010552417528514435, "loss": 2.4849, "step": 18529 }, { "epoch": 0.5, "learning_rate": 0.0010551548463568156, "loss": 2.4796, "step": 18530 }, { "epoch": 0.5, "learning_rate": 0.0010550679394443442, "loss": 2.6705, "step": 18531 }, { "epoch": 0.5, "learning_rate": 0.0010549810321146878, "loss": 2.7127, "step": 18532 }, { "epoch": 0.5, "learning_rate": 0.0010548941243685049, "loss": 2.9996, "step": 18533 }, { "epoch": 0.5, "learning_rate": 0.001054807216206454, "loss": 2.2029, "step": 18534 }, { "epoch": 0.5, "learning_rate": 0.0010547203076291933, "loss": 2.114, "step": 18535 }, { "epoch": 0.5, "learning_rate": 0.0010546333986373815, "loss": 2.1195, "step": 18536 }, { "epoch": 0.5, "learning_rate": 0.001054546489231677, "loss": 2.7474, "step": 18537 }, { "epoch": 0.5, "learning_rate": 0.001054459579412738, "loss": 2.0138, "step": 18538 }, { "epoch": 0.5, "learning_rate": 0.0010543726691812226, "loss": 2.4125, "step": 18539 }, { "epoch": 0.5, "learning_rate": 0.00105428575853779, "loss": 2.3085, "step": 18540 }, { "epoch": 0.5, "learning_rate": 0.001054198847483098, "loss": 2.5652, "step": 18541 }, { "epoch": 0.5, "learning_rate": 0.001054111936017805, "loss": 2.5787, "step": 18542 }, { "epoch": 0.5, "learning_rate": 0.00105402502414257, "loss": 2.7412, "step": 18543 }, { "epoch": 0.5, "learning_rate": 0.001053938111858051, "loss": 2.8143, "step": 18544 }, { "epoch": 0.5, "learning_rate": 0.0010538511991649065, "loss": 2.5986, "step": 18545 }, { "epoch": 0.5, "learning_rate": 0.0010537642860637948, "loss": 2.7788, "step": 18546 }, { "epoch": 0.5, "learning_rate": 0.0010536773725553746, "loss": 2.5102, "step": 18547 }, { "epoch": 0.5, "learning_rate": 0.0010535904586403042, "loss": 2.4423, "step": 18548 }, { "epoch": 0.5, "learning_rate": 0.001053503544319242, "loss": 2.834, "step": 18549 }, { "epoch": 0.5, "learning_rate": 0.0010534166295928468, "loss": 2.2567, "step": 18550 }, { "epoch": 0.5, "learning_rate": 0.0010533297144617764, "loss": 2.0103, "step": 18551 }, { "epoch": 0.5, "learning_rate": 0.0010532427989266898, "loss": 2.5857, "step": 18552 }, { "epoch": 0.5, "learning_rate": 0.0010531558829882453, "loss": 2.8886, "step": 18553 }, { "epoch": 0.5, "learning_rate": 0.0010530689666471014, "loss": 2.4502, "step": 18554 }, { "epoch": 0.5, "learning_rate": 0.0010529820499039161, "loss": 2.4302, "step": 18555 }, { "epoch": 0.5, "learning_rate": 0.0010528951327593485, "loss": 2.3568, "step": 18556 }, { "epoch": 0.5, "learning_rate": 0.001052808215214057, "loss": 2.5748, "step": 18557 }, { "epoch": 0.5, "learning_rate": 0.0010527212972686998, "loss": 2.2451, "step": 18558 }, { "epoch": 0.5, "learning_rate": 0.0010526343789239352, "loss": 2.5721, "step": 18559 }, { "epoch": 0.5, "learning_rate": 0.0010525474601804224, "loss": 2.7859, "step": 18560 }, { "epoch": 0.5, "learning_rate": 0.0010524605410388193, "loss": 2.115, "step": 18561 }, { "epoch": 0.5, "learning_rate": 0.0010523736214997843, "loss": 2.2188, "step": 18562 }, { "epoch": 0.5, "learning_rate": 0.0010522867015639763, "loss": 2.395, "step": 18563 }, { "epoch": 0.5, "learning_rate": 0.0010521997812320536, "loss": 2.9674, "step": 18564 }, { "epoch": 0.5, "learning_rate": 0.0010521128605046747, "loss": 2.3769, "step": 18565 }, { "epoch": 0.5, "learning_rate": 0.001052025939382498, "loss": 3.0608, "step": 18566 }, { "epoch": 0.5, "learning_rate": 0.001051939017866182, "loss": 2.6445, "step": 18567 }, { "epoch": 0.5, "learning_rate": 0.0010518520959563857, "loss": 2.281, "step": 18568 }, { "epoch": 0.5, "learning_rate": 0.0010517651736537668, "loss": 2.381, "step": 18569 }, { "epoch": 0.5, "learning_rate": 0.0010516782509589842, "loss": 2.7906, "step": 18570 }, { "epoch": 0.5, "learning_rate": 0.0010515913278726968, "loss": 2.2164, "step": 18571 }, { "epoch": 0.5, "learning_rate": 0.0010515044043955622, "loss": 2.9612, "step": 18572 }, { "epoch": 0.5, "learning_rate": 0.0010514174805282396, "loss": 2.2664, "step": 18573 }, { "epoch": 0.5, "learning_rate": 0.0010513305562713875, "loss": 2.451, "step": 18574 }, { "epoch": 0.5, "learning_rate": 0.0010512436316256644, "loss": 2.5085, "step": 18575 }, { "epoch": 0.5, "learning_rate": 0.0010511567065917284, "loss": 2.5424, "step": 18576 }, { "epoch": 0.5, "learning_rate": 0.0010510697811702385, "loss": 2.2541, "step": 18577 }, { "epoch": 0.5, "learning_rate": 0.001050982855361853, "loss": 2.7555, "step": 18578 }, { "epoch": 0.5, "learning_rate": 0.0010508959291672304, "loss": 2.4746, "step": 18579 }, { "epoch": 0.5, "learning_rate": 0.0010508090025870295, "loss": 2.2008, "step": 18580 }, { "epoch": 0.5, "learning_rate": 0.001050722075621909, "loss": 2.69, "step": 18581 }, { "epoch": 0.5, "learning_rate": 0.0010506351482725263, "loss": 2.4451, "step": 18582 }, { "epoch": 0.5, "learning_rate": 0.0010505482205395414, "loss": 2.4338, "step": 18583 }, { "epoch": 0.5, "learning_rate": 0.0010504612924236124, "loss": 2.1646, "step": 18584 }, { "epoch": 0.5, "learning_rate": 0.0010503743639253972, "loss": 2.6943, "step": 18585 }, { "epoch": 0.5, "learning_rate": 0.0010502874350455547, "loss": 2.6426, "step": 18586 }, { "epoch": 0.5, "learning_rate": 0.001050200505784744, "loss": 2.2602, "step": 18587 }, { "epoch": 0.5, "learning_rate": 0.001050113576143623, "loss": 3.0282, "step": 18588 }, { "epoch": 0.5, "learning_rate": 0.0010500266461228507, "loss": 3.0167, "step": 18589 }, { "epoch": 0.5, "learning_rate": 0.0010499397157230851, "loss": 2.5512, "step": 18590 }, { "epoch": 0.5, "learning_rate": 0.0010498527849449857, "loss": 2.4084, "step": 18591 }, { "epoch": 0.5, "learning_rate": 0.0010497658537892102, "loss": 2.5335, "step": 18592 }, { "epoch": 0.5, "learning_rate": 0.0010496789222564176, "loss": 2.8194, "step": 18593 }, { "epoch": 0.5, "learning_rate": 0.0010495919903472661, "loss": 2.5307, "step": 18594 }, { "epoch": 0.5, "learning_rate": 0.0010495050580624145, "loss": 2.4959, "step": 18595 }, { "epoch": 0.5, "learning_rate": 0.001049418125402522, "loss": 2.6746, "step": 18596 }, { "epoch": 0.5, "learning_rate": 0.0010493311923682463, "loss": 2.5811, "step": 18597 }, { "epoch": 0.5, "learning_rate": 0.0010492442589602462, "loss": 2.6804, "step": 18598 }, { "epoch": 0.5, "learning_rate": 0.0010491573251791805, "loss": 3.3809, "step": 18599 }, { "epoch": 0.5, "learning_rate": 0.0010490703910257077, "loss": 2.4025, "step": 18600 }, { "epoch": 0.5, "learning_rate": 0.0010489834565004864, "loss": 2.4199, "step": 18601 }, { "epoch": 0.5, "learning_rate": 0.0010488965216041751, "loss": 2.5986, "step": 18602 }, { "epoch": 0.5, "learning_rate": 0.0010488095863374325, "loss": 2.5552, "step": 18603 }, { "epoch": 0.5, "learning_rate": 0.0010487226507009174, "loss": 2.5338, "step": 18604 }, { "epoch": 0.5, "learning_rate": 0.0010486357146952878, "loss": 2.5718, "step": 18605 }, { "epoch": 0.5, "learning_rate": 0.0010485487783212031, "loss": 2.5633, "step": 18606 }, { "epoch": 0.5, "learning_rate": 0.0010484618415793215, "loss": 2.1103, "step": 18607 }, { "epoch": 0.5, "learning_rate": 0.0010483749044703015, "loss": 2.9242, "step": 18608 }, { "epoch": 0.5, "learning_rate": 0.0010482879669948017, "loss": 2.3655, "step": 18609 }, { "epoch": 0.5, "learning_rate": 0.0010482010291534814, "loss": 2.3967, "step": 18610 }, { "epoch": 0.5, "learning_rate": 0.0010481140909469984, "loss": 2.677, "step": 18611 }, { "epoch": 0.5, "learning_rate": 0.0010480271523760118, "loss": 2.2842, "step": 18612 }, { "epoch": 0.5, "learning_rate": 0.0010479402134411797, "loss": 2.3116, "step": 18613 }, { "epoch": 0.5, "learning_rate": 0.0010478532741431616, "loss": 2.6307, "step": 18614 }, { "epoch": 0.5, "learning_rate": 0.0010477663344826153, "loss": 2.6351, "step": 18615 }, { "epoch": 0.5, "learning_rate": 0.0010476793944602001, "loss": 2.4201, "step": 18616 }, { "epoch": 0.5, "learning_rate": 0.001047592454076574, "loss": 2.6558, "step": 18617 }, { "epoch": 0.5, "learning_rate": 0.0010475055133323961, "loss": 2.3584, "step": 18618 }, { "epoch": 0.5, "learning_rate": 0.001047418572228325, "loss": 2.3601, "step": 18619 }, { "epoch": 0.5, "learning_rate": 0.0010473316307650193, "loss": 2.4998, "step": 18620 }, { "epoch": 0.5, "learning_rate": 0.0010472446889431377, "loss": 2.3092, "step": 18621 }, { "epoch": 0.5, "learning_rate": 0.0010471577467633384, "loss": 2.5672, "step": 18622 }, { "epoch": 0.5, "learning_rate": 0.0010470708042262808, "loss": 2.7127, "step": 18623 }, { "epoch": 0.5, "learning_rate": 0.0010469838613326233, "loss": 2.4294, "step": 18624 }, { "epoch": 0.5, "learning_rate": 0.001046896918083024, "loss": 2.1588, "step": 18625 }, { "epoch": 0.5, "learning_rate": 0.0010468099744781424, "loss": 2.1803, "step": 18626 }, { "epoch": 0.5, "learning_rate": 0.0010467230305186367, "loss": 2.8494, "step": 18627 }, { "epoch": 0.5, "learning_rate": 0.0010466360862051655, "loss": 2.9808, "step": 18628 }, { "epoch": 0.5, "learning_rate": 0.001046549141538388, "loss": 2.3598, "step": 18629 }, { "epoch": 0.5, "learning_rate": 0.0010464621965189625, "loss": 2.4629, "step": 18630 }, { "epoch": 0.5, "learning_rate": 0.0010463752511475472, "loss": 2.3512, "step": 18631 }, { "epoch": 0.5, "learning_rate": 0.001046288305424802, "loss": 2.5948, "step": 18632 }, { "epoch": 0.5, "learning_rate": 0.0010462013593513844, "loss": 2.4102, "step": 18633 }, { "epoch": 0.5, "learning_rate": 0.0010461144129279539, "loss": 2.5231, "step": 18634 }, { "epoch": 0.5, "learning_rate": 0.0010460274661551682, "loss": 2.7274, "step": 18635 }, { "epoch": 0.5, "learning_rate": 0.0010459405190336875, "loss": 2.7189, "step": 18636 }, { "epoch": 0.5, "learning_rate": 0.001045853571564169, "loss": 2.3761, "step": 18637 }, { "epoch": 0.5, "learning_rate": 0.001045766623747272, "loss": 2.5396, "step": 18638 }, { "epoch": 0.5, "learning_rate": 0.0010456796755836557, "loss": 2.4176, "step": 18639 }, { "epoch": 0.5, "learning_rate": 0.0010455927270739782, "loss": 2.5562, "step": 18640 }, { "epoch": 0.5, "learning_rate": 0.0010455057782188984, "loss": 2.4929, "step": 18641 }, { "epoch": 0.5, "learning_rate": 0.0010454188290190747, "loss": 2.5894, "step": 18642 }, { "epoch": 0.5, "learning_rate": 0.0010453318794751663, "loss": 2.0295, "step": 18643 }, { "epoch": 0.5, "learning_rate": 0.0010452449295878315, "loss": 2.469, "step": 18644 }, { "epoch": 0.5, "learning_rate": 0.0010451579793577294, "loss": 2.4918, "step": 18645 }, { "epoch": 0.5, "learning_rate": 0.0010450710287855185, "loss": 2.4982, "step": 18646 }, { "epoch": 0.5, "learning_rate": 0.0010449840778718575, "loss": 2.4321, "step": 18647 }, { "epoch": 0.5, "learning_rate": 0.0010448971266174049, "loss": 2.2588, "step": 18648 }, { "epoch": 0.5, "learning_rate": 0.00104481017502282, "loss": 2.4708, "step": 18649 }, { "epoch": 0.5, "learning_rate": 0.0010447232230887612, "loss": 2.5859, "step": 18650 }, { "epoch": 0.5, "learning_rate": 0.0010446362708158871, "loss": 2.7253, "step": 18651 }, { "epoch": 0.5, "learning_rate": 0.0010445493182048566, "loss": 2.2298, "step": 18652 }, { "epoch": 0.5, "learning_rate": 0.0010444623652563288, "loss": 2.6849, "step": 18653 }, { "epoch": 0.5, "learning_rate": 0.0010443754119709618, "loss": 2.722, "step": 18654 }, { "epoch": 0.5, "learning_rate": 0.0010442884583494148, "loss": 2.5131, "step": 18655 }, { "epoch": 0.5, "learning_rate": 0.001044201504392346, "loss": 2.6811, "step": 18656 }, { "epoch": 0.5, "learning_rate": 0.0010441145501004147, "loss": 2.3629, "step": 18657 }, { "epoch": 0.5, "learning_rate": 0.0010440275954742796, "loss": 2.8188, "step": 18658 }, { "epoch": 0.5, "learning_rate": 0.001043940640514599, "loss": 2.3018, "step": 18659 }, { "epoch": 0.5, "learning_rate": 0.001043853685222032, "loss": 2.5086, "step": 18660 }, { "epoch": 0.5, "learning_rate": 0.0010437667295972375, "loss": 2.6702, "step": 18661 }, { "epoch": 0.5, "learning_rate": 0.001043679773640874, "loss": 2.3564, "step": 18662 }, { "epoch": 0.5, "learning_rate": 0.0010435928173536007, "loss": 2.6223, "step": 18663 }, { "epoch": 0.5, "learning_rate": 0.0010435058607360754, "loss": 2.6949, "step": 18664 }, { "epoch": 0.5, "learning_rate": 0.0010434189037889577, "loss": 2.3969, "step": 18665 }, { "epoch": 0.5, "learning_rate": 0.0010433319465129062, "loss": 2.4832, "step": 18666 }, { "epoch": 0.5, "learning_rate": 0.0010432449889085798, "loss": 2.6638, "step": 18667 }, { "epoch": 0.5, "learning_rate": 0.0010431580309766366, "loss": 2.4542, "step": 18668 }, { "epoch": 0.5, "learning_rate": 0.0010430710727177364, "loss": 2.473, "step": 18669 }, { "epoch": 0.5, "learning_rate": 0.0010429841141325375, "loss": 2.4922, "step": 18670 }, { "epoch": 0.5, "learning_rate": 0.0010428971552216982, "loss": 2.4132, "step": 18671 }, { "epoch": 0.5, "learning_rate": 0.0010428101959858778, "loss": 2.3211, "step": 18672 }, { "epoch": 0.5, "learning_rate": 0.001042723236425735, "loss": 2.0876, "step": 18673 }, { "epoch": 0.5, "learning_rate": 0.001042636276541929, "loss": 2.4741, "step": 18674 }, { "epoch": 0.5, "learning_rate": 0.0010425493163351179, "loss": 2.6191, "step": 18675 }, { "epoch": 0.5, "learning_rate": 0.0010424623558059607, "loss": 2.1092, "step": 18676 }, { "epoch": 0.5, "learning_rate": 0.0010423753949551165, "loss": 2.7289, "step": 18677 }, { "epoch": 0.5, "learning_rate": 0.0010422884337832434, "loss": 2.6137, "step": 18678 }, { "epoch": 0.5, "learning_rate": 0.0010422014722910014, "loss": 2.4493, "step": 18679 }, { "epoch": 0.5, "learning_rate": 0.0010421145104790482, "loss": 2.7168, "step": 18680 }, { "epoch": 0.5, "learning_rate": 0.0010420275483480428, "loss": 2.3505, "step": 18681 }, { "epoch": 0.5, "learning_rate": 0.0010419405858986446, "loss": 2.3201, "step": 18682 }, { "epoch": 0.5, "learning_rate": 0.0010418536231315116, "loss": 2.5967, "step": 18683 }, { "epoch": 0.5, "learning_rate": 0.0010417666600473032, "loss": 2.5541, "step": 18684 }, { "epoch": 0.5, "learning_rate": 0.0010416796966466785, "loss": 2.4191, "step": 18685 }, { "epoch": 0.5, "learning_rate": 0.0010415927329302955, "loss": 2.4577, "step": 18686 }, { "epoch": 0.5, "learning_rate": 0.0010415057688988132, "loss": 2.4229, "step": 18687 }, { "epoch": 0.5, "learning_rate": 0.0010414188045528908, "loss": 2.3585, "step": 18688 }, { "epoch": 0.5, "learning_rate": 0.001041331839893187, "loss": 2.6787, "step": 18689 }, { "epoch": 0.5, "learning_rate": 0.0010412448749203608, "loss": 2.6843, "step": 18690 }, { "epoch": 0.5, "learning_rate": 0.00104115790963507, "loss": 2.6352, "step": 18691 }, { "epoch": 0.5, "learning_rate": 0.001041070944037975, "loss": 2.464, "step": 18692 }, { "epoch": 0.5, "learning_rate": 0.001040983978129734, "loss": 2.7386, "step": 18693 }, { "epoch": 0.5, "learning_rate": 0.001040897011911005, "loss": 2.5207, "step": 18694 }, { "epoch": 0.5, "learning_rate": 0.0010408100453824479, "loss": 2.548, "step": 18695 }, { "epoch": 0.5, "learning_rate": 0.0010407230785447212, "loss": 2.2439, "step": 18696 }, { "epoch": 0.5, "learning_rate": 0.0010406361113984837, "loss": 2.2635, "step": 18697 }, { "epoch": 0.5, "learning_rate": 0.0010405491439443944, "loss": 2.519, "step": 18698 }, { "epoch": 0.5, "learning_rate": 0.001040462176183112, "loss": 2.4882, "step": 18699 }, { "epoch": 0.5, "learning_rate": 0.0010403752081152952, "loss": 2.3397, "step": 18700 }, { "epoch": 0.5, "learning_rate": 0.0010402882397416032, "loss": 2.5217, "step": 18701 }, { "epoch": 0.5, "learning_rate": 0.0010402012710626948, "loss": 2.492, "step": 18702 }, { "epoch": 0.5, "learning_rate": 0.0010401143020792286, "loss": 2.5767, "step": 18703 }, { "epoch": 0.5, "learning_rate": 0.0010400273327918635, "loss": 2.5482, "step": 18704 }, { "epoch": 0.5, "learning_rate": 0.0010399403632012588, "loss": 2.6564, "step": 18705 }, { "epoch": 0.5, "learning_rate": 0.0010398533933080728, "loss": 2.5898, "step": 18706 }, { "epoch": 0.5, "learning_rate": 0.0010397664231129647, "loss": 2.2704, "step": 18707 }, { "epoch": 0.5, "learning_rate": 0.001039679452616593, "loss": 2.5816, "step": 18708 }, { "epoch": 0.5, "learning_rate": 0.0010395924818196174, "loss": 2.2666, "step": 18709 }, { "epoch": 0.5, "learning_rate": 0.0010395055107226962, "loss": 2.3175, "step": 18710 }, { "epoch": 0.5, "learning_rate": 0.0010394185393264876, "loss": 2.3089, "step": 18711 }, { "epoch": 0.5, "learning_rate": 0.0010393315676316519, "loss": 2.8989, "step": 18712 }, { "epoch": 0.5, "learning_rate": 0.0010392445956388472, "loss": 2.3127, "step": 18713 }, { "epoch": 0.5, "learning_rate": 0.0010391576233487324, "loss": 2.5466, "step": 18714 }, { "epoch": 0.5, "learning_rate": 0.0010390706507619662, "loss": 2.8931, "step": 18715 }, { "epoch": 0.5, "learning_rate": 0.0010389836778792081, "loss": 2.7762, "step": 18716 }, { "epoch": 0.5, "learning_rate": 0.0010388967047011161, "loss": 2.9173, "step": 18717 }, { "epoch": 0.5, "learning_rate": 0.00103880973122835, "loss": 2.6279, "step": 18718 }, { "epoch": 0.5, "learning_rate": 0.0010387227574615682, "loss": 2.473, "step": 18719 }, { "epoch": 0.5, "learning_rate": 0.00103863578340143, "loss": 2.4378, "step": 18720 }, { "epoch": 0.5, "learning_rate": 0.0010385488090485938, "loss": 2.6788, "step": 18721 }, { "epoch": 0.5, "learning_rate": 0.0010384618344037187, "loss": 2.4062, "step": 18722 }, { "epoch": 0.5, "learning_rate": 0.0010383748594674637, "loss": 2.8253, "step": 18723 }, { "epoch": 0.5, "learning_rate": 0.0010382878842404874, "loss": 2.5741, "step": 18724 }, { "epoch": 0.5, "learning_rate": 0.0010382009087234491, "loss": 2.3592, "step": 18725 }, { "epoch": 0.5, "learning_rate": 0.0010381139329170075, "loss": 2.3615, "step": 18726 }, { "epoch": 0.5, "learning_rate": 0.0010380269568218215, "loss": 2.4736, "step": 18727 }, { "epoch": 0.5, "learning_rate": 0.0010379399804385503, "loss": 2.8251, "step": 18728 }, { "epoch": 0.5, "learning_rate": 0.0010378530037678526, "loss": 2.748, "step": 18729 }, { "epoch": 0.5, "learning_rate": 0.001037766026810387, "loss": 2.035, "step": 18730 }, { "epoch": 0.5, "learning_rate": 0.001037679049566813, "loss": 2.6669, "step": 18731 }, { "epoch": 0.5, "learning_rate": 0.001037592072037789, "loss": 2.0076, "step": 18732 }, { "epoch": 0.5, "learning_rate": 0.0010375050942239745, "loss": 2.472, "step": 18733 }, { "epoch": 0.5, "learning_rate": 0.0010374181161260277, "loss": 2.4751, "step": 18734 }, { "epoch": 0.5, "learning_rate": 0.0010373311377446083, "loss": 2.3929, "step": 18735 }, { "epoch": 0.5, "learning_rate": 0.0010372441590803748, "loss": 2.9178, "step": 18736 }, { "epoch": 0.5, "learning_rate": 0.0010371571801339862, "loss": 2.5172, "step": 18737 }, { "epoch": 0.5, "learning_rate": 0.0010370702009061012, "loss": 2.6198, "step": 18738 }, { "epoch": 0.5, "learning_rate": 0.0010369832213973796, "loss": 2.3012, "step": 18739 }, { "epoch": 0.5, "learning_rate": 0.0010368962416084791, "loss": 2.5771, "step": 18740 }, { "epoch": 0.5, "learning_rate": 0.0010368092615400597, "loss": 2.4919, "step": 18741 }, { "epoch": 0.5, "learning_rate": 0.0010367222811927795, "loss": 2.82, "step": 18742 }, { "epoch": 0.5, "learning_rate": 0.0010366353005672982, "loss": 2.2957, "step": 18743 }, { "epoch": 0.5, "learning_rate": 0.0010365483196642742, "loss": 2.5746, "step": 18744 }, { "epoch": 0.5, "learning_rate": 0.0010364613384843669, "loss": 2.1456, "step": 18745 }, { "epoch": 0.5, "learning_rate": 0.001036374357028235, "loss": 2.2105, "step": 18746 }, { "epoch": 0.5, "learning_rate": 0.0010362873752965372, "loss": 2.3951, "step": 18747 }, { "epoch": 0.5, "learning_rate": 0.0010362003932899329, "loss": 2.5361, "step": 18748 }, { "epoch": 0.5, "learning_rate": 0.001036113411009081, "loss": 2.5701, "step": 18749 }, { "epoch": 0.5, "learning_rate": 0.0010360264284546398, "loss": 2.9629, "step": 18750 }, { "epoch": 0.5, "learning_rate": 0.0010359394456272695, "loss": 2.6756, "step": 18751 }, { "epoch": 0.5, "learning_rate": 0.0010358524625276283, "loss": 2.7248, "step": 18752 }, { "epoch": 0.5, "learning_rate": 0.0010357654791563749, "loss": 2.6415, "step": 18753 }, { "epoch": 0.5, "learning_rate": 0.0010356784955141687, "loss": 2.4686, "step": 18754 }, { "epoch": 0.5, "learning_rate": 0.0010355915116016688, "loss": 2.8447, "step": 18755 }, { "epoch": 0.5, "learning_rate": 0.001035504527419534, "loss": 2.108, "step": 18756 }, { "epoch": 0.5, "learning_rate": 0.001035417542968423, "loss": 2.4801, "step": 18757 }, { "epoch": 0.5, "learning_rate": 0.001035330558248995, "loss": 2.5752, "step": 18758 }, { "epoch": 0.5, "learning_rate": 0.0010352435732619094, "loss": 2.2206, "step": 18759 }, { "epoch": 0.5, "learning_rate": 0.0010351565880078245, "loss": 2.4235, "step": 18760 }, { "epoch": 0.5, "learning_rate": 0.0010350696024873996, "loss": 2.0759, "step": 18761 }, { "epoch": 0.5, "learning_rate": 0.0010349826167012936, "loss": 3.017, "step": 18762 }, { "epoch": 0.5, "learning_rate": 0.0010348956306501656, "loss": 2.4069, "step": 18763 }, { "epoch": 0.5, "learning_rate": 0.0010348086443346747, "loss": 2.5215, "step": 18764 }, { "epoch": 0.5, "learning_rate": 0.0010347216577554796, "loss": 2.9877, "step": 18765 }, { "epoch": 0.5, "learning_rate": 0.0010346346709132394, "loss": 2.3831, "step": 18766 }, { "epoch": 0.5, "learning_rate": 0.0010345476838086133, "loss": 2.612, "step": 18767 }, { "epoch": 0.5, "learning_rate": 0.00103446069644226, "loss": 2.5815, "step": 18768 }, { "epoch": 0.5, "learning_rate": 0.0010343737088148385, "loss": 2.5289, "step": 18769 }, { "epoch": 0.5, "learning_rate": 0.001034286720927008, "loss": 3.1811, "step": 18770 }, { "epoch": 0.5, "learning_rate": 0.0010341997327794274, "loss": 2.8999, "step": 18771 }, { "epoch": 0.5, "learning_rate": 0.001034112744372756, "loss": 2.5433, "step": 18772 }, { "epoch": 0.5, "learning_rate": 0.0010340257557076525, "loss": 2.8234, "step": 18773 }, { "epoch": 0.5, "learning_rate": 0.0010339387667847755, "loss": 2.2253, "step": 18774 }, { "epoch": 0.5, "learning_rate": 0.0010338517776047852, "loss": 2.649, "step": 18775 }, { "epoch": 0.5, "learning_rate": 0.0010337647881683391, "loss": 2.363, "step": 18776 }, { "epoch": 0.5, "learning_rate": 0.0010336777984760975, "loss": 2.4624, "step": 18777 }, { "epoch": 0.5, "learning_rate": 0.0010335908085287188, "loss": 2.5391, "step": 18778 }, { "epoch": 0.5, "learning_rate": 0.0010335038183268623, "loss": 2.4695, "step": 18779 }, { "epoch": 0.5, "learning_rate": 0.0010334168278711866, "loss": 2.6342, "step": 18780 }, { "epoch": 0.5, "learning_rate": 0.0010333298371623509, "loss": 2.2847, "step": 18781 }, { "epoch": 0.5, "learning_rate": 0.0010332428462010146, "loss": 2.3688, "step": 18782 }, { "epoch": 0.5, "learning_rate": 0.0010331558549878364, "loss": 2.6065, "step": 18783 }, { "epoch": 0.5, "learning_rate": 0.0010330688635234752, "loss": 2.797, "step": 18784 }, { "epoch": 0.5, "learning_rate": 0.0010329818718085905, "loss": 2.5814, "step": 18785 }, { "epoch": 0.5, "learning_rate": 0.001032894879843841, "loss": 2.1573, "step": 18786 }, { "epoch": 0.5, "learning_rate": 0.0010328078876298853, "loss": 2.2834, "step": 18787 }, { "epoch": 0.5, "learning_rate": 0.0010327208951673834, "loss": 2.6639, "step": 18788 }, { "epoch": 0.5, "learning_rate": 0.0010326339024569935, "loss": 2.7791, "step": 18789 }, { "epoch": 0.5, "learning_rate": 0.0010325469094993752, "loss": 2.4105, "step": 18790 }, { "epoch": 0.5, "learning_rate": 0.0010324599162951874, "loss": 2.6325, "step": 18791 }, { "epoch": 0.51, "learning_rate": 0.001032372922845089, "loss": 2.6178, "step": 18792 }, { "epoch": 0.51, "learning_rate": 0.001032285929149739, "loss": 2.4754, "step": 18793 }, { "epoch": 0.51, "learning_rate": 0.0010321989352097968, "loss": 2.9679, "step": 18794 }, { "epoch": 0.51, "learning_rate": 0.001032111941025921, "loss": 2.5953, "step": 18795 }, { "epoch": 0.51, "learning_rate": 0.001032024946598771, "loss": 2.5045, "step": 18796 }, { "epoch": 0.51, "learning_rate": 0.0010319379519290056, "loss": 2.8164, "step": 18797 }, { "epoch": 0.51, "learning_rate": 0.001031850957017284, "loss": 2.5278, "step": 18798 }, { "epoch": 0.51, "learning_rate": 0.0010317639618642655, "loss": 2.577, "step": 18799 }, { "epoch": 0.51, "learning_rate": 0.0010316769664706084, "loss": 2.8705, "step": 18800 }, { "epoch": 0.51, "learning_rate": 0.001031589970836973, "loss": 2.4942, "step": 18801 }, { "epoch": 0.51, "learning_rate": 0.0010315029749640172, "loss": 2.6761, "step": 18802 }, { "epoch": 0.51, "learning_rate": 0.0010314159788524005, "loss": 2.7495, "step": 18803 }, { "epoch": 0.51, "learning_rate": 0.0010313289825027818, "loss": 2.6794, "step": 18804 }, { "epoch": 0.51, "learning_rate": 0.0010312419859158206, "loss": 2.4026, "step": 18805 }, { "epoch": 0.51, "learning_rate": 0.0010311549890921754, "loss": 2.6136, "step": 18806 }, { "epoch": 0.51, "learning_rate": 0.0010310679920325061, "loss": 2.3063, "step": 18807 }, { "epoch": 0.51, "learning_rate": 0.001030980994737471, "loss": 2.3949, "step": 18808 }, { "epoch": 0.51, "learning_rate": 0.0010308939972077291, "loss": 2.4786, "step": 18809 }, { "epoch": 0.51, "learning_rate": 0.0010308069994439401, "loss": 2.6215, "step": 18810 }, { "epoch": 0.51, "learning_rate": 0.0010307200014467628, "loss": 2.4428, "step": 18811 }, { "epoch": 0.51, "learning_rate": 0.0010306330032168562, "loss": 2.7147, "step": 18812 }, { "epoch": 0.51, "learning_rate": 0.0010305460047548795, "loss": 2.4198, "step": 18813 }, { "epoch": 0.51, "learning_rate": 0.0010304590060614916, "loss": 2.5758, "step": 18814 }, { "epoch": 0.51, "learning_rate": 0.001030372007137352, "loss": 2.6308, "step": 18815 }, { "epoch": 0.51, "learning_rate": 0.0010302850079831193, "loss": 2.6883, "step": 18816 }, { "epoch": 0.51, "learning_rate": 0.0010301980085994525, "loss": 2.5094, "step": 18817 }, { "epoch": 0.51, "learning_rate": 0.0010301110089870114, "loss": 2.7309, "step": 18818 }, { "epoch": 0.51, "learning_rate": 0.0010300240091464543, "loss": 2.6975, "step": 18819 }, { "epoch": 0.51, "learning_rate": 0.001029937009078441, "loss": 2.7595, "step": 18820 }, { "epoch": 0.51, "learning_rate": 0.0010298500087836302, "loss": 2.6412, "step": 18821 }, { "epoch": 0.51, "learning_rate": 0.0010297630082626813, "loss": 2.4273, "step": 18822 }, { "epoch": 0.51, "learning_rate": 0.0010296760075162528, "loss": 2.2629, "step": 18823 }, { "epoch": 0.51, "learning_rate": 0.0010295890065450041, "loss": 2.2846, "step": 18824 }, { "epoch": 0.51, "learning_rate": 0.001029502005349595, "loss": 2.5135, "step": 18825 }, { "epoch": 0.51, "learning_rate": 0.0010294150039306834, "loss": 2.597, "step": 18826 }, { "epoch": 0.51, "learning_rate": 0.0010293280022889292, "loss": 2.599, "step": 18827 }, { "epoch": 0.51, "learning_rate": 0.001029241000424991, "loss": 2.2486, "step": 18828 }, { "epoch": 0.51, "learning_rate": 0.0010291539983395285, "loss": 2.6431, "step": 18829 }, { "epoch": 0.51, "learning_rate": 0.0010290669960332007, "loss": 2.8401, "step": 18830 }, { "epoch": 0.51, "learning_rate": 0.0010289799935066662, "loss": 2.372, "step": 18831 }, { "epoch": 0.51, "learning_rate": 0.0010288929907605847, "loss": 2.9572, "step": 18832 }, { "epoch": 0.51, "learning_rate": 0.0010288059877956149, "loss": 2.423, "step": 18833 }, { "epoch": 0.51, "learning_rate": 0.001028718984612416, "loss": 3.0072, "step": 18834 }, { "epoch": 0.51, "learning_rate": 0.0010286319812116474, "loss": 2.8062, "step": 18835 }, { "epoch": 0.51, "learning_rate": 0.0010285449775939677, "loss": 2.6298, "step": 18836 }, { "epoch": 0.51, "learning_rate": 0.0010284579737600368, "loss": 1.9909, "step": 18837 }, { "epoch": 0.51, "learning_rate": 0.0010283709697105133, "loss": 2.7486, "step": 18838 }, { "epoch": 0.51, "learning_rate": 0.0010282839654460563, "loss": 2.0804, "step": 18839 }, { "epoch": 0.51, "learning_rate": 0.001028196960967325, "loss": 2.5756, "step": 18840 }, { "epoch": 0.51, "learning_rate": 0.0010281099562749784, "loss": 2.2229, "step": 18841 }, { "epoch": 0.51, "learning_rate": 0.0010280229513696761, "loss": 2.515, "step": 18842 }, { "epoch": 0.51, "learning_rate": 0.0010279359462520767, "loss": 2.7278, "step": 18843 }, { "epoch": 0.51, "learning_rate": 0.0010278489409228397, "loss": 2.5584, "step": 18844 }, { "epoch": 0.51, "learning_rate": 0.0010277619353826245, "loss": 2.6099, "step": 18845 }, { "epoch": 0.51, "learning_rate": 0.001027674929632089, "loss": 2.7705, "step": 18846 }, { "epoch": 0.51, "learning_rate": 0.0010275879236718937, "loss": 2.3463, "step": 18847 }, { "epoch": 0.51, "learning_rate": 0.0010275009175026973, "loss": 3.0523, "step": 18848 }, { "epoch": 0.51, "learning_rate": 0.0010274139111251586, "loss": 2.3466, "step": 18849 }, { "epoch": 0.51, "learning_rate": 0.0010273269045399372, "loss": 2.3649, "step": 18850 }, { "epoch": 0.51, "learning_rate": 0.0010272398977476918, "loss": 2.6217, "step": 18851 }, { "epoch": 0.51, "learning_rate": 0.001027152890749082, "loss": 2.6305, "step": 18852 }, { "epoch": 0.51, "learning_rate": 0.0010270658835447668, "loss": 2.7265, "step": 18853 }, { "epoch": 0.51, "learning_rate": 0.0010269788761354053, "loss": 2.4028, "step": 18854 }, { "epoch": 0.51, "learning_rate": 0.0010268918685216565, "loss": 2.4969, "step": 18855 }, { "epoch": 0.51, "learning_rate": 0.0010268048607041797, "loss": 2.5713, "step": 18856 }, { "epoch": 0.51, "learning_rate": 0.0010267178526836343, "loss": 2.8607, "step": 18857 }, { "epoch": 0.51, "learning_rate": 0.0010266308444606793, "loss": 2.5392, "step": 18858 }, { "epoch": 0.51, "learning_rate": 0.001026543836035973, "loss": 2.7085, "step": 18859 }, { "epoch": 0.51, "learning_rate": 0.0010264568274101762, "loss": 2.3723, "step": 18860 }, { "epoch": 0.51, "learning_rate": 0.0010263698185839472, "loss": 2.3837, "step": 18861 }, { "epoch": 0.51, "learning_rate": 0.0010262828095579447, "loss": 2.6901, "step": 18862 }, { "epoch": 0.51, "learning_rate": 0.0010261958003328284, "loss": 2.7346, "step": 18863 }, { "epoch": 0.51, "learning_rate": 0.0010261087909092578, "loss": 2.8596, "step": 18864 }, { "epoch": 0.51, "learning_rate": 0.0010260217812878914, "loss": 2.5601, "step": 18865 }, { "epoch": 0.51, "learning_rate": 0.0010259347714693884, "loss": 2.8232, "step": 18866 }, { "epoch": 0.51, "learning_rate": 0.0010258477614544083, "loss": 2.8819, "step": 18867 }, { "epoch": 0.51, "learning_rate": 0.0010257607512436106, "loss": 2.4299, "step": 18868 }, { "epoch": 0.51, "learning_rate": 0.0010256737408376538, "loss": 2.8644, "step": 18869 }, { "epoch": 0.51, "learning_rate": 0.001025586730237197, "loss": 2.7845, "step": 18870 }, { "epoch": 0.51, "learning_rate": 0.0010254997194429002, "loss": 2.9167, "step": 18871 }, { "epoch": 0.51, "learning_rate": 0.001025412708455422, "loss": 2.5925, "step": 18872 }, { "epoch": 0.51, "learning_rate": 0.0010253256972754215, "loss": 2.5523, "step": 18873 }, { "epoch": 0.51, "learning_rate": 0.001025238685903558, "loss": 2.66, "step": 18874 }, { "epoch": 0.51, "learning_rate": 0.001025151674340491, "loss": 2.3783, "step": 18875 }, { "epoch": 0.51, "learning_rate": 0.001025064662586879, "loss": 2.3099, "step": 18876 }, { "epoch": 0.51, "learning_rate": 0.001024977650643382, "loss": 2.5152, "step": 18877 }, { "epoch": 0.51, "learning_rate": 0.0010248906385106587, "loss": 2.6136, "step": 18878 }, { "epoch": 0.51, "learning_rate": 0.001024803626189368, "loss": 2.4915, "step": 18879 }, { "epoch": 0.51, "learning_rate": 0.00102471661368017, "loss": 2.7943, "step": 18880 }, { "epoch": 0.51, "learning_rate": 0.0010246296009837233, "loss": 2.5096, "step": 18881 }, { "epoch": 0.51, "learning_rate": 0.0010245425881006869, "loss": 2.9986, "step": 18882 }, { "epoch": 0.51, "learning_rate": 0.0010244555750317202, "loss": 2.2679, "step": 18883 }, { "epoch": 0.51, "learning_rate": 0.0010243685617774827, "loss": 2.5211, "step": 18884 }, { "epoch": 0.51, "learning_rate": 0.001024281548338633, "loss": 2.5092, "step": 18885 }, { "epoch": 0.51, "learning_rate": 0.0010241945347158308, "loss": 2.4725, "step": 18886 }, { "epoch": 0.51, "learning_rate": 0.0010241075209097353, "loss": 2.0578, "step": 18887 }, { "epoch": 0.51, "learning_rate": 0.0010240205069210054, "loss": 2.3457, "step": 18888 }, { "epoch": 0.51, "learning_rate": 0.0010239334927503003, "loss": 2.4791, "step": 18889 }, { "epoch": 0.51, "learning_rate": 0.0010238464783982792, "loss": 2.7729, "step": 18890 }, { "epoch": 0.51, "learning_rate": 0.001023759463865602, "loss": 2.6812, "step": 18891 }, { "epoch": 0.51, "learning_rate": 0.0010236724491529269, "loss": 2.2569, "step": 18892 }, { "epoch": 0.51, "learning_rate": 0.0010235854342609137, "loss": 2.7217, "step": 18893 }, { "epoch": 0.51, "learning_rate": 0.0010234984191902215, "loss": 3.0889, "step": 18894 }, { "epoch": 0.51, "learning_rate": 0.0010234114039415095, "loss": 2.72, "step": 18895 }, { "epoch": 0.51, "learning_rate": 0.0010233243885154366, "loss": 2.3149, "step": 18896 }, { "epoch": 0.51, "learning_rate": 0.0010232373729126627, "loss": 2.4423, "step": 18897 }, { "epoch": 0.51, "learning_rate": 0.0010231503571338464, "loss": 2.5839, "step": 18898 }, { "epoch": 0.51, "learning_rate": 0.001023063341179647, "loss": 2.2538, "step": 18899 }, { "epoch": 0.51, "learning_rate": 0.0010229763250507243, "loss": 2.551, "step": 18900 }, { "epoch": 0.51, "learning_rate": 0.001022889308747737, "loss": 2.6067, "step": 18901 }, { "epoch": 0.51, "learning_rate": 0.0010228022922713436, "loss": 2.4102, "step": 18902 }, { "epoch": 0.51, "learning_rate": 0.001022715275622205, "loss": 2.1843, "step": 18903 }, { "epoch": 0.51, "learning_rate": 0.0010226282588009792, "loss": 2.7736, "step": 18904 }, { "epoch": 0.51, "learning_rate": 0.0010225412418083258, "loss": 2.3245, "step": 18905 }, { "epoch": 0.51, "learning_rate": 0.0010224542246449037, "loss": 2.7359, "step": 18906 }, { "epoch": 0.51, "learning_rate": 0.0010223672073113729, "loss": 2.3413, "step": 18907 }, { "epoch": 0.51, "learning_rate": 0.001022280189808392, "loss": 2.3324, "step": 18908 }, { "epoch": 0.51, "learning_rate": 0.00102219317213662, "loss": 2.5312, "step": 18909 }, { "epoch": 0.51, "learning_rate": 0.001022106154296717, "loss": 2.2603, "step": 18910 }, { "epoch": 0.51, "learning_rate": 0.0010220191362893415, "loss": 2.3753, "step": 18911 }, { "epoch": 0.51, "learning_rate": 0.0010219321181151528, "loss": 1.7506, "step": 18912 }, { "epoch": 0.51, "learning_rate": 0.0010218450997748103, "loss": 2.7082, "step": 18913 }, { "epoch": 0.51, "learning_rate": 0.0010217580812689735, "loss": 2.2514, "step": 18914 }, { "epoch": 0.51, "learning_rate": 0.0010216710625983011, "loss": 2.7371, "step": 18915 }, { "epoch": 0.51, "learning_rate": 0.001021584043763453, "loss": 2.5835, "step": 18916 }, { "epoch": 0.51, "learning_rate": 0.0010214970247650877, "loss": 2.5647, "step": 18917 }, { "epoch": 0.51, "learning_rate": 0.0010214100056038652, "loss": 2.6657, "step": 18918 }, { "epoch": 0.51, "learning_rate": 0.0010213229862804437, "loss": 2.4407, "step": 18919 }, { "epoch": 0.51, "learning_rate": 0.0010212359667954836, "loss": 2.4482, "step": 18920 }, { "epoch": 0.51, "learning_rate": 0.0010211489471496432, "loss": 2.4265, "step": 18921 }, { "epoch": 0.51, "learning_rate": 0.001021061927343582, "loss": 2.7252, "step": 18922 }, { "epoch": 0.51, "learning_rate": 0.0010209749073779601, "loss": 2.4143, "step": 18923 }, { "epoch": 0.51, "learning_rate": 0.001020887887253436, "loss": 2.6157, "step": 18924 }, { "epoch": 0.51, "learning_rate": 0.0010208008669706683, "loss": 2.7271, "step": 18925 }, { "epoch": 0.51, "learning_rate": 0.0010207138465303173, "loss": 2.6756, "step": 18926 }, { "epoch": 0.51, "learning_rate": 0.0010206268259330422, "loss": 2.4441, "step": 18927 }, { "epoch": 0.51, "learning_rate": 0.0010205398051795016, "loss": 2.5728, "step": 18928 }, { "epoch": 0.51, "learning_rate": 0.001020452784270355, "loss": 2.2952, "step": 18929 }, { "epoch": 0.51, "learning_rate": 0.0010203657632062622, "loss": 2.5161, "step": 18930 }, { "epoch": 0.51, "learning_rate": 0.0010202787419878818, "loss": 2.3511, "step": 18931 }, { "epoch": 0.51, "learning_rate": 0.0010201917206158733, "loss": 2.7646, "step": 18932 }, { "epoch": 0.51, "learning_rate": 0.0010201046990908958, "loss": 2.7499, "step": 18933 }, { "epoch": 0.51, "learning_rate": 0.001020017677413609, "loss": 2.5447, "step": 18934 }, { "epoch": 0.51, "learning_rate": 0.0010199306555846715, "loss": 2.1848, "step": 18935 }, { "epoch": 0.51, "learning_rate": 0.0010198436336047432, "loss": 2.1791, "step": 18936 }, { "epoch": 0.51, "learning_rate": 0.0010197566114744827, "loss": 2.4897, "step": 18937 }, { "epoch": 0.51, "learning_rate": 0.00101966958919455, "loss": 2.7133, "step": 18938 }, { "epoch": 0.51, "learning_rate": 0.001019582566765604, "loss": 2.3941, "step": 18939 }, { "epoch": 0.51, "learning_rate": 0.001019495544188304, "loss": 2.5226, "step": 18940 }, { "epoch": 0.51, "learning_rate": 0.001019408521463309, "loss": 2.631, "step": 18941 }, { "epoch": 0.51, "learning_rate": 0.0010193214985912784, "loss": 2.4491, "step": 18942 }, { "epoch": 0.51, "learning_rate": 0.001019234475572872, "loss": 2.6169, "step": 18943 }, { "epoch": 0.51, "learning_rate": 0.0010191474524087485, "loss": 2.4077, "step": 18944 }, { "epoch": 0.51, "learning_rate": 0.001019060429099567, "loss": 2.3538, "step": 18945 }, { "epoch": 0.51, "learning_rate": 0.0010189734056459876, "loss": 2.4375, "step": 18946 }, { "epoch": 0.51, "learning_rate": 0.0010188863820486688, "loss": 2.3786, "step": 18947 }, { "epoch": 0.51, "learning_rate": 0.0010187993583082703, "loss": 2.8344, "step": 18948 }, { "epoch": 0.51, "learning_rate": 0.001018712334425451, "loss": 2.543, "step": 18949 }, { "epoch": 0.51, "learning_rate": 0.0010186253104008708, "loss": 2.5265, "step": 18950 }, { "epoch": 0.51, "learning_rate": 0.0010185382862351882, "loss": 2.6245, "step": 18951 }, { "epoch": 0.51, "learning_rate": 0.0010184512619290627, "loss": 2.5475, "step": 18952 }, { "epoch": 0.51, "learning_rate": 0.0010183642374831541, "loss": 2.7669, "step": 18953 }, { "epoch": 0.51, "learning_rate": 0.0010182772128981214, "loss": 2.6662, "step": 18954 }, { "epoch": 0.51, "learning_rate": 0.0010181901881746237, "loss": 2.3513, "step": 18955 }, { "epoch": 0.51, "learning_rate": 0.00101810316331332, "loss": 2.5706, "step": 18956 }, { "epoch": 0.51, "learning_rate": 0.0010180161383148705, "loss": 3.0527, "step": 18957 }, { "epoch": 0.51, "learning_rate": 0.0010179291131799336, "loss": 2.4873, "step": 18958 }, { "epoch": 0.51, "learning_rate": 0.0010178420879091692, "loss": 2.9856, "step": 18959 }, { "epoch": 0.51, "learning_rate": 0.001017755062503236, "loss": 2.5056, "step": 18960 }, { "epoch": 0.51, "learning_rate": 0.0010176680369627942, "loss": 2.2467, "step": 18961 }, { "epoch": 0.51, "learning_rate": 0.001017581011288502, "loss": 2.7828, "step": 18962 }, { "epoch": 0.51, "learning_rate": 0.0010174939854810194, "loss": 2.389, "step": 18963 }, { "epoch": 0.51, "learning_rate": 0.0010174069595410055, "loss": 2.2238, "step": 18964 }, { "epoch": 0.51, "learning_rate": 0.0010173199334691193, "loss": 2.3681, "step": 18965 }, { "epoch": 0.51, "learning_rate": 0.0010172329072660206, "loss": 2.5475, "step": 18966 }, { "epoch": 0.51, "learning_rate": 0.0010171458809323688, "loss": 2.6701, "step": 18967 }, { "epoch": 0.51, "learning_rate": 0.0010170588544688222, "loss": 2.4527, "step": 18968 }, { "epoch": 0.51, "learning_rate": 0.0010169718278760411, "loss": 2.5727, "step": 18969 }, { "epoch": 0.51, "learning_rate": 0.0010168848011546847, "loss": 2.6958, "step": 18970 }, { "epoch": 0.51, "learning_rate": 0.0010167977743054117, "loss": 2.584, "step": 18971 }, { "epoch": 0.51, "learning_rate": 0.0010167107473288818, "loss": 2.2138, "step": 18972 }, { "epoch": 0.51, "learning_rate": 0.0010166237202257546, "loss": 2.1551, "step": 18973 }, { "epoch": 0.51, "learning_rate": 0.001016536692996689, "loss": 2.5861, "step": 18974 }, { "epoch": 0.51, "learning_rate": 0.0010164496656423442, "loss": 2.743, "step": 18975 }, { "epoch": 0.51, "learning_rate": 0.0010163626381633794, "loss": 2.8327, "step": 18976 }, { "epoch": 0.51, "learning_rate": 0.0010162756105604547, "loss": 2.4554, "step": 18977 }, { "epoch": 0.51, "learning_rate": 0.0010161885828342285, "loss": 2.5892, "step": 18978 }, { "epoch": 0.51, "learning_rate": 0.0010161015549853608, "loss": 2.5276, "step": 18979 }, { "epoch": 0.51, "learning_rate": 0.0010160145270145106, "loss": 2.6288, "step": 18980 }, { "epoch": 0.51, "learning_rate": 0.0010159274989223368, "loss": 2.5063, "step": 18981 }, { "epoch": 0.51, "learning_rate": 0.0010158404707094994, "loss": 2.2997, "step": 18982 }, { "epoch": 0.51, "learning_rate": 0.0010157534423766575, "loss": 2.8207, "step": 18983 }, { "epoch": 0.51, "learning_rate": 0.0010156664139244701, "loss": 2.4313, "step": 18984 }, { "epoch": 0.51, "learning_rate": 0.0010155793853535969, "loss": 2.4957, "step": 18985 }, { "epoch": 0.51, "learning_rate": 0.0010154923566646971, "loss": 2.2646, "step": 18986 }, { "epoch": 0.51, "learning_rate": 0.00101540532785843, "loss": 2.9532, "step": 18987 }, { "epoch": 0.51, "learning_rate": 0.0010153182989354546, "loss": 2.1874, "step": 18988 }, { "epoch": 0.51, "learning_rate": 0.0010152312698964308, "loss": 2.604, "step": 18989 }, { "epoch": 0.51, "learning_rate": 0.0010151442407420176, "loss": 2.3185, "step": 18990 }, { "epoch": 0.51, "learning_rate": 0.0010150572114728741, "loss": 2.1852, "step": 18991 }, { "epoch": 0.51, "learning_rate": 0.0010149701820896602, "loss": 2.4462, "step": 18992 }, { "epoch": 0.51, "learning_rate": 0.0010148831525930348, "loss": 2.1287, "step": 18993 }, { "epoch": 0.51, "learning_rate": 0.001014796122983657, "loss": 2.4376, "step": 18994 }, { "epoch": 0.51, "learning_rate": 0.0010147090932621865, "loss": 2.86, "step": 18995 }, { "epoch": 0.51, "learning_rate": 0.0010146220634292828, "loss": 2.6023, "step": 18996 }, { "epoch": 0.51, "learning_rate": 0.0010145350334856051, "loss": 2.5476, "step": 18997 }, { "epoch": 0.51, "learning_rate": 0.0010144480034318122, "loss": 2.3968, "step": 18998 }, { "epoch": 0.51, "learning_rate": 0.001014360973268564, "loss": 2.7297, "step": 18999 }, { "epoch": 0.51, "learning_rate": 0.0010142739429965196, "loss": 2.6205, "step": 19000 }, { "epoch": 0.51, "learning_rate": 0.001014186912616338, "loss": 2.6675, "step": 19001 }, { "epoch": 0.51, "learning_rate": 0.0010140998821286796, "loss": 2.6656, "step": 19002 }, { "epoch": 0.51, "learning_rate": 0.0010140128515342024, "loss": 2.5326, "step": 19003 }, { "epoch": 0.51, "learning_rate": 0.0010139258208335664, "loss": 2.7181, "step": 19004 }, { "epoch": 0.51, "learning_rate": 0.001013838790027431, "loss": 2.8316, "step": 19005 }, { "epoch": 0.51, "learning_rate": 0.0010137517591164557, "loss": 2.6026, "step": 19006 }, { "epoch": 0.51, "learning_rate": 0.0010136647281012991, "loss": 2.0306, "step": 19007 }, { "epoch": 0.51, "learning_rate": 0.0010135776969826212, "loss": 2.4947, "step": 19008 }, { "epoch": 0.51, "learning_rate": 0.0010134906657610812, "loss": 2.3865, "step": 19009 }, { "epoch": 0.51, "learning_rate": 0.0010134036344373381, "loss": 2.551, "step": 19010 }, { "epoch": 0.51, "learning_rate": 0.0010133166030120513, "loss": 2.328, "step": 19011 }, { "epoch": 0.51, "learning_rate": 0.0010132295714858806, "loss": 2.1932, "step": 19012 }, { "epoch": 0.51, "learning_rate": 0.001013142539859485, "loss": 2.6773, "step": 19013 }, { "epoch": 0.51, "learning_rate": 0.0010130555081335237, "loss": 2.3901, "step": 19014 }, { "epoch": 0.51, "learning_rate": 0.001012968476308656, "loss": 2.29, "step": 19015 }, { "epoch": 0.51, "learning_rate": 0.001012881444385542, "loss": 3.2497, "step": 19016 }, { "epoch": 0.51, "learning_rate": 0.0010127944123648402, "loss": 2.1446, "step": 19017 }, { "epoch": 0.51, "learning_rate": 0.0010127073802472103, "loss": 2.5079, "step": 19018 }, { "epoch": 0.51, "learning_rate": 0.0010126203480333117, "loss": 2.1533, "step": 19019 }, { "epoch": 0.51, "learning_rate": 0.0010125333157238036, "loss": 2.4862, "step": 19020 }, { "epoch": 0.51, "learning_rate": 0.001012446283319345, "loss": 2.2809, "step": 19021 }, { "epoch": 0.51, "learning_rate": 0.0010123592508205954, "loss": 2.9853, "step": 19022 }, { "epoch": 0.51, "learning_rate": 0.0010122722182282148, "loss": 3.0058, "step": 19023 }, { "epoch": 0.51, "learning_rate": 0.001012185185542862, "loss": 2.2137, "step": 19024 }, { "epoch": 0.51, "learning_rate": 0.0010120981527651964, "loss": 2.5157, "step": 19025 }, { "epoch": 0.51, "learning_rate": 0.0010120111198958772, "loss": 2.7763, "step": 19026 }, { "epoch": 0.51, "learning_rate": 0.0010119240869355642, "loss": 2.2638, "step": 19027 }, { "epoch": 0.51, "learning_rate": 0.001011837053884916, "loss": 2.6647, "step": 19028 }, { "epoch": 0.51, "learning_rate": 0.001011750020744593, "loss": 2.3326, "step": 19029 }, { "epoch": 0.51, "learning_rate": 0.0010116629875152531, "loss": 2.3781, "step": 19030 }, { "epoch": 0.51, "learning_rate": 0.0010115759541975571, "loss": 2.2321, "step": 19031 }, { "epoch": 0.51, "learning_rate": 0.0010114889207921637, "loss": 3.1581, "step": 19032 }, { "epoch": 0.51, "learning_rate": 0.0010114018872997323, "loss": 2.2215, "step": 19033 }, { "epoch": 0.51, "learning_rate": 0.001011314853720922, "loss": 2.6553, "step": 19034 }, { "epoch": 0.51, "learning_rate": 0.0010112278200563928, "loss": 2.6621, "step": 19035 }, { "epoch": 0.51, "learning_rate": 0.0010111407863068033, "loss": 2.6362, "step": 19036 }, { "epoch": 0.51, "learning_rate": 0.0010110537524728133, "loss": 2.7914, "step": 19037 }, { "epoch": 0.51, "learning_rate": 0.0010109667185550816, "loss": 2.1637, "step": 19038 }, { "epoch": 0.51, "learning_rate": 0.0010108796845542686, "loss": 2.3778, "step": 19039 }, { "epoch": 0.51, "learning_rate": 0.001010792650471033, "loss": 2.2406, "step": 19040 }, { "epoch": 0.51, "learning_rate": 0.0010107056163060342, "loss": 2.5449, "step": 19041 }, { "epoch": 0.51, "learning_rate": 0.0010106185820599313, "loss": 2.762, "step": 19042 }, { "epoch": 0.51, "learning_rate": 0.0010105315477333843, "loss": 2.1563, "step": 19043 }, { "epoch": 0.51, "learning_rate": 0.001010444513327052, "loss": 2.0231, "step": 19044 }, { "epoch": 0.51, "learning_rate": 0.001010357478841594, "loss": 2.4798, "step": 19045 }, { "epoch": 0.51, "learning_rate": 0.001010270444277669, "loss": 2.3422, "step": 19046 }, { "epoch": 0.51, "learning_rate": 0.0010101834096359374, "loss": 2.6061, "step": 19047 }, { "epoch": 0.51, "learning_rate": 0.0010100963749170584, "loss": 2.5002, "step": 19048 }, { "epoch": 0.51, "learning_rate": 0.001010009340121691, "loss": 2.6066, "step": 19049 }, { "epoch": 0.51, "learning_rate": 0.0010099223052504943, "loss": 2.4028, "step": 19050 }, { "epoch": 0.51, "learning_rate": 0.001009835270304128, "loss": 2.275, "step": 19051 }, { "epoch": 0.51, "learning_rate": 0.0010097482352832516, "loss": 2.4126, "step": 19052 }, { "epoch": 0.51, "learning_rate": 0.0010096612001885244, "loss": 2.6849, "step": 19053 }, { "epoch": 0.51, "learning_rate": 0.0010095741650206053, "loss": 2.7336, "step": 19054 }, { "epoch": 0.51, "learning_rate": 0.0010094871297801544, "loss": 2.7844, "step": 19055 }, { "epoch": 0.51, "learning_rate": 0.0010094000944678308, "loss": 2.665, "step": 19056 }, { "epoch": 0.51, "learning_rate": 0.0010093130590842936, "loss": 2.2958, "step": 19057 }, { "epoch": 0.51, "learning_rate": 0.0010092260236302022, "loss": 2.6262, "step": 19058 }, { "epoch": 0.51, "learning_rate": 0.0010091389881062163, "loss": 2.5696, "step": 19059 }, { "epoch": 0.51, "learning_rate": 0.0010090519525129949, "loss": 3.1147, "step": 19060 }, { "epoch": 0.51, "learning_rate": 0.0010089649168511974, "loss": 2.7438, "step": 19061 }, { "epoch": 0.51, "learning_rate": 0.0010088778811214835, "loss": 2.7657, "step": 19062 }, { "epoch": 0.51, "learning_rate": 0.0010087908453245125, "loss": 2.743, "step": 19063 }, { "epoch": 0.51, "learning_rate": 0.0010087038094609435, "loss": 2.4496, "step": 19064 }, { "epoch": 0.51, "learning_rate": 0.0010086167735314357, "loss": 2.8702, "step": 19065 }, { "epoch": 0.51, "learning_rate": 0.0010085297375366494, "loss": 2.335, "step": 19066 }, { "epoch": 0.51, "learning_rate": 0.0010084427014772426, "loss": 2.6853, "step": 19067 }, { "epoch": 0.51, "learning_rate": 0.001008355665353876, "loss": 2.3138, "step": 19068 }, { "epoch": 0.51, "learning_rate": 0.001008268629167208, "loss": 2.9478, "step": 19069 }, { "epoch": 0.51, "learning_rate": 0.0010081815929178985, "loss": 2.8091, "step": 19070 }, { "epoch": 0.51, "learning_rate": 0.0010080945566066067, "loss": 1.8789, "step": 19071 }, { "epoch": 0.51, "learning_rate": 0.001008007520233992, "loss": 2.731, "step": 19072 }, { "epoch": 0.51, "learning_rate": 0.0010079204838007137, "loss": 2.9085, "step": 19073 }, { "epoch": 0.51, "learning_rate": 0.0010078334473074314, "loss": 2.6127, "step": 19074 }, { "epoch": 0.51, "learning_rate": 0.001007746410754804, "loss": 2.4042, "step": 19075 }, { "epoch": 0.51, "learning_rate": 0.0010076593741434915, "loss": 2.4861, "step": 19076 }, { "epoch": 0.51, "learning_rate": 0.0010075723374741526, "loss": 2.9548, "step": 19077 }, { "epoch": 0.51, "learning_rate": 0.0010074853007474474, "loss": 2.7916, "step": 19078 }, { "epoch": 0.51, "learning_rate": 0.0010073982639640347, "loss": 2.3984, "step": 19079 }, { "epoch": 0.51, "learning_rate": 0.001007311227124574, "loss": 2.5048, "step": 19080 }, { "epoch": 0.51, "learning_rate": 0.0010072241902297247, "loss": 2.6153, "step": 19081 }, { "epoch": 0.51, "learning_rate": 0.0010071371532801466, "loss": 2.7715, "step": 19082 }, { "epoch": 0.51, "learning_rate": 0.0010070501162764984, "loss": 2.7947, "step": 19083 }, { "epoch": 0.51, "learning_rate": 0.00100696307921944, "loss": 2.81, "step": 19084 }, { "epoch": 0.51, "learning_rate": 0.0010068760421096303, "loss": 2.4223, "step": 19085 }, { "epoch": 0.51, "learning_rate": 0.001006789004947729, "loss": 2.1915, "step": 19086 }, { "epoch": 0.51, "learning_rate": 0.0010067019677343957, "loss": 2.5025, "step": 19087 }, { "epoch": 0.51, "learning_rate": 0.0010066149304702892, "loss": 2.1579, "step": 19088 }, { "epoch": 0.51, "learning_rate": 0.001006527893156069, "loss": 2.2698, "step": 19089 }, { "epoch": 0.51, "learning_rate": 0.0010064408557923948, "loss": 2.4537, "step": 19090 }, { "epoch": 0.51, "learning_rate": 0.001006353818379926, "loss": 2.3773, "step": 19091 }, { "epoch": 0.51, "learning_rate": 0.0010062667809193218, "loss": 2.3304, "step": 19092 }, { "epoch": 0.51, "learning_rate": 0.0010061797434112415, "loss": 2.7485, "step": 19093 }, { "epoch": 0.51, "learning_rate": 0.0010060927058563444, "loss": 2.638, "step": 19094 }, { "epoch": 0.51, "learning_rate": 0.0010060056682552904, "loss": 2.483, "step": 19095 }, { "epoch": 0.51, "learning_rate": 0.0010059186306087381, "loss": 2.4344, "step": 19096 }, { "epoch": 0.51, "learning_rate": 0.0010058315929173476, "loss": 2.4065, "step": 19097 }, { "epoch": 0.51, "learning_rate": 0.0010057445551817782, "loss": 2.58, "step": 19098 }, { "epoch": 0.51, "learning_rate": 0.0010056575174026887, "loss": 2.6089, "step": 19099 }, { "epoch": 0.51, "learning_rate": 0.0010055704795807387, "loss": 2.9245, "step": 19100 }, { "epoch": 0.51, "learning_rate": 0.0010054834417165882, "loss": 2.6501, "step": 19101 }, { "epoch": 0.51, "learning_rate": 0.001005396403810896, "loss": 2.6504, "step": 19102 }, { "epoch": 0.51, "learning_rate": 0.0010053093658643215, "loss": 2.5372, "step": 19103 }, { "epoch": 0.51, "learning_rate": 0.0010052223278775242, "loss": 2.2836, "step": 19104 }, { "epoch": 0.51, "learning_rate": 0.0010051352898511636, "loss": 2.458, "step": 19105 }, { "epoch": 0.51, "learning_rate": 0.0010050482517858991, "loss": 2.9317, "step": 19106 }, { "epoch": 0.51, "learning_rate": 0.0010049612136823897, "loss": 2.4108, "step": 19107 }, { "epoch": 0.51, "learning_rate": 0.0010048741755412948, "loss": 2.7127, "step": 19108 }, { "epoch": 0.51, "learning_rate": 0.0010047871373632747, "loss": 2.4156, "step": 19109 }, { "epoch": 0.51, "learning_rate": 0.0010047000991489875, "loss": 2.7348, "step": 19110 }, { "epoch": 0.51, "learning_rate": 0.0010046130608990936, "loss": 2.6066, "step": 19111 }, { "epoch": 0.51, "learning_rate": 0.0010045260226142516, "loss": 2.0715, "step": 19112 }, { "epoch": 0.51, "learning_rate": 0.0010044389842951212, "loss": 2.2252, "step": 19113 }, { "epoch": 0.51, "learning_rate": 0.0010043519459423623, "loss": 2.2895, "step": 19114 }, { "epoch": 0.51, "learning_rate": 0.0010042649075566337, "loss": 2.5503, "step": 19115 }, { "epoch": 0.51, "learning_rate": 0.0010041778691385948, "loss": 2.3202, "step": 19116 }, { "epoch": 0.51, "learning_rate": 0.001004090830688905, "loss": 2.6716, "step": 19117 }, { "epoch": 0.51, "learning_rate": 0.001004003792208224, "loss": 2.8233, "step": 19118 }, { "epoch": 0.51, "learning_rate": 0.001003916753697211, "loss": 2.0467, "step": 19119 }, { "epoch": 0.51, "learning_rate": 0.001003829715156525, "loss": 2.5804, "step": 19120 }, { "epoch": 0.51, "learning_rate": 0.0010037426765868262, "loss": 3.0729, "step": 19121 }, { "epoch": 0.51, "learning_rate": 0.0010036556379887736, "loss": 2.4267, "step": 19122 }, { "epoch": 0.51, "learning_rate": 0.001003568599363026, "loss": 2.6884, "step": 19123 }, { "epoch": 0.51, "learning_rate": 0.001003481560710244, "loss": 2.7991, "step": 19124 }, { "epoch": 0.51, "learning_rate": 0.0010033945220310858, "loss": 2.9453, "step": 19125 }, { "epoch": 0.51, "learning_rate": 0.0010033074833262115, "loss": 2.73, "step": 19126 }, { "epoch": 0.51, "learning_rate": 0.0010032204445962803, "loss": 2.6527, "step": 19127 }, { "epoch": 0.51, "learning_rate": 0.0010031334058419516, "loss": 2.6098, "step": 19128 }, { "epoch": 0.51, "learning_rate": 0.001003046367063885, "loss": 2.4857, "step": 19129 }, { "epoch": 0.51, "learning_rate": 0.0010029593282627394, "loss": 2.0594, "step": 19130 }, { "epoch": 0.51, "learning_rate": 0.0010028722894391742, "loss": 2.3891, "step": 19131 }, { "epoch": 0.51, "learning_rate": 0.0010027852505938495, "loss": 2.3166, "step": 19132 }, { "epoch": 0.51, "learning_rate": 0.0010026982117274242, "loss": 2.6795, "step": 19133 }, { "epoch": 0.51, "learning_rate": 0.0010026111728405577, "loss": 2.6578, "step": 19134 }, { "epoch": 0.51, "learning_rate": 0.001002524133933909, "loss": 2.6447, "step": 19135 }, { "epoch": 0.51, "learning_rate": 0.0010024370950081384, "loss": 2.6969, "step": 19136 }, { "epoch": 0.51, "learning_rate": 0.0010023500560639048, "loss": 2.8924, "step": 19137 }, { "epoch": 0.51, "learning_rate": 0.0010022630171018674, "loss": 2.5413, "step": 19138 }, { "epoch": 0.51, "learning_rate": 0.0010021759781226858, "loss": 2.7698, "step": 19139 }, { "epoch": 0.51, "learning_rate": 0.0010020889391270194, "loss": 2.5969, "step": 19140 }, { "epoch": 0.51, "learning_rate": 0.0010020019001155277, "loss": 2.4624, "step": 19141 }, { "epoch": 0.51, "learning_rate": 0.0010019148610888697, "loss": 2.5709, "step": 19142 }, { "epoch": 0.51, "learning_rate": 0.0010018278220477051, "loss": 2.1611, "step": 19143 }, { "epoch": 0.51, "learning_rate": 0.0010017407829926933, "loss": 2.8454, "step": 19144 }, { "epoch": 0.51, "learning_rate": 0.001001653743924494, "loss": 2.8455, "step": 19145 }, { "epoch": 0.51, "learning_rate": 0.0010015667048437658, "loss": 2.3232, "step": 19146 }, { "epoch": 0.51, "learning_rate": 0.0010014796657511684, "loss": 2.6171, "step": 19147 }, { "epoch": 0.51, "learning_rate": 0.0010013926266473619, "loss": 2.2845, "step": 19148 }, { "epoch": 0.51, "learning_rate": 0.0010013055875330047, "loss": 2.2278, "step": 19149 }, { "epoch": 0.51, "learning_rate": 0.0010012185484087567, "loss": 2.4104, "step": 19150 }, { "epoch": 0.51, "learning_rate": 0.001001131509275277, "loss": 2.5308, "step": 19151 }, { "epoch": 0.51, "learning_rate": 0.0010010444701332255, "loss": 2.6182, "step": 19152 }, { "epoch": 0.51, "learning_rate": 0.001000957430983261, "loss": 2.5906, "step": 19153 }, { "epoch": 0.51, "learning_rate": 0.0010008703918260435, "loss": 2.7136, "step": 19154 }, { "epoch": 0.51, "learning_rate": 0.0010007833526622318, "loss": 2.0645, "step": 19155 }, { "epoch": 0.51, "learning_rate": 0.0010006963134924856, "loss": 2.7039, "step": 19156 }, { "epoch": 0.51, "learning_rate": 0.0010006092743174643, "loss": 2.7804, "step": 19157 }, { "epoch": 0.51, "learning_rate": 0.0010005222351378274, "loss": 2.3496, "step": 19158 }, { "epoch": 0.51, "learning_rate": 0.001000435195954234, "loss": 2.3066, "step": 19159 }, { "epoch": 0.51, "learning_rate": 0.0010003481567673433, "loss": 2.4969, "step": 19160 }, { "epoch": 0.51, "learning_rate": 0.0010002611175778157, "loss": 2.5036, "step": 19161 }, { "epoch": 0.51, "learning_rate": 0.0010001740783863095, "loss": 2.691, "step": 19162 }, { "epoch": 0.51, "learning_rate": 0.0010000870391934842, "loss": 3.0909, "step": 19163 }, { "epoch": 0.52, "learning_rate": 0.001, "loss": 2.4499, "step": 19164 }, { "epoch": 0.52, "learning_rate": 0.0009999129608065157, "loss": 2.9863, "step": 19165 }, { "epoch": 0.52, "learning_rate": 0.000999825921613691, "loss": 2.4516, "step": 19166 }, { "epoch": 0.52, "learning_rate": 0.0009997388824221846, "loss": 2.4592, "step": 19167 }, { "epoch": 0.52, "learning_rate": 0.0009996518432326565, "loss": 2.5222, "step": 19168 }, { "epoch": 0.52, "learning_rate": 0.0009995648040457663, "loss": 2.7599, "step": 19169 }, { "epoch": 0.52, "learning_rate": 0.0009994777648621729, "loss": 2.4545, "step": 19170 }, { "epoch": 0.52, "learning_rate": 0.0009993907256825362, "loss": 2.6217, "step": 19171 }, { "epoch": 0.52, "learning_rate": 0.0009993036865075147, "loss": 3.0709, "step": 19172 }, { "epoch": 0.52, "learning_rate": 0.0009992166473377683, "loss": 2.7105, "step": 19173 }, { "epoch": 0.52, "learning_rate": 0.000999129608173957, "loss": 2.255, "step": 19174 }, { "epoch": 0.52, "learning_rate": 0.000999042569016739, "loss": 2.4588, "step": 19175 }, { "epoch": 0.52, "learning_rate": 0.0009989555298667745, "loss": 2.7485, "step": 19176 }, { "epoch": 0.52, "learning_rate": 0.0009988684907247232, "loss": 2.662, "step": 19177 }, { "epoch": 0.52, "learning_rate": 0.0009987814515912434, "loss": 2.4949, "step": 19178 }, { "epoch": 0.52, "learning_rate": 0.0009986944124669955, "loss": 2.5257, "step": 19179 }, { "epoch": 0.52, "learning_rate": 0.0009986073733526384, "loss": 2.6774, "step": 19180 }, { "epoch": 0.52, "learning_rate": 0.0009985203342488314, "loss": 2.5335, "step": 19181 }, { "epoch": 0.52, "learning_rate": 0.0009984332951562345, "loss": 2.4895, "step": 19182 }, { "epoch": 0.52, "learning_rate": 0.0009983462560755063, "loss": 2.1004, "step": 19183 }, { "epoch": 0.52, "learning_rate": 0.0009982592170073065, "loss": 2.3475, "step": 19184 }, { "epoch": 0.52, "learning_rate": 0.0009981721779522951, "loss": 2.1162, "step": 19185 }, { "epoch": 0.52, "learning_rate": 0.0009980851389111303, "loss": 2.2828, "step": 19186 }, { "epoch": 0.52, "learning_rate": 0.0009979980998844728, "loss": 2.6327, "step": 19187 }, { "epoch": 0.52, "learning_rate": 0.000997911060872981, "loss": 2.5685, "step": 19188 }, { "epoch": 0.52, "learning_rate": 0.0009978240218773144, "loss": 2.3394, "step": 19189 }, { "epoch": 0.52, "learning_rate": 0.000997736982898133, "loss": 3.209, "step": 19190 }, { "epoch": 0.52, "learning_rate": 0.0009976499439360955, "loss": 2.5474, "step": 19191 }, { "epoch": 0.52, "learning_rate": 0.0009975629049918616, "loss": 2.6696, "step": 19192 }, { "epoch": 0.52, "learning_rate": 0.000997475866066091, "loss": 3.009, "step": 19193 }, { "epoch": 0.52, "learning_rate": 0.0009973888271594426, "loss": 2.5041, "step": 19194 }, { "epoch": 0.52, "learning_rate": 0.000997301788272576, "loss": 2.8735, "step": 19195 }, { "epoch": 0.52, "learning_rate": 0.0009972147494061506, "loss": 2.3565, "step": 19196 }, { "epoch": 0.52, "learning_rate": 0.0009971277105608257, "loss": 2.488, "step": 19197 }, { "epoch": 0.52, "learning_rate": 0.0009970406717372611, "loss": 2.5256, "step": 19198 }, { "epoch": 0.52, "learning_rate": 0.0009969536329361153, "loss": 2.0696, "step": 19199 }, { "epoch": 0.52, "learning_rate": 0.0009968665941580482, "loss": 2.5559, "step": 19200 }, { "epoch": 0.52, "learning_rate": 0.00099677955540372, "loss": 2.6158, "step": 19201 }, { "epoch": 0.52, "learning_rate": 0.0009966925166737886, "loss": 2.5295, "step": 19202 }, { "epoch": 0.52, "learning_rate": 0.000996605477968914, "loss": 2.3616, "step": 19203 }, { "epoch": 0.52, "learning_rate": 0.0009965184392897563, "loss": 2.3531, "step": 19204 }, { "epoch": 0.52, "learning_rate": 0.000996431400636974, "loss": 2.3765, "step": 19205 }, { "epoch": 0.52, "learning_rate": 0.000996344362011227, "loss": 2.6232, "step": 19206 }, { "epoch": 0.52, "learning_rate": 0.000996257323413174, "loss": 2.3819, "step": 19207 }, { "epoch": 0.52, "learning_rate": 0.000996170284843475, "loss": 2.6597, "step": 19208 }, { "epoch": 0.52, "learning_rate": 0.0009960832463027894, "loss": 2.2071, "step": 19209 }, { "epoch": 0.52, "learning_rate": 0.000995996207791776, "loss": 2.2631, "step": 19210 }, { "epoch": 0.52, "learning_rate": 0.000995909169311095, "loss": 2.6932, "step": 19211 }, { "epoch": 0.52, "learning_rate": 0.0009958221308614054, "loss": 2.83, "step": 19212 }, { "epoch": 0.52, "learning_rate": 0.0009957350924433665, "loss": 2.785, "step": 19213 }, { "epoch": 0.52, "learning_rate": 0.0009956480540576382, "loss": 2.4361, "step": 19214 }, { "epoch": 0.52, "learning_rate": 0.0009955610157048789, "loss": 2.8575, "step": 19215 }, { "epoch": 0.52, "learning_rate": 0.0009954739773857485, "loss": 2.9766, "step": 19216 }, { "epoch": 0.52, "learning_rate": 0.0009953869391009069, "loss": 2.5606, "step": 19217 }, { "epoch": 0.52, "learning_rate": 0.0009952999008510128, "loss": 2.8108, "step": 19218 }, { "epoch": 0.52, "learning_rate": 0.0009952128626367256, "loss": 2.4195, "step": 19219 }, { "epoch": 0.52, "learning_rate": 0.0009951258244587052, "loss": 2.3119, "step": 19220 }, { "epoch": 0.52, "learning_rate": 0.0009950387863176104, "loss": 2.4767, "step": 19221 }, { "epoch": 0.52, "learning_rate": 0.0009949517482141013, "loss": 3.0336, "step": 19222 }, { "epoch": 0.52, "learning_rate": 0.0009948647101488365, "loss": 2.3154, "step": 19223 }, { "epoch": 0.52, "learning_rate": 0.0009947776721224758, "loss": 2.6095, "step": 19224 }, { "epoch": 0.52, "learning_rate": 0.0009946906341356785, "loss": 2.2591, "step": 19225 }, { "epoch": 0.52, "learning_rate": 0.000994603596189104, "loss": 2.7532, "step": 19226 }, { "epoch": 0.52, "learning_rate": 0.0009945165582834117, "loss": 2.9214, "step": 19227 }, { "epoch": 0.52, "learning_rate": 0.0009944295204192613, "loss": 2.8106, "step": 19228 }, { "epoch": 0.52, "learning_rate": 0.0009943424825973113, "loss": 2.5986, "step": 19229 }, { "epoch": 0.52, "learning_rate": 0.0009942554448182223, "loss": 2.9708, "step": 19230 }, { "epoch": 0.52, "learning_rate": 0.0009941684070826524, "loss": 2.2989, "step": 19231 }, { "epoch": 0.52, "learning_rate": 0.000994081369391262, "loss": 2.7632, "step": 19232 }, { "epoch": 0.52, "learning_rate": 0.00099399433174471, "loss": 2.3815, "step": 19233 }, { "epoch": 0.52, "learning_rate": 0.0009939072941436557, "loss": 3.0356, "step": 19234 }, { "epoch": 0.52, "learning_rate": 0.0009938202565887586, "loss": 2.6338, "step": 19235 }, { "epoch": 0.52, "learning_rate": 0.0009937332190806784, "loss": 2.5115, "step": 19236 }, { "epoch": 0.52, "learning_rate": 0.0009936461816200742, "loss": 2.4788, "step": 19237 }, { "epoch": 0.52, "learning_rate": 0.0009935591442076053, "loss": 2.8574, "step": 19238 }, { "epoch": 0.52, "learning_rate": 0.000993472106843931, "loss": 2.2851, "step": 19239 }, { "epoch": 0.52, "learning_rate": 0.000993385069529711, "loss": 2.3893, "step": 19240 }, { "epoch": 0.52, "learning_rate": 0.0009932980322656048, "loss": 2.5956, "step": 19241 }, { "epoch": 0.52, "learning_rate": 0.000993210995052271, "loss": 2.1352, "step": 19242 }, { "epoch": 0.52, "learning_rate": 0.0009931239578903697, "loss": 2.2013, "step": 19243 }, { "epoch": 0.52, "learning_rate": 0.0009930369207805604, "loss": 2.018, "step": 19244 }, { "epoch": 0.52, "learning_rate": 0.0009929498837235018, "loss": 2.7723, "step": 19245 }, { "epoch": 0.52, "learning_rate": 0.0009928628467198535, "loss": 2.9904, "step": 19246 }, { "epoch": 0.52, "learning_rate": 0.0009927758097702754, "loss": 2.5933, "step": 19247 }, { "epoch": 0.52, "learning_rate": 0.0009926887728754262, "loss": 2.7389, "step": 19248 }, { "epoch": 0.52, "learning_rate": 0.0009926017360359655, "loss": 2.2554, "step": 19249 }, { "epoch": 0.52, "learning_rate": 0.000992514699252553, "loss": 2.4164, "step": 19250 }, { "epoch": 0.52, "learning_rate": 0.0009924276625258473, "loss": 2.3436, "step": 19251 }, { "epoch": 0.52, "learning_rate": 0.000992340625856509, "loss": 3.0246, "step": 19252 }, { "epoch": 0.52, "learning_rate": 0.000992253589245196, "loss": 2.2139, "step": 19253 }, { "epoch": 0.52, "learning_rate": 0.0009921665526925686, "loss": 2.6892, "step": 19254 }, { "epoch": 0.52, "learning_rate": 0.0009920795161992863, "loss": 2.0227, "step": 19255 }, { "epoch": 0.52, "learning_rate": 0.000991992479766008, "loss": 2.7391, "step": 19256 }, { "epoch": 0.52, "learning_rate": 0.0009919054433933938, "loss": 2.753, "step": 19257 }, { "epoch": 0.52, "learning_rate": 0.0009918184070821015, "loss": 2.4163, "step": 19258 }, { "epoch": 0.52, "learning_rate": 0.000991731370832792, "loss": 2.2759, "step": 19259 }, { "epoch": 0.52, "learning_rate": 0.0009916443346461243, "loss": 1.8321, "step": 19260 }, { "epoch": 0.52, "learning_rate": 0.0009915572985227574, "loss": 2.5779, "step": 19261 }, { "epoch": 0.52, "learning_rate": 0.0009914702624633507, "loss": 2.4756, "step": 19262 }, { "epoch": 0.52, "learning_rate": 0.0009913832264685644, "loss": 2.23, "step": 19263 }, { "epoch": 0.52, "learning_rate": 0.0009912961905390568, "loss": 2.3182, "step": 19264 }, { "epoch": 0.52, "learning_rate": 0.0009912091546754878, "loss": 2.6635, "step": 19265 }, { "epoch": 0.52, "learning_rate": 0.0009911221188785165, "loss": 2.3876, "step": 19266 }, { "epoch": 0.52, "learning_rate": 0.0009910350831488024, "loss": 2.2926, "step": 19267 }, { "epoch": 0.52, "learning_rate": 0.0009909480474870054, "loss": 2.2364, "step": 19268 }, { "epoch": 0.52, "learning_rate": 0.000990861011893784, "loss": 2.8507, "step": 19269 }, { "epoch": 0.52, "learning_rate": 0.0009907739763697979, "loss": 2.8129, "step": 19270 }, { "epoch": 0.52, "learning_rate": 0.0009906869409157066, "loss": 2.464, "step": 19271 }, { "epoch": 0.52, "learning_rate": 0.0009905999055321692, "loss": 2.0105, "step": 19272 }, { "epoch": 0.52, "learning_rate": 0.0009905128702198459, "loss": 2.4847, "step": 19273 }, { "epoch": 0.52, "learning_rate": 0.0009904258349793947, "loss": 2.6763, "step": 19274 }, { "epoch": 0.52, "learning_rate": 0.0009903387998114756, "loss": 2.3037, "step": 19275 }, { "epoch": 0.52, "learning_rate": 0.0009902517647167486, "loss": 2.8516, "step": 19276 }, { "epoch": 0.52, "learning_rate": 0.000990164729695872, "loss": 3.0245, "step": 19277 }, { "epoch": 0.52, "learning_rate": 0.0009900776947495058, "loss": 2.6098, "step": 19278 }, { "epoch": 0.52, "learning_rate": 0.0009899906598783094, "loss": 2.5311, "step": 19279 }, { "epoch": 0.52, "learning_rate": 0.0009899036250829417, "loss": 2.6866, "step": 19280 }, { "epoch": 0.52, "learning_rate": 0.0009898165903640625, "loss": 2.705, "step": 19281 }, { "epoch": 0.52, "learning_rate": 0.000989729555722331, "loss": 2.8375, "step": 19282 }, { "epoch": 0.52, "learning_rate": 0.0009896425211584064, "loss": 2.2192, "step": 19283 }, { "epoch": 0.52, "learning_rate": 0.0009895554866729483, "loss": 2.3984, "step": 19284 }, { "epoch": 0.52, "learning_rate": 0.000989468452266616, "loss": 2.6371, "step": 19285 }, { "epoch": 0.52, "learning_rate": 0.0009893814179400687, "loss": 2.483, "step": 19286 }, { "epoch": 0.52, "learning_rate": 0.000989294383693966, "loss": 2.6863, "step": 19287 }, { "epoch": 0.52, "learning_rate": 0.000989207349528967, "loss": 2.7189, "step": 19288 }, { "epoch": 0.52, "learning_rate": 0.0009891203154457312, "loss": 2.7261, "step": 19289 }, { "epoch": 0.52, "learning_rate": 0.0009890332814449184, "loss": 2.3908, "step": 19290 }, { "epoch": 0.52, "learning_rate": 0.000988946247527187, "loss": 2.6691, "step": 19291 }, { "epoch": 0.52, "learning_rate": 0.0009888592136931972, "loss": 2.5231, "step": 19292 }, { "epoch": 0.52, "learning_rate": 0.0009887721799436075, "loss": 2.6008, "step": 19293 }, { "epoch": 0.52, "learning_rate": 0.000988685146279078, "loss": 2.0757, "step": 19294 }, { "epoch": 0.52, "learning_rate": 0.000988598112700268, "loss": 2.6681, "step": 19295 }, { "epoch": 0.52, "learning_rate": 0.0009885110792078365, "loss": 2.2422, "step": 19296 }, { "epoch": 0.52, "learning_rate": 0.000988424045802443, "loss": 2.356, "step": 19297 }, { "epoch": 0.52, "learning_rate": 0.000988337012484747, "loss": 2.2132, "step": 19298 }, { "epoch": 0.52, "learning_rate": 0.0009882499792554073, "loss": 2.3261, "step": 19299 }, { "epoch": 0.52, "learning_rate": 0.0009881629461150842, "loss": 2.4188, "step": 19300 }, { "epoch": 0.52, "learning_rate": 0.000988075913064436, "loss": 2.54, "step": 19301 }, { "epoch": 0.52, "learning_rate": 0.0009879888801041228, "loss": 2.5167, "step": 19302 }, { "epoch": 0.52, "learning_rate": 0.000987901847234804, "loss": 2.5511, "step": 19303 }, { "epoch": 0.52, "learning_rate": 0.0009878148144571383, "loss": 2.4885, "step": 19304 }, { "epoch": 0.52, "learning_rate": 0.0009877277817717852, "loss": 2.1258, "step": 19305 }, { "epoch": 0.52, "learning_rate": 0.0009876407491794046, "loss": 2.6003, "step": 19306 }, { "epoch": 0.52, "learning_rate": 0.0009875537166806553, "loss": 2.8408, "step": 19307 }, { "epoch": 0.52, "learning_rate": 0.0009874666842761971, "loss": 2.652, "step": 19308 }, { "epoch": 0.52, "learning_rate": 0.0009873796519666886, "loss": 2.5162, "step": 19309 }, { "epoch": 0.52, "learning_rate": 0.0009872926197527897, "loss": 2.5686, "step": 19310 }, { "epoch": 0.52, "learning_rate": 0.0009872055876351598, "loss": 2.2777, "step": 19311 }, { "epoch": 0.52, "learning_rate": 0.000987118555614458, "loss": 2.388, "step": 19312 }, { "epoch": 0.52, "learning_rate": 0.0009870315236913437, "loss": 2.3162, "step": 19313 }, { "epoch": 0.52, "learning_rate": 0.0009869444918664764, "loss": 2.3898, "step": 19314 }, { "epoch": 0.52, "learning_rate": 0.0009868574601405152, "loss": 2.5401, "step": 19315 }, { "epoch": 0.52, "learning_rate": 0.0009867704285141192, "loss": 2.7316, "step": 19316 }, { "epoch": 0.52, "learning_rate": 0.000986683396987949, "loss": 2.8439, "step": 19317 }, { "epoch": 0.52, "learning_rate": 0.000986596365562662, "loss": 2.2942, "step": 19318 }, { "epoch": 0.52, "learning_rate": 0.0009865093342389193, "loss": 2.6758, "step": 19319 }, { "epoch": 0.52, "learning_rate": 0.000986422303017379, "loss": 2.2493, "step": 19320 }, { "epoch": 0.52, "learning_rate": 0.000986335271898701, "loss": 2.8714, "step": 19321 }, { "epoch": 0.52, "learning_rate": 0.0009862482408835448, "loss": 2.1544, "step": 19322 }, { "epoch": 0.52, "learning_rate": 0.000986161209972569, "loss": 2.6122, "step": 19323 }, { "epoch": 0.52, "learning_rate": 0.0009860741791664334, "loss": 2.6934, "step": 19324 }, { "epoch": 0.52, "learning_rate": 0.0009859871484657978, "loss": 2.5964, "step": 19325 }, { "epoch": 0.52, "learning_rate": 0.0009859001178713206, "loss": 2.5731, "step": 19326 }, { "epoch": 0.52, "learning_rate": 0.000985813087383662, "loss": 2.5526, "step": 19327 }, { "epoch": 0.52, "learning_rate": 0.0009857260570034806, "loss": 2.4703, "step": 19328 }, { "epoch": 0.52, "learning_rate": 0.000985639026731436, "loss": 2.5764, "step": 19329 }, { "epoch": 0.52, "learning_rate": 0.000985551996568188, "loss": 2.3535, "step": 19330 }, { "epoch": 0.52, "learning_rate": 0.0009854649665143951, "loss": 3.0851, "step": 19331 }, { "epoch": 0.52, "learning_rate": 0.000985377936570717, "loss": 2.5504, "step": 19332 }, { "epoch": 0.52, "learning_rate": 0.0009852909067378135, "loss": 2.2923, "step": 19333 }, { "epoch": 0.52, "learning_rate": 0.000985203877016343, "loss": 2.3588, "step": 19334 }, { "epoch": 0.52, "learning_rate": 0.0009851168474069656, "loss": 2.6673, "step": 19335 }, { "epoch": 0.52, "learning_rate": 0.00098502981791034, "loss": 2.3117, "step": 19336 }, { "epoch": 0.52, "learning_rate": 0.000984942788527126, "loss": 2.7437, "step": 19337 }, { "epoch": 0.52, "learning_rate": 0.0009848557592579826, "loss": 2.9104, "step": 19338 }, { "epoch": 0.52, "learning_rate": 0.0009847687301035692, "loss": 2.1371, "step": 19339 }, { "epoch": 0.52, "learning_rate": 0.0009846817010645454, "loss": 2.5104, "step": 19340 }, { "epoch": 0.52, "learning_rate": 0.0009845946721415704, "loss": 2.6787, "step": 19341 }, { "epoch": 0.52, "learning_rate": 0.000984507643335303, "loss": 2.655, "step": 19342 }, { "epoch": 0.52, "learning_rate": 0.0009844206146464034, "loss": 2.1098, "step": 19343 }, { "epoch": 0.52, "learning_rate": 0.00098433358607553, "loss": 2.5815, "step": 19344 }, { "epoch": 0.52, "learning_rate": 0.0009842465576233425, "loss": 3.0117, "step": 19345 }, { "epoch": 0.52, "learning_rate": 0.0009841595292905008, "loss": 2.3952, "step": 19346 }, { "epoch": 0.52, "learning_rate": 0.0009840725010776634, "loss": 2.4739, "step": 19347 }, { "epoch": 0.52, "learning_rate": 0.0009839854729854895, "loss": 2.3536, "step": 19348 }, { "epoch": 0.52, "learning_rate": 0.0009838984450146395, "loss": 2.5353, "step": 19349 }, { "epoch": 0.52, "learning_rate": 0.0009838114171657716, "loss": 2.6933, "step": 19350 }, { "epoch": 0.52, "learning_rate": 0.0009837243894395456, "loss": 2.5608, "step": 19351 }, { "epoch": 0.52, "learning_rate": 0.0009836373618366207, "loss": 2.5593, "step": 19352 }, { "epoch": 0.52, "learning_rate": 0.000983550334357656, "loss": 2.3102, "step": 19353 }, { "epoch": 0.52, "learning_rate": 0.0009834633070033114, "loss": 2.1722, "step": 19354 }, { "epoch": 0.52, "learning_rate": 0.0009833762797742457, "loss": 2.2399, "step": 19355 }, { "epoch": 0.52, "learning_rate": 0.000983289252671118, "loss": 2.9131, "step": 19356 }, { "epoch": 0.52, "learning_rate": 0.0009832022256945883, "loss": 2.1502, "step": 19357 }, { "epoch": 0.52, "learning_rate": 0.0009831151988453153, "loss": 2.485, "step": 19358 }, { "epoch": 0.52, "learning_rate": 0.0009830281721239587, "loss": 2.898, "step": 19359 }, { "epoch": 0.52, "learning_rate": 0.000982941145531178, "loss": 2.2991, "step": 19360 }, { "epoch": 0.52, "learning_rate": 0.0009828541190676314, "loss": 2.7404, "step": 19361 }, { "epoch": 0.52, "learning_rate": 0.0009827670927339796, "loss": 2.8817, "step": 19362 }, { "epoch": 0.52, "learning_rate": 0.0009826800665308807, "loss": 2.2872, "step": 19363 }, { "epoch": 0.52, "learning_rate": 0.0009825930404589948, "loss": 2.7623, "step": 19364 }, { "epoch": 0.52, "learning_rate": 0.0009825060145189808, "loss": 2.5487, "step": 19365 }, { "epoch": 0.52, "learning_rate": 0.0009824189887114982, "loss": 2.1544, "step": 19366 }, { "epoch": 0.52, "learning_rate": 0.000982331963037206, "loss": 2.4292, "step": 19367 }, { "epoch": 0.52, "learning_rate": 0.000982244937496764, "loss": 2.8405, "step": 19368 }, { "epoch": 0.52, "learning_rate": 0.000982157912090831, "loss": 2.4287, "step": 19369 }, { "epoch": 0.52, "learning_rate": 0.0009820708868200664, "loss": 2.7131, "step": 19370 }, { "epoch": 0.52, "learning_rate": 0.0009819838616851296, "loss": 2.4165, "step": 19371 }, { "epoch": 0.52, "learning_rate": 0.00098189683668668, "loss": 2.6238, "step": 19372 }, { "epoch": 0.52, "learning_rate": 0.0009818098118253768, "loss": 2.5089, "step": 19373 }, { "epoch": 0.52, "learning_rate": 0.0009817227871018787, "loss": 2.1223, "step": 19374 }, { "epoch": 0.52, "learning_rate": 0.0009816357625168457, "loss": 2.3187, "step": 19375 }, { "epoch": 0.52, "learning_rate": 0.0009815487380709373, "loss": 2.5804, "step": 19376 }, { "epoch": 0.52, "learning_rate": 0.000981461713764812, "loss": 2.2968, "step": 19377 }, { "epoch": 0.52, "learning_rate": 0.0009813746895991297, "loss": 2.4967, "step": 19378 }, { "epoch": 0.52, "learning_rate": 0.000981287665574549, "loss": 2.3359, "step": 19379 }, { "epoch": 0.52, "learning_rate": 0.00098120064169173, "loss": 2.7103, "step": 19380 }, { "epoch": 0.52, "learning_rate": 0.0009811136179513314, "loss": 2.7184, "step": 19381 }, { "epoch": 0.52, "learning_rate": 0.0009810265943540125, "loss": 2.2496, "step": 19382 }, { "epoch": 0.52, "learning_rate": 0.000980939570900433, "loss": 2.9478, "step": 19383 }, { "epoch": 0.52, "learning_rate": 0.0009808525475912518, "loss": 2.2638, "step": 19384 }, { "epoch": 0.52, "learning_rate": 0.000980765524427128, "loss": 2.394, "step": 19385 }, { "epoch": 0.52, "learning_rate": 0.0009806785014087219, "loss": 2.5083, "step": 19386 }, { "epoch": 0.52, "learning_rate": 0.0009805914785366912, "loss": 2.6663, "step": 19387 }, { "epoch": 0.52, "learning_rate": 0.0009805044558116962, "loss": 2.7561, "step": 19388 }, { "epoch": 0.52, "learning_rate": 0.0009804174332343964, "loss": 2.6663, "step": 19389 }, { "epoch": 0.52, "learning_rate": 0.0009803304108054502, "loss": 2.8784, "step": 19390 }, { "epoch": 0.52, "learning_rate": 0.000980243388525517, "loss": 2.3291, "step": 19391 }, { "epoch": 0.52, "learning_rate": 0.0009801563663952573, "loss": 2.1974, "step": 19392 }, { "epoch": 0.52, "learning_rate": 0.0009800693444153286, "loss": 2.6217, "step": 19393 }, { "epoch": 0.52, "learning_rate": 0.000979982322586391, "loss": 2.4077, "step": 19394 }, { "epoch": 0.52, "learning_rate": 0.0009798953009091044, "loss": 2.5025, "step": 19395 }, { "epoch": 0.52, "learning_rate": 0.000979808279384127, "loss": 2.8355, "step": 19396 }, { "epoch": 0.52, "learning_rate": 0.0009797212580121184, "loss": 2.3426, "step": 19397 }, { "epoch": 0.52, "learning_rate": 0.0009796342367937379, "loss": 2.2872, "step": 19398 }, { "epoch": 0.52, "learning_rate": 0.000979547215729645, "loss": 2.5147, "step": 19399 }, { "epoch": 0.52, "learning_rate": 0.0009794601948204986, "loss": 2.6325, "step": 19400 }, { "epoch": 0.52, "learning_rate": 0.000979373174066958, "loss": 2.4992, "step": 19401 }, { "epoch": 0.52, "learning_rate": 0.0009792861534696825, "loss": 2.3729, "step": 19402 }, { "epoch": 0.52, "learning_rate": 0.000979199133029332, "loss": 2.574, "step": 19403 }, { "epoch": 0.52, "learning_rate": 0.0009791121127465643, "loss": 2.6846, "step": 19404 }, { "epoch": 0.52, "learning_rate": 0.0009790250926220404, "loss": 2.6686, "step": 19405 }, { "epoch": 0.52, "learning_rate": 0.000978938072656418, "loss": 2.6068, "step": 19406 }, { "epoch": 0.52, "learning_rate": 0.0009788510528503569, "loss": 2.1232, "step": 19407 }, { "epoch": 0.52, "learning_rate": 0.0009787640332045168, "loss": 2.0153, "step": 19408 }, { "epoch": 0.52, "learning_rate": 0.0009786770137195564, "loss": 2.35, "step": 19409 }, { "epoch": 0.52, "learning_rate": 0.000978589994396135, "loss": 2.4531, "step": 19410 }, { "epoch": 0.52, "learning_rate": 0.0009785029752349126, "loss": 2.0262, "step": 19411 }, { "epoch": 0.52, "learning_rate": 0.000978415956236547, "loss": 2.2654, "step": 19412 }, { "epoch": 0.52, "learning_rate": 0.000978328937401699, "loss": 2.4527, "step": 19413 }, { "epoch": 0.52, "learning_rate": 0.0009782419187310265, "loss": 2.3861, "step": 19414 }, { "epoch": 0.52, "learning_rate": 0.0009781549002251897, "loss": 2.5306, "step": 19415 }, { "epoch": 0.52, "learning_rate": 0.0009780678818848473, "loss": 2.5788, "step": 19416 }, { "epoch": 0.52, "learning_rate": 0.0009779808637106586, "loss": 2.5294, "step": 19417 }, { "epoch": 0.52, "learning_rate": 0.000977893845703283, "loss": 2.583, "step": 19418 }, { "epoch": 0.52, "learning_rate": 0.0009778068278633802, "loss": 2.4557, "step": 19419 }, { "epoch": 0.52, "learning_rate": 0.0009777198101916082, "loss": 2.4014, "step": 19420 }, { "epoch": 0.52, "learning_rate": 0.0009776327926886274, "loss": 2.7955, "step": 19421 }, { "epoch": 0.52, "learning_rate": 0.0009775457753550963, "loss": 3.1432, "step": 19422 }, { "epoch": 0.52, "learning_rate": 0.0009774587581916744, "loss": 2.307, "step": 19423 }, { "epoch": 0.52, "learning_rate": 0.000977371741199021, "loss": 2.4171, "step": 19424 }, { "epoch": 0.52, "learning_rate": 0.0009772847243777953, "loss": 2.5008, "step": 19425 }, { "epoch": 0.52, "learning_rate": 0.0009771977077286562, "loss": 2.3508, "step": 19426 }, { "epoch": 0.52, "learning_rate": 0.0009771106912522635, "loss": 2.8068, "step": 19427 }, { "epoch": 0.52, "learning_rate": 0.000977023674949276, "loss": 2.3399, "step": 19428 }, { "epoch": 0.52, "learning_rate": 0.000976936658820353, "loss": 2.3939, "step": 19429 }, { "epoch": 0.52, "learning_rate": 0.0009768496428661539, "loss": 2.3218, "step": 19430 }, { "epoch": 0.52, "learning_rate": 0.0009767626270873375, "loss": 2.3946, "step": 19431 }, { "epoch": 0.52, "learning_rate": 0.0009766756114845637, "loss": 2.5951, "step": 19432 }, { "epoch": 0.52, "learning_rate": 0.0009765885960584908, "loss": 2.4147, "step": 19433 }, { "epoch": 0.52, "learning_rate": 0.0009765015808097786, "loss": 3.1283, "step": 19434 }, { "epoch": 0.52, "learning_rate": 0.0009764145657390868, "loss": 2.8262, "step": 19435 }, { "epoch": 0.52, "learning_rate": 0.0009763275508470734, "loss": 2.5842, "step": 19436 }, { "epoch": 0.52, "learning_rate": 0.000976240536134398, "loss": 2.0571, "step": 19437 }, { "epoch": 0.52, "learning_rate": 0.0009761535216017209, "loss": 2.2605, "step": 19438 }, { "epoch": 0.52, "learning_rate": 0.0009760665072497, "loss": 3.2177, "step": 19439 }, { "epoch": 0.52, "learning_rate": 0.000975979493078995, "loss": 2.4375, "step": 19440 }, { "epoch": 0.52, "learning_rate": 0.000975892479090265, "loss": 2.0771, "step": 19441 }, { "epoch": 0.52, "learning_rate": 0.0009758054652841692, "loss": 2.1379, "step": 19442 }, { "epoch": 0.52, "learning_rate": 0.0009757184516613671, "loss": 2.8559, "step": 19443 }, { "epoch": 0.52, "learning_rate": 0.0009756314382225175, "loss": 2.4139, "step": 19444 }, { "epoch": 0.52, "learning_rate": 0.0009755444249682798, "loss": 2.1257, "step": 19445 }, { "epoch": 0.52, "learning_rate": 0.0009754574118993134, "loss": 2.7348, "step": 19446 }, { "epoch": 0.52, "learning_rate": 0.0009753703990162769, "loss": 2.4777, "step": 19447 }, { "epoch": 0.52, "learning_rate": 0.0009752833863198304, "loss": 2.3929, "step": 19448 }, { "epoch": 0.52, "learning_rate": 0.000975196373810632, "loss": 2.5886, "step": 19449 }, { "epoch": 0.52, "learning_rate": 0.0009751093614893412, "loss": 2.7807, "step": 19450 }, { "epoch": 0.52, "learning_rate": 0.0009750223493566183, "loss": 2.8699, "step": 19451 }, { "epoch": 0.52, "learning_rate": 0.000974935337413121, "loss": 2.8583, "step": 19452 }, { "epoch": 0.52, "learning_rate": 0.0009748483256595092, "loss": 2.6273, "step": 19453 }, { "epoch": 0.52, "learning_rate": 0.0009747613140964421, "loss": 2.7749, "step": 19454 }, { "epoch": 0.52, "learning_rate": 0.0009746743027245786, "loss": 2.5787, "step": 19455 }, { "epoch": 0.52, "learning_rate": 0.0009745872915445784, "loss": 3.0135, "step": 19456 }, { "epoch": 0.52, "learning_rate": 0.0009745002805570999, "loss": 2.5, "step": 19457 }, { "epoch": 0.52, "learning_rate": 0.0009744132697628028, "loss": 2.3307, "step": 19458 }, { "epoch": 0.52, "learning_rate": 0.0009743262591623465, "loss": 3.0699, "step": 19459 }, { "epoch": 0.52, "learning_rate": 0.0009742392487563896, "loss": 2.5962, "step": 19460 }, { "epoch": 0.52, "learning_rate": 0.0009741522385455914, "loss": 2.5014, "step": 19461 }, { "epoch": 0.52, "learning_rate": 0.0009740652285306118, "loss": 2.3545, "step": 19462 }, { "epoch": 0.52, "learning_rate": 0.0009739782187121088, "loss": 2.3401, "step": 19463 }, { "epoch": 0.52, "learning_rate": 0.0009738912090907423, "loss": 2.7394, "step": 19464 }, { "epoch": 0.52, "learning_rate": 0.0009738041996671717, "loss": 2.6289, "step": 19465 }, { "epoch": 0.52, "learning_rate": 0.0009737171904420554, "loss": 2.4483, "step": 19466 }, { "epoch": 0.52, "learning_rate": 0.0009736301814160533, "loss": 2.8119, "step": 19467 }, { "epoch": 0.52, "learning_rate": 0.0009735431725898239, "loss": 2.8012, "step": 19468 }, { "epoch": 0.52, "learning_rate": 0.0009734561639640267, "loss": 2.4821, "step": 19469 }, { "epoch": 0.52, "learning_rate": 0.0009733691555393212, "loss": 2.3036, "step": 19470 }, { "epoch": 0.52, "learning_rate": 0.0009732821473163659, "loss": 2.6436, "step": 19471 }, { "epoch": 0.52, "learning_rate": 0.0009731951392958203, "loss": 2.726, "step": 19472 }, { "epoch": 0.52, "learning_rate": 0.0009731081314783436, "loss": 2.588, "step": 19473 }, { "epoch": 0.52, "learning_rate": 0.0009730211238645948, "loss": 2.3064, "step": 19474 }, { "epoch": 0.52, "learning_rate": 0.0009729341164552336, "loss": 2.4779, "step": 19475 }, { "epoch": 0.52, "learning_rate": 0.000972847109250918, "loss": 2.4912, "step": 19476 }, { "epoch": 0.52, "learning_rate": 0.000972760102252308, "loss": 1.8553, "step": 19477 }, { "epoch": 0.52, "learning_rate": 0.0009726730954600632, "loss": 2.3664, "step": 19478 }, { "epoch": 0.52, "learning_rate": 0.0009725860888748417, "loss": 2.6423, "step": 19479 }, { "epoch": 0.52, "learning_rate": 0.0009724990824973027, "loss": 2.2704, "step": 19480 }, { "epoch": 0.52, "learning_rate": 0.0009724120763281065, "loss": 2.6008, "step": 19481 }, { "epoch": 0.52, "learning_rate": 0.000972325070367911, "loss": 2.7086, "step": 19482 }, { "epoch": 0.52, "learning_rate": 0.0009722380646173761, "loss": 2.2531, "step": 19483 }, { "epoch": 0.52, "learning_rate": 0.0009721510590771604, "loss": 2.6462, "step": 19484 }, { "epoch": 0.52, "learning_rate": 0.0009720640537479232, "loss": 2.5613, "step": 19485 }, { "epoch": 0.52, "learning_rate": 0.0009719770486303241, "loss": 2.5665, "step": 19486 }, { "epoch": 0.52, "learning_rate": 0.0009718900437250215, "loss": 2.2738, "step": 19487 }, { "epoch": 0.52, "learning_rate": 0.0009718030390326751, "loss": 2.2428, "step": 19488 }, { "epoch": 0.52, "learning_rate": 0.000971716034553944, "loss": 2.5898, "step": 19489 }, { "epoch": 0.52, "learning_rate": 0.0009716290302894867, "loss": 2.4379, "step": 19490 }, { "epoch": 0.52, "learning_rate": 0.0009715420262399636, "loss": 2.7041, "step": 19491 }, { "epoch": 0.52, "learning_rate": 0.0009714550224060323, "loss": 2.5344, "step": 19492 }, { "epoch": 0.52, "learning_rate": 0.0009713680187883526, "loss": 2.3948, "step": 19493 }, { "epoch": 0.52, "learning_rate": 0.0009712810153875843, "loss": 2.6401, "step": 19494 }, { "epoch": 0.52, "learning_rate": 0.0009711940122043854, "loss": 2.716, "step": 19495 }, { "epoch": 0.52, "learning_rate": 0.0009711070092394156, "loss": 2.7274, "step": 19496 }, { "epoch": 0.52, "learning_rate": 0.000971020006493334, "loss": 2.4934, "step": 19497 }, { "epoch": 0.52, "learning_rate": 0.0009709330039667996, "loss": 2.5446, "step": 19498 }, { "epoch": 0.52, "learning_rate": 0.0009708460016604714, "loss": 2.1344, "step": 19499 }, { "epoch": 0.52, "learning_rate": 0.000970758999575009, "loss": 2.2496, "step": 19500 }, { "epoch": 0.52, "learning_rate": 0.000970671997711071, "loss": 2.4017, "step": 19501 }, { "epoch": 0.52, "learning_rate": 0.0009705849960693168, "loss": 2.54, "step": 19502 }, { "epoch": 0.52, "learning_rate": 0.0009704979946504053, "loss": 2.2771, "step": 19503 }, { "epoch": 0.52, "learning_rate": 0.0009704109934549957, "loss": 2.9236, "step": 19504 }, { "epoch": 0.52, "learning_rate": 0.0009703239924837476, "loss": 2.3404, "step": 19505 }, { "epoch": 0.52, "learning_rate": 0.000970236991737319, "loss": 2.7472, "step": 19506 }, { "epoch": 0.52, "learning_rate": 0.0009701499912163697, "loss": 2.6844, "step": 19507 }, { "epoch": 0.52, "learning_rate": 0.0009700629909215593, "loss": 2.9331, "step": 19508 }, { "epoch": 0.52, "learning_rate": 0.0009699759908535457, "loss": 2.1464, "step": 19509 }, { "epoch": 0.52, "learning_rate": 0.000969888991012989, "loss": 2.6381, "step": 19510 }, { "epoch": 0.52, "learning_rate": 0.0009698019914005477, "loss": 2.1647, "step": 19511 }, { "epoch": 0.52, "learning_rate": 0.0009697149920168811, "loss": 2.6111, "step": 19512 }, { "epoch": 0.52, "learning_rate": 0.0009696279928626485, "loss": 2.537, "step": 19513 }, { "epoch": 0.52, "learning_rate": 0.0009695409939385086, "loss": 2.6239, "step": 19514 }, { "epoch": 0.52, "learning_rate": 0.0009694539952451207, "loss": 2.6822, "step": 19515 }, { "epoch": 0.52, "learning_rate": 0.000969366996783144, "loss": 2.4906, "step": 19516 }, { "epoch": 0.52, "learning_rate": 0.0009692799985532374, "loss": 2.172, "step": 19517 }, { "epoch": 0.52, "learning_rate": 0.0009691930005560603, "loss": 2.3804, "step": 19518 }, { "epoch": 0.52, "learning_rate": 0.0009691060027922709, "loss": 2.3981, "step": 19519 }, { "epoch": 0.52, "learning_rate": 0.0009690190052625291, "loss": 2.4843, "step": 19520 }, { "epoch": 0.52, "learning_rate": 0.0009689320079674943, "loss": 2.3851, "step": 19521 }, { "epoch": 0.52, "learning_rate": 0.0009688450109078246, "loss": 2.8988, "step": 19522 }, { "epoch": 0.52, "learning_rate": 0.0009687580140841793, "loss": 2.4619, "step": 19523 }, { "epoch": 0.52, "learning_rate": 0.0009686710174972185, "loss": 2.4634, "step": 19524 }, { "epoch": 0.52, "learning_rate": 0.0009685840211475998, "loss": 2.3999, "step": 19525 }, { "epoch": 0.52, "learning_rate": 0.0009684970250359833, "loss": 2.276, "step": 19526 }, { "epoch": 0.52, "learning_rate": 0.0009684100291630273, "loss": 2.489, "step": 19527 }, { "epoch": 0.52, "learning_rate": 0.0009683230335293914, "loss": 3.0436, "step": 19528 }, { "epoch": 0.52, "learning_rate": 0.0009682360381357348, "loss": 2.1687, "step": 19529 }, { "epoch": 0.52, "learning_rate": 0.000968149042982716, "loss": 2.5138, "step": 19530 }, { "epoch": 0.52, "learning_rate": 0.0009680620480709945, "loss": 2.3528, "step": 19531 }, { "epoch": 0.52, "learning_rate": 0.0009679750534012292, "loss": 2.5389, "step": 19532 }, { "epoch": 0.52, "learning_rate": 0.0009678880589740792, "loss": 2.4736, "step": 19533 }, { "epoch": 0.52, "learning_rate": 0.0009678010647902038, "loss": 2.4294, "step": 19534 }, { "epoch": 0.52, "learning_rate": 0.0009677140708502613, "loss": 2.7183, "step": 19535 }, { "epoch": 0.53, "learning_rate": 0.0009676270771549111, "loss": 2.2167, "step": 19536 }, { "epoch": 0.53, "learning_rate": 0.0009675400837048131, "loss": 2.1803, "step": 19537 }, { "epoch": 0.53, "learning_rate": 0.0009674530905006251, "loss": 2.4496, "step": 19538 }, { "epoch": 0.53, "learning_rate": 0.0009673660975430067, "loss": 2.0867, "step": 19539 }, { "epoch": 0.53, "learning_rate": 0.000967279104832617, "loss": 2.4282, "step": 19540 }, { "epoch": 0.53, "learning_rate": 0.0009671921123701148, "loss": 2.7012, "step": 19541 }, { "epoch": 0.53, "learning_rate": 0.0009671051201561593, "loss": 2.268, "step": 19542 }, { "epoch": 0.53, "learning_rate": 0.0009670181281914098, "loss": 2.7162, "step": 19543 }, { "epoch": 0.53, "learning_rate": 0.0009669311364765248, "loss": 2.6421, "step": 19544 }, { "epoch": 0.53, "learning_rate": 0.0009668441450121639, "loss": 2.114, "step": 19545 }, { "epoch": 0.53, "learning_rate": 0.0009667571537989855, "loss": 2.2516, "step": 19546 }, { "epoch": 0.53, "learning_rate": 0.000966670162837649, "loss": 2.7865, "step": 19547 }, { "epoch": 0.53, "learning_rate": 0.0009665831721288138, "loss": 2.1303, "step": 19548 }, { "epoch": 0.53, "learning_rate": 0.0009664961816731379, "loss": 2.4143, "step": 19549 }, { "epoch": 0.53, "learning_rate": 0.0009664091914712811, "loss": 2.3173, "step": 19550 }, { "epoch": 0.53, "learning_rate": 0.0009663222015239029, "loss": 2.618, "step": 19551 }, { "epoch": 0.53, "learning_rate": 0.000966235211831661, "loss": 2.4168, "step": 19552 }, { "epoch": 0.53, "learning_rate": 0.0009661482223952154, "loss": 2.5507, "step": 19553 }, { "epoch": 0.53, "learning_rate": 0.0009660612332152245, "loss": 2.4406, "step": 19554 }, { "epoch": 0.53, "learning_rate": 0.0009659742442923478, "loss": 2.5766, "step": 19555 }, { "epoch": 0.53, "learning_rate": 0.0009658872556272442, "loss": 2.2083, "step": 19556 }, { "epoch": 0.53, "learning_rate": 0.0009658002672205725, "loss": 2.6564, "step": 19557 }, { "epoch": 0.53, "learning_rate": 0.000965713279072992, "loss": 2.722, "step": 19558 }, { "epoch": 0.53, "learning_rate": 0.0009656262911851616, "loss": 2.5527, "step": 19559 }, { "epoch": 0.53, "learning_rate": 0.0009655393035577401, "loss": 2.6552, "step": 19560 }, { "epoch": 0.53, "learning_rate": 0.0009654523161913872, "loss": 2.5437, "step": 19561 }, { "epoch": 0.53, "learning_rate": 0.0009653653290867607, "loss": 2.7185, "step": 19562 }, { "epoch": 0.53, "learning_rate": 0.0009652783422445203, "loss": 2.4159, "step": 19563 }, { "epoch": 0.53, "learning_rate": 0.0009651913556653257, "loss": 2.2829, "step": 19564 }, { "epoch": 0.53, "learning_rate": 0.0009651043693498345, "loss": 2.4335, "step": 19565 }, { "epoch": 0.53, "learning_rate": 0.0009650173832987062, "loss": 2.6139, "step": 19566 }, { "epoch": 0.53, "learning_rate": 0.0009649303975126007, "loss": 2.6284, "step": 19567 }, { "epoch": 0.53, "learning_rate": 0.0009648434119921758, "loss": 2.4631, "step": 19568 }, { "epoch": 0.53, "learning_rate": 0.0009647564267380909, "loss": 2.7924, "step": 19569 }, { "epoch": 0.53, "learning_rate": 0.0009646694417510051, "loss": 2.8474, "step": 19570 }, { "epoch": 0.53, "learning_rate": 0.0009645824570315771, "loss": 2.563, "step": 19571 }, { "epoch": 0.53, "learning_rate": 0.0009644954725804663, "loss": 2.8946, "step": 19572 }, { "epoch": 0.53, "learning_rate": 0.0009644084883983313, "loss": 2.3705, "step": 19573 }, { "epoch": 0.53, "learning_rate": 0.0009643215044858312, "loss": 2.3315, "step": 19574 }, { "epoch": 0.53, "learning_rate": 0.0009642345208436253, "loss": 2.6216, "step": 19575 }, { "epoch": 0.53, "learning_rate": 0.0009641475374723719, "loss": 2.8287, "step": 19576 }, { "epoch": 0.53, "learning_rate": 0.0009640605543727305, "loss": 2.4993, "step": 19577 }, { "epoch": 0.53, "learning_rate": 0.0009639735715453602, "loss": 2.5058, "step": 19578 }, { "epoch": 0.53, "learning_rate": 0.0009638865889909191, "loss": 2.6522, "step": 19579 }, { "epoch": 0.53, "learning_rate": 0.0009637996067100675, "loss": 2.4984, "step": 19580 }, { "epoch": 0.53, "learning_rate": 0.0009637126247034631, "loss": 2.2795, "step": 19581 }, { "epoch": 0.53, "learning_rate": 0.0009636256429717653, "loss": 2.7626, "step": 19582 }, { "epoch": 0.53, "learning_rate": 0.0009635386615156335, "loss": 1.9997, "step": 19583 }, { "epoch": 0.53, "learning_rate": 0.000963451680335726, "loss": 2.5063, "step": 19584 }, { "epoch": 0.53, "learning_rate": 0.0009633646994327018, "loss": 2.9775, "step": 19585 }, { "epoch": 0.53, "learning_rate": 0.0009632777188072206, "loss": 2.327, "step": 19586 }, { "epoch": 0.53, "learning_rate": 0.0009631907384599405, "loss": 1.7507, "step": 19587 }, { "epoch": 0.53, "learning_rate": 0.0009631037583915211, "loss": 2.9231, "step": 19588 }, { "epoch": 0.53, "learning_rate": 0.0009630167786026207, "loss": 2.2472, "step": 19589 }, { "epoch": 0.53, "learning_rate": 0.0009629297990938986, "loss": 2.574, "step": 19590 }, { "epoch": 0.53, "learning_rate": 0.0009628428198660139, "loss": 2.5119, "step": 19591 }, { "epoch": 0.53, "learning_rate": 0.0009627558409196252, "loss": 2.4837, "step": 19592 }, { "epoch": 0.53, "learning_rate": 0.0009626688622553916, "loss": 2.2208, "step": 19593 }, { "epoch": 0.53, "learning_rate": 0.0009625818838739725, "loss": 2.2601, "step": 19594 }, { "epoch": 0.53, "learning_rate": 0.0009624949057760256, "loss": 2.5325, "step": 19595 }, { "epoch": 0.53, "learning_rate": 0.0009624079279622112, "loss": 2.097, "step": 19596 }, { "epoch": 0.53, "learning_rate": 0.0009623209504331874, "loss": 2.1275, "step": 19597 }, { "epoch": 0.53, "learning_rate": 0.0009622339731896132, "loss": 2.3473, "step": 19598 }, { "epoch": 0.53, "learning_rate": 0.0009621469962321479, "loss": 2.9773, "step": 19599 }, { "epoch": 0.53, "learning_rate": 0.0009620600195614498, "loss": 2.3077, "step": 19600 }, { "epoch": 0.53, "learning_rate": 0.0009619730431781785, "loss": 2.208, "step": 19601 }, { "epoch": 0.53, "learning_rate": 0.0009618860670829926, "loss": 2.2797, "step": 19602 }, { "epoch": 0.53, "learning_rate": 0.0009617990912765509, "loss": 2.2345, "step": 19603 }, { "epoch": 0.53, "learning_rate": 0.0009617121157595127, "loss": 2.6998, "step": 19604 }, { "epoch": 0.53, "learning_rate": 0.0009616251405325365, "loss": 2.4436, "step": 19605 }, { "epoch": 0.53, "learning_rate": 0.0009615381655962813, "loss": 2.8304, "step": 19606 }, { "epoch": 0.53, "learning_rate": 0.0009614511909514067, "loss": 2.767, "step": 19607 }, { "epoch": 0.53, "learning_rate": 0.0009613642165985701, "loss": 2.2967, "step": 19608 }, { "epoch": 0.53, "learning_rate": 0.0009612772425384315, "loss": 2.7567, "step": 19609 }, { "epoch": 0.53, "learning_rate": 0.0009611902687716501, "loss": 2.606, "step": 19610 }, { "epoch": 0.53, "learning_rate": 0.0009611032952988839, "loss": 2.2337, "step": 19611 }, { "epoch": 0.53, "learning_rate": 0.0009610163221207919, "loss": 2.2662, "step": 19612 }, { "epoch": 0.53, "learning_rate": 0.000960929349238034, "loss": 2.7921, "step": 19613 }, { "epoch": 0.53, "learning_rate": 0.0009608423766512678, "loss": 2.6702, "step": 19614 }, { "epoch": 0.53, "learning_rate": 0.0009607554043611532, "loss": 2.3241, "step": 19615 }, { "epoch": 0.53, "learning_rate": 0.0009606684323683482, "loss": 2.514, "step": 19616 }, { "epoch": 0.53, "learning_rate": 0.0009605814606735122, "loss": 2.3634, "step": 19617 }, { "epoch": 0.53, "learning_rate": 0.0009604944892773042, "loss": 2.6499, "step": 19618 }, { "epoch": 0.53, "learning_rate": 0.0009604075181803826, "loss": 2.4282, "step": 19619 }, { "epoch": 0.53, "learning_rate": 0.0009603205473834067, "loss": 2.5164, "step": 19620 }, { "epoch": 0.53, "learning_rate": 0.0009602335768870354, "loss": 2.694, "step": 19621 }, { "epoch": 0.53, "learning_rate": 0.0009601466066919272, "loss": 2.6117, "step": 19622 }, { "epoch": 0.53, "learning_rate": 0.0009600596367987416, "loss": 2.5803, "step": 19623 }, { "epoch": 0.53, "learning_rate": 0.0009599726672081367, "loss": 2.9502, "step": 19624 }, { "epoch": 0.53, "learning_rate": 0.0009598856979207714, "loss": 2.7777, "step": 19625 }, { "epoch": 0.53, "learning_rate": 0.0009597987289373056, "loss": 2.3024, "step": 19626 }, { "epoch": 0.53, "learning_rate": 0.0009597117602583971, "loss": 2.3446, "step": 19627 }, { "epoch": 0.53, "learning_rate": 0.0009596247918847049, "loss": 2.1258, "step": 19628 }, { "epoch": 0.53, "learning_rate": 0.0009595378238168883, "loss": 2.6585, "step": 19629 }, { "epoch": 0.53, "learning_rate": 0.0009594508560556058, "loss": 2.4575, "step": 19630 }, { "epoch": 0.53, "learning_rate": 0.0009593638886015164, "loss": 2.9805, "step": 19631 }, { "epoch": 0.53, "learning_rate": 0.0009592769214552788, "loss": 2.5722, "step": 19632 }, { "epoch": 0.53, "learning_rate": 0.000959189954617552, "loss": 2.7735, "step": 19633 }, { "epoch": 0.53, "learning_rate": 0.0009591029880889952, "loss": 2.5173, "step": 19634 }, { "epoch": 0.53, "learning_rate": 0.0009590160218702664, "loss": 2.7757, "step": 19635 }, { "epoch": 0.53, "learning_rate": 0.0009589290559620249, "loss": 2.7815, "step": 19636 }, { "epoch": 0.53, "learning_rate": 0.00095884209036493, "loss": 2.8308, "step": 19637 }, { "epoch": 0.53, "learning_rate": 0.0009587551250796395, "loss": 2.5987, "step": 19638 }, { "epoch": 0.53, "learning_rate": 0.0009586681601068132, "loss": 2.6114, "step": 19639 }, { "epoch": 0.53, "learning_rate": 0.0009585811954471094, "loss": 2.4302, "step": 19640 }, { "epoch": 0.53, "learning_rate": 0.0009584942311011869, "loss": 2.6361, "step": 19641 }, { "epoch": 0.53, "learning_rate": 0.000958407267069705, "loss": 2.381, "step": 19642 }, { "epoch": 0.53, "learning_rate": 0.0009583203033533218, "loss": 2.5169, "step": 19643 }, { "epoch": 0.53, "learning_rate": 0.0009582333399526967, "loss": 2.3911, "step": 19644 }, { "epoch": 0.53, "learning_rate": 0.0009581463768684885, "loss": 2.5585, "step": 19645 }, { "epoch": 0.53, "learning_rate": 0.0009580594141013557, "loss": 2.6454, "step": 19646 }, { "epoch": 0.53, "learning_rate": 0.0009579724516519573, "loss": 2.3639, "step": 19647 }, { "epoch": 0.53, "learning_rate": 0.0009578854895209521, "loss": 2.6066, "step": 19648 }, { "epoch": 0.53, "learning_rate": 0.0009577985277089989, "loss": 2.0534, "step": 19649 }, { "epoch": 0.53, "learning_rate": 0.0009577115662167568, "loss": 2.1869, "step": 19650 }, { "epoch": 0.53, "learning_rate": 0.0009576246050448838, "loss": 2.7972, "step": 19651 }, { "epoch": 0.53, "learning_rate": 0.0009575376441940393, "loss": 2.4722, "step": 19652 }, { "epoch": 0.53, "learning_rate": 0.0009574506836648825, "loss": 2.5644, "step": 19653 }, { "epoch": 0.53, "learning_rate": 0.0009573637234580714, "loss": 2.4962, "step": 19654 }, { "epoch": 0.53, "learning_rate": 0.0009572767635742648, "loss": 2.628, "step": 19655 }, { "epoch": 0.53, "learning_rate": 0.0009571898040141223, "loss": 2.3925, "step": 19656 }, { "epoch": 0.53, "learning_rate": 0.000957102844778302, "loss": 2.656, "step": 19657 }, { "epoch": 0.53, "learning_rate": 0.000957015885867463, "loss": 2.3898, "step": 19658 }, { "epoch": 0.53, "learning_rate": 0.0009569289272822638, "loss": 2.5038, "step": 19659 }, { "epoch": 0.53, "learning_rate": 0.0009568419690233633, "loss": 3.0762, "step": 19660 }, { "epoch": 0.53, "learning_rate": 0.0009567550110914205, "loss": 2.7763, "step": 19661 }, { "epoch": 0.53, "learning_rate": 0.0009566680534870938, "loss": 1.8572, "step": 19662 }, { "epoch": 0.53, "learning_rate": 0.0009565810962110421, "loss": 2.7717, "step": 19663 }, { "epoch": 0.53, "learning_rate": 0.0009564941392639247, "loss": 3.0359, "step": 19664 }, { "epoch": 0.53, "learning_rate": 0.0009564071826463996, "loss": 2.3688, "step": 19665 }, { "epoch": 0.53, "learning_rate": 0.0009563202263591263, "loss": 2.3877, "step": 19666 }, { "epoch": 0.53, "learning_rate": 0.0009562332704027627, "loss": 2.5502, "step": 19667 }, { "epoch": 0.53, "learning_rate": 0.0009561463147779677, "loss": 2.6671, "step": 19668 }, { "epoch": 0.53, "learning_rate": 0.0009560593594854013, "loss": 3.1944, "step": 19669 }, { "epoch": 0.53, "learning_rate": 0.0009559724045257208, "loss": 2.6818, "step": 19670 }, { "epoch": 0.53, "learning_rate": 0.0009558854498995853, "loss": 2.5057, "step": 19671 }, { "epoch": 0.53, "learning_rate": 0.0009557984956076542, "loss": 2.5368, "step": 19672 }, { "epoch": 0.53, "learning_rate": 0.0009557115416505855, "loss": 2.615, "step": 19673 }, { "epoch": 0.53, "learning_rate": 0.0009556245880290384, "loss": 2.6269, "step": 19674 }, { "epoch": 0.53, "learning_rate": 0.0009555376347436714, "loss": 2.3982, "step": 19675 }, { "epoch": 0.53, "learning_rate": 0.0009554506817951432, "loss": 2.6342, "step": 19676 }, { "epoch": 0.53, "learning_rate": 0.0009553637291841129, "loss": 2.6428, "step": 19677 }, { "epoch": 0.53, "learning_rate": 0.0009552767769112389, "loss": 2.5765, "step": 19678 }, { "epoch": 0.53, "learning_rate": 0.0009551898249771799, "loss": 2.415, "step": 19679 }, { "epoch": 0.53, "learning_rate": 0.0009551028733825954, "loss": 2.4134, "step": 19680 }, { "epoch": 0.53, "learning_rate": 0.0009550159221281426, "loss": 2.5464, "step": 19681 }, { "epoch": 0.53, "learning_rate": 0.000954928971214482, "loss": 2.6489, "step": 19682 }, { "epoch": 0.53, "learning_rate": 0.0009548420206422709, "loss": 2.6075, "step": 19683 }, { "epoch": 0.53, "learning_rate": 0.0009547550704121686, "loss": 2.0808, "step": 19684 }, { "epoch": 0.53, "learning_rate": 0.0009546681205248341, "loss": 2.6016, "step": 19685 }, { "epoch": 0.53, "learning_rate": 0.0009545811709809254, "loss": 2.0667, "step": 19686 }, { "epoch": 0.53, "learning_rate": 0.0009544942217811018, "loss": 2.151, "step": 19687 }, { "epoch": 0.53, "learning_rate": 0.0009544072729260221, "loss": 2.5802, "step": 19688 }, { "epoch": 0.53, "learning_rate": 0.0009543203244163444, "loss": 2.3924, "step": 19689 }, { "epoch": 0.53, "learning_rate": 0.0009542333762527277, "loss": 2.4036, "step": 19690 }, { "epoch": 0.53, "learning_rate": 0.0009541464284358312, "loss": 2.3739, "step": 19691 }, { "epoch": 0.53, "learning_rate": 0.0009540594809663128, "loss": 2.0944, "step": 19692 }, { "epoch": 0.53, "learning_rate": 0.000953972533844832, "loss": 2.4322, "step": 19693 }, { "epoch": 0.53, "learning_rate": 0.0009538855870720464, "loss": 2.5729, "step": 19694 }, { "epoch": 0.53, "learning_rate": 0.0009537986406486157, "loss": 3.0408, "step": 19695 }, { "epoch": 0.53, "learning_rate": 0.0009537116945751985, "loss": 2.3832, "step": 19696 }, { "epoch": 0.53, "learning_rate": 0.0009536247488524527, "loss": 2.3867, "step": 19697 }, { "epoch": 0.53, "learning_rate": 0.0009535378034810376, "loss": 2.9232, "step": 19698 }, { "epoch": 0.53, "learning_rate": 0.0009534508584616122, "loss": 2.8488, "step": 19699 }, { "epoch": 0.53, "learning_rate": 0.0009533639137948344, "loss": 2.6003, "step": 19700 }, { "epoch": 0.53, "learning_rate": 0.0009532769694813635, "loss": 2.3065, "step": 19701 }, { "epoch": 0.53, "learning_rate": 0.0009531900255218578, "loss": 2.1873, "step": 19702 }, { "epoch": 0.53, "learning_rate": 0.0009531030819169759, "loss": 2.1215, "step": 19703 }, { "epoch": 0.53, "learning_rate": 0.0009530161386673771, "loss": 2.5955, "step": 19704 }, { "epoch": 0.53, "learning_rate": 0.0009529291957737193, "loss": 2.4682, "step": 19705 }, { "epoch": 0.53, "learning_rate": 0.0009528422532366614, "loss": 2.4319, "step": 19706 }, { "epoch": 0.53, "learning_rate": 0.0009527553110568626, "loss": 2.5041, "step": 19707 }, { "epoch": 0.53, "learning_rate": 0.0009526683692349806, "loss": 2.2605, "step": 19708 }, { "epoch": 0.53, "learning_rate": 0.0009525814277716754, "loss": 2.4063, "step": 19709 }, { "epoch": 0.53, "learning_rate": 0.0009524944866676041, "loss": 2.6412, "step": 19710 }, { "epoch": 0.53, "learning_rate": 0.0009524075459234258, "loss": 2.3481, "step": 19711 }, { "epoch": 0.53, "learning_rate": 0.0009523206055398003, "loss": 2.5323, "step": 19712 }, { "epoch": 0.53, "learning_rate": 0.0009522336655173849, "loss": 2.5735, "step": 19713 }, { "epoch": 0.53, "learning_rate": 0.0009521467258568386, "loss": 2.6572, "step": 19714 }, { "epoch": 0.53, "learning_rate": 0.0009520597865588205, "loss": 2.717, "step": 19715 }, { "epoch": 0.53, "learning_rate": 0.0009519728476239885, "loss": 2.7183, "step": 19716 }, { "epoch": 0.53, "learning_rate": 0.0009518859090530019, "loss": 2.686, "step": 19717 }, { "epoch": 0.53, "learning_rate": 0.0009517989708465189, "loss": 2.6193, "step": 19718 }, { "epoch": 0.53, "learning_rate": 0.0009517120330051981, "loss": 2.6426, "step": 19719 }, { "epoch": 0.53, "learning_rate": 0.0009516250955296987, "loss": 2.4486, "step": 19720 }, { "epoch": 0.53, "learning_rate": 0.0009515381584206787, "loss": 2.5652, "step": 19721 }, { "epoch": 0.53, "learning_rate": 0.0009514512216787969, "loss": 2.602, "step": 19722 }, { "epoch": 0.53, "learning_rate": 0.0009513642853047124, "loss": 2.4459, "step": 19723 }, { "epoch": 0.53, "learning_rate": 0.0009512773492990829, "loss": 2.6462, "step": 19724 }, { "epoch": 0.53, "learning_rate": 0.0009511904136625674, "loss": 2.6304, "step": 19725 }, { "epoch": 0.53, "learning_rate": 0.0009511034783958253, "loss": 2.2919, "step": 19726 }, { "epoch": 0.53, "learning_rate": 0.0009510165434995139, "loss": 2.4271, "step": 19727 }, { "epoch": 0.53, "learning_rate": 0.0009509296089742927, "loss": 2.4164, "step": 19728 }, { "epoch": 0.53, "learning_rate": 0.0009508426748208198, "loss": 2.7515, "step": 19729 }, { "epoch": 0.53, "learning_rate": 0.0009507557410397539, "loss": 2.0094, "step": 19730 }, { "epoch": 0.53, "learning_rate": 0.000950668807631754, "loss": 2.5387, "step": 19731 }, { "epoch": 0.53, "learning_rate": 0.0009505818745974782, "loss": 2.8275, "step": 19732 }, { "epoch": 0.53, "learning_rate": 0.0009504949419375852, "loss": 2.6167, "step": 19733 }, { "epoch": 0.53, "learning_rate": 0.000950408009652734, "loss": 2.4699, "step": 19734 }, { "epoch": 0.53, "learning_rate": 0.0009503210777435826, "loss": 2.5239, "step": 19735 }, { "epoch": 0.53, "learning_rate": 0.0009502341462107903, "loss": 2.0696, "step": 19736 }, { "epoch": 0.53, "learning_rate": 0.0009501472150550144, "loss": 2.5554, "step": 19737 }, { "epoch": 0.53, "learning_rate": 0.0009500602842769147, "loss": 2.205, "step": 19738 }, { "epoch": 0.53, "learning_rate": 0.0009499733538771497, "loss": 2.5084, "step": 19739 }, { "epoch": 0.53, "learning_rate": 0.0009498864238563771, "loss": 2.6236, "step": 19740 }, { "epoch": 0.53, "learning_rate": 0.0009497994942152559, "loss": 2.7236, "step": 19741 }, { "epoch": 0.53, "learning_rate": 0.0009497125649544454, "loss": 2.6787, "step": 19742 }, { "epoch": 0.53, "learning_rate": 0.0009496256360746031, "loss": 2.4974, "step": 19743 }, { "epoch": 0.53, "learning_rate": 0.0009495387075763882, "loss": 2.4797, "step": 19744 }, { "epoch": 0.53, "learning_rate": 0.0009494517794604587, "loss": 2.878, "step": 19745 }, { "epoch": 0.53, "learning_rate": 0.0009493648517274736, "loss": 2.3327, "step": 19746 }, { "epoch": 0.53, "learning_rate": 0.0009492779243780914, "loss": 2.6172, "step": 19747 }, { "epoch": 0.53, "learning_rate": 0.0009491909974129705, "loss": 2.8693, "step": 19748 }, { "epoch": 0.53, "learning_rate": 0.0009491040708327695, "loss": 2.6474, "step": 19749 }, { "epoch": 0.53, "learning_rate": 0.0009490171446381472, "loss": 2.3111, "step": 19750 }, { "epoch": 0.53, "learning_rate": 0.0009489302188297616, "loss": 2.9058, "step": 19751 }, { "epoch": 0.53, "learning_rate": 0.0009488432934082721, "loss": 2.1761, "step": 19752 }, { "epoch": 0.53, "learning_rate": 0.0009487563683743358, "loss": 2.5083, "step": 19753 }, { "epoch": 0.53, "learning_rate": 0.0009486694437286124, "loss": 2.555, "step": 19754 }, { "epoch": 0.53, "learning_rate": 0.0009485825194717606, "loss": 2.932, "step": 19755 }, { "epoch": 0.53, "learning_rate": 0.000948495595604438, "loss": 2.3727, "step": 19756 }, { "epoch": 0.53, "learning_rate": 0.0009484086721273033, "loss": 3.0053, "step": 19757 }, { "epoch": 0.53, "learning_rate": 0.000948321749041016, "loss": 2.6386, "step": 19758 }, { "epoch": 0.53, "learning_rate": 0.0009482348263462334, "loss": 2.5333, "step": 19759 }, { "epoch": 0.53, "learning_rate": 0.0009481479040436145, "loss": 2.1585, "step": 19760 }, { "epoch": 0.53, "learning_rate": 0.000948060982133818, "loss": 2.7245, "step": 19761 }, { "epoch": 0.53, "learning_rate": 0.000947974060617502, "loss": 2.4573, "step": 19762 }, { "epoch": 0.53, "learning_rate": 0.0009478871394953255, "loss": 2.386, "step": 19763 }, { "epoch": 0.53, "learning_rate": 0.0009478002187679464, "loss": 2.2509, "step": 19764 }, { "epoch": 0.53, "learning_rate": 0.0009477132984360236, "loss": 2.4205, "step": 19765 }, { "epoch": 0.53, "learning_rate": 0.0009476263785002157, "loss": 2.9494, "step": 19766 }, { "epoch": 0.53, "learning_rate": 0.0009475394589611808, "loss": 2.2706, "step": 19767 }, { "epoch": 0.53, "learning_rate": 0.0009474525398195776, "loss": 2.4486, "step": 19768 }, { "epoch": 0.53, "learning_rate": 0.0009473656210760649, "loss": 2.3296, "step": 19769 }, { "epoch": 0.53, "learning_rate": 0.0009472787027313002, "loss": 2.4702, "step": 19770 }, { "epoch": 0.53, "learning_rate": 0.0009471917847859434, "loss": 2.3967, "step": 19771 }, { "epoch": 0.53, "learning_rate": 0.0009471048672406516, "loss": 2.652, "step": 19772 }, { "epoch": 0.53, "learning_rate": 0.0009470179500960839, "loss": 2.875, "step": 19773 }, { "epoch": 0.53, "learning_rate": 0.0009469310333528991, "loss": 2.5796, "step": 19774 }, { "epoch": 0.53, "learning_rate": 0.0009468441170117548, "loss": 3.07, "step": 19775 }, { "epoch": 0.53, "learning_rate": 0.0009467572010733103, "loss": 2.4305, "step": 19776 }, { "epoch": 0.53, "learning_rate": 0.0009466702855382237, "loss": 2.6942, "step": 19777 }, { "epoch": 0.53, "learning_rate": 0.0009465833704071534, "loss": 2.8424, "step": 19778 }, { "epoch": 0.53, "learning_rate": 0.0009464964556807581, "loss": 2.5076, "step": 19779 }, { "epoch": 0.53, "learning_rate": 0.000946409541359696, "loss": 2.7821, "step": 19780 }, { "epoch": 0.53, "learning_rate": 0.0009463226274446254, "loss": 2.5685, "step": 19781 }, { "epoch": 0.53, "learning_rate": 0.0009462357139362055, "loss": 2.8853, "step": 19782 }, { "epoch": 0.53, "learning_rate": 0.0009461488008350936, "loss": 2.5489, "step": 19783 }, { "epoch": 0.53, "learning_rate": 0.0009460618881419491, "loss": 2.6807, "step": 19784 }, { "epoch": 0.53, "learning_rate": 0.0009459749758574303, "loss": 2.7646, "step": 19785 }, { "epoch": 0.53, "learning_rate": 0.0009458880639821951, "loss": 2.0415, "step": 19786 }, { "epoch": 0.53, "learning_rate": 0.0009458011525169024, "loss": 2.4941, "step": 19787 }, { "epoch": 0.53, "learning_rate": 0.0009457142414622103, "loss": 2.1431, "step": 19788 }, { "epoch": 0.53, "learning_rate": 0.0009456273308187775, "loss": 2.6892, "step": 19789 }, { "epoch": 0.53, "learning_rate": 0.0009455404205872624, "loss": 2.5313, "step": 19790 }, { "epoch": 0.53, "learning_rate": 0.0009454535107683232, "loss": 2.7174, "step": 19791 }, { "epoch": 0.53, "learning_rate": 0.0009453666013626184, "loss": 2.5686, "step": 19792 }, { "epoch": 0.53, "learning_rate": 0.0009452796923708067, "loss": 2.8342, "step": 19793 }, { "epoch": 0.53, "learning_rate": 0.0009451927837935461, "loss": 2.4661, "step": 19794 }, { "epoch": 0.53, "learning_rate": 0.0009451058756314955, "loss": 2.4726, "step": 19795 }, { "epoch": 0.53, "learning_rate": 0.0009450189678853124, "loss": 2.8957, "step": 19796 }, { "epoch": 0.53, "learning_rate": 0.000944932060555656, "loss": 2.3712, "step": 19797 }, { "epoch": 0.53, "learning_rate": 0.0009448451536431848, "loss": 2.7442, "step": 19798 }, { "epoch": 0.53, "learning_rate": 0.0009447582471485565, "loss": 2.2877, "step": 19799 }, { "epoch": 0.53, "learning_rate": 0.0009446713410724295, "loss": 2.6107, "step": 19800 }, { "epoch": 0.53, "learning_rate": 0.0009445844354154635, "loss": 2.3133, "step": 19801 }, { "epoch": 0.53, "learning_rate": 0.0009444975301783152, "loss": 2.6269, "step": 19802 }, { "epoch": 0.53, "learning_rate": 0.0009444106253616438, "loss": 2.9653, "step": 19803 }, { "epoch": 0.53, "learning_rate": 0.0009443237209661076, "loss": 2.897, "step": 19804 }, { "epoch": 0.53, "learning_rate": 0.0009442368169923649, "loss": 2.4309, "step": 19805 }, { "epoch": 0.53, "learning_rate": 0.0009441499134410742, "loss": 2.4726, "step": 19806 }, { "epoch": 0.53, "learning_rate": 0.0009440630103128937, "loss": 2.3195, "step": 19807 }, { "epoch": 0.53, "learning_rate": 0.0009439761076084818, "loss": 2.6758, "step": 19808 }, { "epoch": 0.53, "learning_rate": 0.0009438892053284971, "loss": 2.4271, "step": 19809 }, { "epoch": 0.53, "learning_rate": 0.0009438023034735975, "loss": 2.6918, "step": 19810 }, { "epoch": 0.53, "learning_rate": 0.0009437154020444416, "loss": 2.3959, "step": 19811 }, { "epoch": 0.53, "learning_rate": 0.0009436285010416881, "loss": 2.8642, "step": 19812 }, { "epoch": 0.53, "learning_rate": 0.0009435416004659944, "loss": 2.3997, "step": 19813 }, { "epoch": 0.53, "learning_rate": 0.0009434547003180203, "loss": 2.0048, "step": 19814 }, { "epoch": 0.53, "learning_rate": 0.0009433678005984226, "loss": 2.5782, "step": 19815 }, { "epoch": 0.53, "learning_rate": 0.0009432809013078605, "loss": 2.6418, "step": 19816 }, { "epoch": 0.53, "learning_rate": 0.0009431940024469921, "loss": 2.6632, "step": 19817 }, { "epoch": 0.53, "learning_rate": 0.0009431071040164758, "loss": 2.5255, "step": 19818 }, { "epoch": 0.53, "learning_rate": 0.0009430202060169698, "loss": 2.2265, "step": 19819 }, { "epoch": 0.53, "learning_rate": 0.0009429333084491328, "loss": 2.3171, "step": 19820 }, { "epoch": 0.53, "learning_rate": 0.0009428464113136227, "loss": 2.4935, "step": 19821 }, { "epoch": 0.53, "learning_rate": 0.0009427595146110981, "loss": 2.3735, "step": 19822 }, { "epoch": 0.53, "learning_rate": 0.0009426726183422169, "loss": 2.29, "step": 19823 }, { "epoch": 0.53, "learning_rate": 0.0009425857225076378, "loss": 2.5377, "step": 19824 }, { "epoch": 0.53, "learning_rate": 0.0009424988271080195, "loss": 2.565, "step": 19825 }, { "epoch": 0.53, "learning_rate": 0.000942411932144019, "loss": 2.2343, "step": 19826 }, { "epoch": 0.53, "learning_rate": 0.0009423250376162956, "loss": 2.6509, "step": 19827 }, { "epoch": 0.53, "learning_rate": 0.000942238143525508, "loss": 2.7902, "step": 19828 }, { "epoch": 0.53, "learning_rate": 0.0009421512498723134, "loss": 2.2568, "step": 19829 }, { "epoch": 0.53, "learning_rate": 0.0009420643566573708, "loss": 2.512, "step": 19830 }, { "epoch": 0.53, "learning_rate": 0.000941977463881338, "loss": 2.4545, "step": 19831 }, { "epoch": 0.53, "learning_rate": 0.0009418905715448735, "loss": 2.6805, "step": 19832 }, { "epoch": 0.53, "learning_rate": 0.0009418036796486362, "loss": 1.6721, "step": 19833 }, { "epoch": 0.53, "learning_rate": 0.0009417167881932832, "loss": 2.3139, "step": 19834 }, { "epoch": 0.53, "learning_rate": 0.0009416298971794737, "loss": 2.7872, "step": 19835 }, { "epoch": 0.53, "learning_rate": 0.0009415430066078656, "loss": 2.2376, "step": 19836 }, { "epoch": 0.53, "learning_rate": 0.0009414561164791172, "loss": 2.3157, "step": 19837 }, { "epoch": 0.53, "learning_rate": 0.0009413692267938867, "loss": 2.6184, "step": 19838 }, { "epoch": 0.53, "learning_rate": 0.0009412823375528328, "loss": 2.8502, "step": 19839 }, { "epoch": 0.53, "learning_rate": 0.0009411954487566131, "loss": 2.4357, "step": 19840 }, { "epoch": 0.53, "learning_rate": 0.0009411085604058867, "loss": 1.8148, "step": 19841 }, { "epoch": 0.53, "learning_rate": 0.0009410216725013107, "loss": 2.5433, "step": 19842 }, { "epoch": 0.53, "learning_rate": 0.0009409347850435439, "loss": 2.22, "step": 19843 }, { "epoch": 0.53, "learning_rate": 0.0009408478980332452, "loss": 2.7672, "step": 19844 }, { "epoch": 0.53, "learning_rate": 0.0009407610114710718, "loss": 2.673, "step": 19845 }, { "epoch": 0.53, "learning_rate": 0.0009406741253576824, "loss": 2.4375, "step": 19846 }, { "epoch": 0.53, "learning_rate": 0.0009405872396937355, "loss": 2.5407, "step": 19847 }, { "epoch": 0.53, "learning_rate": 0.0009405003544798888, "loss": 2.4004, "step": 19848 }, { "epoch": 0.53, "learning_rate": 0.000940413469716801, "loss": 2.7637, "step": 19849 }, { "epoch": 0.53, "learning_rate": 0.0009403265854051299, "loss": 2.5111, "step": 19850 }, { "epoch": 0.53, "learning_rate": 0.0009402397015455337, "loss": 2.7076, "step": 19851 }, { "epoch": 0.53, "learning_rate": 0.0009401528181386713, "loss": 2.3841, "step": 19852 }, { "epoch": 0.53, "learning_rate": 0.0009400659351852001, "loss": 2.2034, "step": 19853 }, { "epoch": 0.53, "learning_rate": 0.0009399790526857788, "loss": 2.57, "step": 19854 }, { "epoch": 0.53, "learning_rate": 0.0009398921706410658, "loss": 2.1041, "step": 19855 }, { "epoch": 0.53, "learning_rate": 0.0009398052890517184, "loss": 2.4136, "step": 19856 }, { "epoch": 0.53, "learning_rate": 0.0009397184079183959, "loss": 2.4179, "step": 19857 }, { "epoch": 0.53, "learning_rate": 0.0009396315272417556, "loss": 2.1589, "step": 19858 }, { "epoch": 0.53, "learning_rate": 0.0009395446470224562, "loss": 2.0415, "step": 19859 }, { "epoch": 0.53, "learning_rate": 0.0009394577672611557, "loss": 2.6608, "step": 19860 }, { "epoch": 0.53, "learning_rate": 0.0009393708879585122, "loss": 2.4827, "step": 19861 }, { "epoch": 0.53, "learning_rate": 0.0009392840091151841, "loss": 2.1599, "step": 19862 }, { "epoch": 0.53, "learning_rate": 0.0009391971307318297, "loss": 2.2505, "step": 19863 }, { "epoch": 0.53, "learning_rate": 0.0009391102528091067, "loss": 2.3742, "step": 19864 }, { "epoch": 0.53, "learning_rate": 0.0009390233753476737, "loss": 2.3511, "step": 19865 }, { "epoch": 0.53, "learning_rate": 0.0009389364983481885, "loss": 2.4424, "step": 19866 }, { "epoch": 0.53, "learning_rate": 0.0009388496218113095, "loss": 2.2624, "step": 19867 }, { "epoch": 0.53, "learning_rate": 0.0009387627457376952, "loss": 2.491, "step": 19868 }, { "epoch": 0.53, "learning_rate": 0.0009386758701280029, "loss": 2.0771, "step": 19869 }, { "epoch": 0.53, "learning_rate": 0.0009385889949828914, "loss": 2.8198, "step": 19870 }, { "epoch": 0.53, "learning_rate": 0.0009385021203030192, "loss": 2.6094, "step": 19871 }, { "epoch": 0.53, "learning_rate": 0.0009384152460890434, "loss": 2.2904, "step": 19872 }, { "epoch": 0.53, "learning_rate": 0.0009383283723416225, "loss": 2.3843, "step": 19873 }, { "epoch": 0.53, "learning_rate": 0.0009382414990614154, "loss": 2.5074, "step": 19874 }, { "epoch": 0.53, "learning_rate": 0.0009381546262490794, "loss": 2.4834, "step": 19875 }, { "epoch": 0.53, "learning_rate": 0.0009380677539052728, "loss": 2.6306, "step": 19876 }, { "epoch": 0.53, "learning_rate": 0.0009379808820306539, "loss": 2.6434, "step": 19877 }, { "epoch": 0.53, "learning_rate": 0.0009378940106258807, "loss": 2.687, "step": 19878 }, { "epoch": 0.53, "learning_rate": 0.0009378071396916116, "loss": 2.1016, "step": 19879 }, { "epoch": 0.53, "learning_rate": 0.0009377202692285041, "loss": 2.3385, "step": 19880 }, { "epoch": 0.53, "learning_rate": 0.000937633399237217, "loss": 2.4609, "step": 19881 }, { "epoch": 0.53, "learning_rate": 0.0009375465297184081, "loss": 1.8088, "step": 19882 }, { "epoch": 0.53, "learning_rate": 0.0009374596606727353, "loss": 2.7421, "step": 19883 }, { "epoch": 0.53, "learning_rate": 0.0009373727921008575, "loss": 2.6817, "step": 19884 }, { "epoch": 0.53, "learning_rate": 0.0009372859240034318, "loss": 2.6751, "step": 19885 }, { "epoch": 0.53, "learning_rate": 0.0009371990563811164, "loss": 2.6388, "step": 19886 }, { "epoch": 0.53, "learning_rate": 0.0009371121892345703, "loss": 2.4153, "step": 19887 }, { "epoch": 0.53, "learning_rate": 0.0009370253225644507, "loss": 2.4524, "step": 19888 }, { "epoch": 0.53, "learning_rate": 0.000936938456371416, "loss": 2.5164, "step": 19889 }, { "epoch": 0.53, "learning_rate": 0.0009368515906561244, "loss": 2.6158, "step": 19890 }, { "epoch": 0.53, "learning_rate": 0.0009367647254192339, "loss": 2.6664, "step": 19891 }, { "epoch": 0.53, "learning_rate": 0.0009366778606614025, "loss": 2.7429, "step": 19892 }, { "epoch": 0.53, "learning_rate": 0.0009365909963832881, "loss": 2.4926, "step": 19893 }, { "epoch": 0.53, "learning_rate": 0.0009365041325855491, "loss": 2.1722, "step": 19894 }, { "epoch": 0.53, "learning_rate": 0.0009364172692688436, "loss": 2.4492, "step": 19895 }, { "epoch": 0.53, "learning_rate": 0.0009363304064338293, "loss": 2.9273, "step": 19896 }, { "epoch": 0.53, "learning_rate": 0.0009362435440811644, "loss": 2.3804, "step": 19897 }, { "epoch": 0.53, "learning_rate": 0.0009361566822115075, "loss": 2.4187, "step": 19898 }, { "epoch": 0.53, "learning_rate": 0.0009360698208255155, "loss": 2.12, "step": 19899 }, { "epoch": 0.53, "learning_rate": 0.0009359829599238479, "loss": 2.3631, "step": 19900 }, { "epoch": 0.53, "learning_rate": 0.0009358960995071613, "loss": 2.484, "step": 19901 }, { "epoch": 0.53, "learning_rate": 0.0009358092395761144, "loss": 2.5909, "step": 19902 }, { "epoch": 0.53, "learning_rate": 0.0009357223801313656, "loss": 2.0862, "step": 19903 }, { "epoch": 0.53, "learning_rate": 0.0009356355211735722, "loss": 2.2068, "step": 19904 }, { "epoch": 0.53, "learning_rate": 0.0009355486627033926, "loss": 2.3912, "step": 19905 }, { "epoch": 0.53, "learning_rate": 0.0009354618047214851, "loss": 2.6472, "step": 19906 }, { "epoch": 0.53, "learning_rate": 0.0009353749472285071, "loss": 2.4045, "step": 19907 }, { "epoch": 0.54, "learning_rate": 0.0009352880902251172, "loss": 2.7681, "step": 19908 }, { "epoch": 0.54, "learning_rate": 0.000935201233711973, "loss": 2.0274, "step": 19909 }, { "epoch": 0.54, "learning_rate": 0.0009351143776897326, "loss": 2.1226, "step": 19910 }, { "epoch": 0.54, "learning_rate": 0.0009350275221590547, "loss": 2.3377, "step": 19911 }, { "epoch": 0.54, "learning_rate": 0.0009349406671205957, "loss": 2.8732, "step": 19912 }, { "epoch": 0.54, "learning_rate": 0.000934853812575015, "loss": 1.9878, "step": 19913 }, { "epoch": 0.54, "learning_rate": 0.0009347669585229707, "loss": 2.253, "step": 19914 }, { "epoch": 0.54, "learning_rate": 0.0009346801049651197, "loss": 2.1482, "step": 19915 }, { "epoch": 0.54, "learning_rate": 0.0009345932519021203, "loss": 2.5493, "step": 19916 }, { "epoch": 0.54, "learning_rate": 0.0009345063993346313, "loss": 2.8311, "step": 19917 }, { "epoch": 0.54, "learning_rate": 0.0009344195472633098, "loss": 2.4959, "step": 19918 }, { "epoch": 0.54, "learning_rate": 0.0009343326956888142, "loss": 2.2537, "step": 19919 }, { "epoch": 0.54, "learning_rate": 0.0009342458446118023, "loss": 2.7856, "step": 19920 }, { "epoch": 0.54, "learning_rate": 0.0009341589940329321, "loss": 2.5472, "step": 19921 }, { "epoch": 0.54, "learning_rate": 0.0009340721439528618, "loss": 2.4044, "step": 19922 }, { "epoch": 0.54, "learning_rate": 0.0009339852943722488, "loss": 2.1915, "step": 19923 }, { "epoch": 0.54, "learning_rate": 0.0009338984452917515, "loss": 2.9667, "step": 19924 }, { "epoch": 0.54, "learning_rate": 0.000933811596712028, "loss": 2.881, "step": 19925 }, { "epoch": 0.54, "learning_rate": 0.0009337247486337358, "loss": 2.7065, "step": 19926 }, { "epoch": 0.54, "learning_rate": 0.0009336379010575335, "loss": 2.5247, "step": 19927 }, { "epoch": 0.54, "learning_rate": 0.0009335510539840778, "loss": 2.634, "step": 19928 }, { "epoch": 0.54, "learning_rate": 0.0009334642074140279, "loss": 2.5825, "step": 19929 }, { "epoch": 0.54, "learning_rate": 0.0009333773613480414, "loss": 2.4055, "step": 19930 }, { "epoch": 0.54, "learning_rate": 0.0009332905157867758, "loss": 2.4484, "step": 19931 }, { "epoch": 0.54, "learning_rate": 0.0009332036707308892, "loss": 2.4633, "step": 19932 }, { "epoch": 0.54, "learning_rate": 0.0009331168261810402, "loss": 2.3967, "step": 19933 }, { "epoch": 0.54, "learning_rate": 0.0009330299821378858, "loss": 2.854, "step": 19934 }, { "epoch": 0.54, "learning_rate": 0.0009329431386020844, "loss": 2.3971, "step": 19935 }, { "epoch": 0.54, "learning_rate": 0.0009328562955742936, "loss": 2.8611, "step": 19936 }, { "epoch": 0.54, "learning_rate": 0.0009327694530551716, "loss": 2.5507, "step": 19937 }, { "epoch": 0.54, "learning_rate": 0.0009326826110453763, "loss": 3.0104, "step": 19938 }, { "epoch": 0.54, "learning_rate": 0.0009325957695455653, "loss": 2.2635, "step": 19939 }, { "epoch": 0.54, "learning_rate": 0.0009325089285563968, "loss": 2.9902, "step": 19940 }, { "epoch": 0.54, "learning_rate": 0.0009324220880785288, "loss": 2.6358, "step": 19941 }, { "epoch": 0.54, "learning_rate": 0.0009323352481126187, "loss": 2.5891, "step": 19942 }, { "epoch": 0.54, "learning_rate": 0.0009322484086593251, "loss": 2.8059, "step": 19943 }, { "epoch": 0.54, "learning_rate": 0.0009321615697193051, "loss": 2.835, "step": 19944 }, { "epoch": 0.54, "learning_rate": 0.0009320747312932166, "loss": 2.8401, "step": 19945 }, { "epoch": 0.54, "learning_rate": 0.0009319878933817185, "loss": 2.4437, "step": 19946 }, { "epoch": 0.54, "learning_rate": 0.0009319010559854675, "loss": 2.6162, "step": 19947 }, { "epoch": 0.54, "learning_rate": 0.0009318142191051218, "loss": 2.5475, "step": 19948 }, { "epoch": 0.54, "learning_rate": 0.0009317273827413398, "loss": 2.413, "step": 19949 }, { "epoch": 0.54, "learning_rate": 0.0009316405468947787, "loss": 2.6307, "step": 19950 }, { "epoch": 0.54, "learning_rate": 0.0009315537115660965, "loss": 2.557, "step": 19951 }, { "epoch": 0.54, "learning_rate": 0.0009314668767559514, "loss": 2.4055, "step": 19952 }, { "epoch": 0.54, "learning_rate": 0.0009313800424650007, "loss": 2.2193, "step": 19953 }, { "epoch": 0.54, "learning_rate": 0.0009312932086939029, "loss": 2.8156, "step": 19954 }, { "epoch": 0.54, "learning_rate": 0.0009312063754433151, "loss": 2.6432, "step": 19955 }, { "epoch": 0.54, "learning_rate": 0.0009311195427138956, "loss": 2.8219, "step": 19956 }, { "epoch": 0.54, "learning_rate": 0.0009310327105063026, "loss": 2.2847, "step": 19957 }, { "epoch": 0.54, "learning_rate": 0.0009309458788211928, "loss": 2.5447, "step": 19958 }, { "epoch": 0.54, "learning_rate": 0.0009308590476592247, "loss": 2.4711, "step": 19959 }, { "epoch": 0.54, "learning_rate": 0.0009307722170210568, "loss": 2.8006, "step": 19960 }, { "epoch": 0.54, "learning_rate": 0.0009306853869073455, "loss": 2.6373, "step": 19961 }, { "epoch": 0.54, "learning_rate": 0.0009305985573187497, "loss": 2.3906, "step": 19962 }, { "epoch": 0.54, "learning_rate": 0.0009305117282559266, "loss": 2.5793, "step": 19963 }, { "epoch": 0.54, "learning_rate": 0.0009304248997195341, "loss": 2.7247, "step": 19964 }, { "epoch": 0.54, "learning_rate": 0.0009303380717102306, "loss": 2.7655, "step": 19965 }, { "epoch": 0.54, "learning_rate": 0.0009302512442286729, "loss": 2.775, "step": 19966 }, { "epoch": 0.54, "learning_rate": 0.0009301644172755195, "loss": 2.3137, "step": 19967 }, { "epoch": 0.54, "learning_rate": 0.0009300775908514281, "loss": 2.6221, "step": 19968 }, { "epoch": 0.54, "learning_rate": 0.0009299907649570563, "loss": 2.7884, "step": 19969 }, { "epoch": 0.54, "learning_rate": 0.0009299039395930621, "loss": 2.7159, "step": 19970 }, { "epoch": 0.54, "learning_rate": 0.0009298171147601028, "loss": 2.2976, "step": 19971 }, { "epoch": 0.54, "learning_rate": 0.0009297302904588365, "loss": 2.6555, "step": 19972 }, { "epoch": 0.54, "learning_rate": 0.0009296434666899214, "loss": 2.3669, "step": 19973 }, { "epoch": 0.54, "learning_rate": 0.0009295566434540145, "loss": 2.4825, "step": 19974 }, { "epoch": 0.54, "learning_rate": 0.0009294698207517736, "loss": 2.5438, "step": 19975 }, { "epoch": 0.54, "learning_rate": 0.0009293829985838573, "loss": 2.3155, "step": 19976 }, { "epoch": 0.54, "learning_rate": 0.0009292961769509225, "loss": 2.8115, "step": 19977 }, { "epoch": 0.54, "learning_rate": 0.0009292093558536273, "loss": 2.388, "step": 19978 }, { "epoch": 0.54, "learning_rate": 0.0009291225352926291, "loss": 3.2381, "step": 19979 }, { "epoch": 0.54, "learning_rate": 0.0009290357152685862, "loss": 2.2918, "step": 19980 }, { "epoch": 0.54, "learning_rate": 0.0009289488957821559, "loss": 2.5354, "step": 19981 }, { "epoch": 0.54, "learning_rate": 0.000928862076833996, "loss": 2.3476, "step": 19982 }, { "epoch": 0.54, "learning_rate": 0.0009287752584247643, "loss": 2.6093, "step": 19983 }, { "epoch": 0.54, "learning_rate": 0.0009286884405551187, "loss": 2.8706, "step": 19984 }, { "epoch": 0.54, "learning_rate": 0.0009286016232257165, "loss": 2.6421, "step": 19985 }, { "epoch": 0.54, "learning_rate": 0.0009285148064372158, "loss": 2.6906, "step": 19986 }, { "epoch": 0.54, "learning_rate": 0.0009284279901902744, "loss": 2.7735, "step": 19987 }, { "epoch": 0.54, "learning_rate": 0.0009283411744855491, "loss": 2.4918, "step": 19988 }, { "epoch": 0.54, "learning_rate": 0.0009282543593236989, "loss": 2.5931, "step": 19989 }, { "epoch": 0.54, "learning_rate": 0.0009281675447053804, "loss": 2.53, "step": 19990 }, { "epoch": 0.54, "learning_rate": 0.0009280807306312519, "loss": 2.5123, "step": 19991 }, { "epoch": 0.54, "learning_rate": 0.000927993917101971, "loss": 2.4018, "step": 19992 }, { "epoch": 0.54, "learning_rate": 0.0009279071041181951, "loss": 2.4742, "step": 19993 }, { "epoch": 0.54, "learning_rate": 0.0009278202916805821, "loss": 2.4066, "step": 19994 }, { "epoch": 0.54, "learning_rate": 0.00092773347978979, "loss": 2.8776, "step": 19995 }, { "epoch": 0.54, "learning_rate": 0.0009276466684464758, "loss": 2.8895, "step": 19996 }, { "epoch": 0.54, "learning_rate": 0.0009275598576512976, "loss": 2.5912, "step": 19997 }, { "epoch": 0.54, "learning_rate": 0.0009274730474049131, "loss": 2.9146, "step": 19998 }, { "epoch": 0.54, "learning_rate": 0.0009273862377079795, "loss": 2.7393, "step": 19999 }, { "epoch": 0.54, "learning_rate": 0.0009272994285611553, "loss": 2.5859, "step": 20000 }, { "epoch": 0.54, "learning_rate": 0.000927212619965097, "loss": 2.7366, "step": 20001 }, { "epoch": 0.54, "learning_rate": 0.000927125811920463, "loss": 2.9945, "step": 20002 }, { "epoch": 0.54, "learning_rate": 0.0009270390044279114, "loss": 2.4895, "step": 20003 }, { "epoch": 0.54, "learning_rate": 0.0009269521974880989, "loss": 2.3461, "step": 20004 }, { "epoch": 0.54, "learning_rate": 0.0009268653911016835, "loss": 2.9124, "step": 20005 }, { "epoch": 0.54, "learning_rate": 0.0009267785852693228, "loss": 2.4751, "step": 20006 }, { "epoch": 0.54, "learning_rate": 0.0009266917799916743, "loss": 2.7148, "step": 20007 }, { "epoch": 0.54, "learning_rate": 0.000926604975269396, "loss": 2.7608, "step": 20008 }, { "epoch": 0.54, "learning_rate": 0.0009265181711031452, "loss": 2.7604, "step": 20009 }, { "epoch": 0.54, "learning_rate": 0.0009264313674935795, "loss": 2.4002, "step": 20010 }, { "epoch": 0.54, "learning_rate": 0.0009263445644413568, "loss": 2.7511, "step": 20011 }, { "epoch": 0.54, "learning_rate": 0.0009262577619471343, "loss": 2.8579, "step": 20012 }, { "epoch": 0.54, "learning_rate": 0.0009261709600115702, "loss": 2.1106, "step": 20013 }, { "epoch": 0.54, "learning_rate": 0.0009260841586353211, "loss": 2.4249, "step": 20014 }, { "epoch": 0.54, "learning_rate": 0.0009259973578190455, "loss": 2.5643, "step": 20015 }, { "epoch": 0.54, "learning_rate": 0.000925910557563401, "loss": 2.9538, "step": 20016 }, { "epoch": 0.54, "learning_rate": 0.0009258237578690445, "loss": 2.5621, "step": 20017 }, { "epoch": 0.54, "learning_rate": 0.0009257369587366337, "loss": 2.6662, "step": 20018 }, { "epoch": 0.54, "learning_rate": 0.0009256501601668273, "loss": 2.4996, "step": 20019 }, { "epoch": 0.54, "learning_rate": 0.0009255633621602813, "loss": 2.1881, "step": 20020 }, { "epoch": 0.54, "learning_rate": 0.000925476564717654, "loss": 2.7193, "step": 20021 }, { "epoch": 0.54, "learning_rate": 0.0009253897678396032, "loss": 2.7049, "step": 20022 }, { "epoch": 0.54, "learning_rate": 0.0009253029715267858, "loss": 2.6712, "step": 20023 }, { "epoch": 0.54, "learning_rate": 0.00092521617577986, "loss": 2.5377, "step": 20024 }, { "epoch": 0.54, "learning_rate": 0.000925129380599483, "loss": 2.5772, "step": 20025 }, { "epoch": 0.54, "learning_rate": 0.0009250425859863124, "loss": 2.7991, "step": 20026 }, { "epoch": 0.54, "learning_rate": 0.000924955791941006, "loss": 2.9805, "step": 20027 }, { "epoch": 0.54, "learning_rate": 0.0009248689984642208, "loss": 2.5258, "step": 20028 }, { "epoch": 0.54, "learning_rate": 0.0009247822055566147, "loss": 2.4353, "step": 20029 }, { "epoch": 0.54, "learning_rate": 0.0009246954132188455, "loss": 2.2489, "step": 20030 }, { "epoch": 0.54, "learning_rate": 0.0009246086214515698, "loss": 3.0641, "step": 20031 }, { "epoch": 0.54, "learning_rate": 0.0009245218302554463, "loss": 2.2991, "step": 20032 }, { "epoch": 0.54, "learning_rate": 0.0009244350396311316, "loss": 2.4258, "step": 20033 }, { "epoch": 0.54, "learning_rate": 0.0009243482495792835, "loss": 2.3321, "step": 20034 }, { "epoch": 0.54, "learning_rate": 0.0009242614601005597, "loss": 2.3498, "step": 20035 }, { "epoch": 0.54, "learning_rate": 0.0009241746711956174, "loss": 2.8117, "step": 20036 }, { "epoch": 0.54, "learning_rate": 0.0009240878828651141, "loss": 2.7656, "step": 20037 }, { "epoch": 0.54, "learning_rate": 0.0009240010951097078, "loss": 2.5514, "step": 20038 }, { "epoch": 0.54, "learning_rate": 0.0009239143079300552, "loss": 2.3479, "step": 20039 }, { "epoch": 0.54, "learning_rate": 0.0009238275213268147, "loss": 2.5353, "step": 20040 }, { "epoch": 0.54, "learning_rate": 0.0009237407353006428, "loss": 2.4825, "step": 20041 }, { "epoch": 0.54, "learning_rate": 0.0009236539498521976, "loss": 2.3342, "step": 20042 }, { "epoch": 0.54, "learning_rate": 0.0009235671649821369, "loss": 2.7732, "step": 20043 }, { "epoch": 0.54, "learning_rate": 0.0009234803806911169, "loss": 2.4328, "step": 20044 }, { "epoch": 0.54, "learning_rate": 0.0009233935969797962, "loss": 2.6235, "step": 20045 }, { "epoch": 0.54, "learning_rate": 0.0009233068138488322, "loss": 2.3758, "step": 20046 }, { "epoch": 0.54, "learning_rate": 0.0009232200312988818, "loss": 2.6094, "step": 20047 }, { "epoch": 0.54, "learning_rate": 0.0009231332493306028, "loss": 2.4858, "step": 20048 }, { "epoch": 0.54, "learning_rate": 0.0009230464679446524, "loss": 2.1626, "step": 20049 }, { "epoch": 0.54, "learning_rate": 0.0009229596871416882, "loss": 2.3614, "step": 20050 }, { "epoch": 0.54, "learning_rate": 0.0009228729069223678, "loss": 2.8218, "step": 20051 }, { "epoch": 0.54, "learning_rate": 0.0009227861272873483, "loss": 2.3244, "step": 20052 }, { "epoch": 0.54, "learning_rate": 0.0009226993482372873, "loss": 2.5148, "step": 20053 }, { "epoch": 0.54, "learning_rate": 0.0009226125697728425, "loss": 2.5307, "step": 20054 }, { "epoch": 0.54, "learning_rate": 0.0009225257918946707, "loss": 2.549, "step": 20055 }, { "epoch": 0.54, "learning_rate": 0.0009224390146034302, "loss": 2.2319, "step": 20056 }, { "epoch": 0.54, "learning_rate": 0.0009223522378997771, "loss": 2.5659, "step": 20057 }, { "epoch": 0.54, "learning_rate": 0.0009222654617843698, "loss": 2.6202, "step": 20058 }, { "epoch": 0.54, "learning_rate": 0.0009221786862578659, "loss": 2.7623, "step": 20059 }, { "epoch": 0.54, "learning_rate": 0.0009220919113209219, "loss": 2.5496, "step": 20060 }, { "epoch": 0.54, "learning_rate": 0.0009220051369741955, "loss": 2.4174, "step": 20061 }, { "epoch": 0.54, "learning_rate": 0.0009219183632183449, "loss": 2.2181, "step": 20062 }, { "epoch": 0.54, "learning_rate": 0.0009218315900540264, "loss": 2.3616, "step": 20063 }, { "epoch": 0.54, "learning_rate": 0.0009217448174818977, "loss": 2.3061, "step": 20064 }, { "epoch": 0.54, "learning_rate": 0.0009216580455026165, "loss": 2.3555, "step": 20065 }, { "epoch": 0.54, "learning_rate": 0.0009215712741168398, "loss": 2.3188, "step": 20066 }, { "epoch": 0.54, "learning_rate": 0.0009214845033252252, "loss": 2.637, "step": 20067 }, { "epoch": 0.54, "learning_rate": 0.0009213977331284299, "loss": 2.2952, "step": 20068 }, { "epoch": 0.54, "learning_rate": 0.0009213109635271113, "loss": 2.5414, "step": 20069 }, { "epoch": 0.54, "learning_rate": 0.000921224194521927, "loss": 2.7581, "step": 20070 }, { "epoch": 0.54, "learning_rate": 0.0009211374261135338, "loss": 2.4614, "step": 20071 }, { "epoch": 0.54, "learning_rate": 0.0009210506583025894, "loss": 2.2916, "step": 20072 }, { "epoch": 0.54, "learning_rate": 0.0009209638910897516, "loss": 2.4599, "step": 20073 }, { "epoch": 0.54, "learning_rate": 0.0009208771244756764, "loss": 2.8332, "step": 20074 }, { "epoch": 0.54, "learning_rate": 0.0009207903584610228, "loss": 2.7468, "step": 20075 }, { "epoch": 0.54, "learning_rate": 0.0009207035930464468, "loss": 2.4414, "step": 20076 }, { "epoch": 0.54, "learning_rate": 0.0009206168282326062, "loss": 2.7882, "step": 20077 }, { "epoch": 0.54, "learning_rate": 0.0009205300640201584, "loss": 2.5471, "step": 20078 }, { "epoch": 0.54, "learning_rate": 0.0009204433004097605, "loss": 2.7243, "step": 20079 }, { "epoch": 0.54, "learning_rate": 0.00092035653740207, "loss": 2.5886, "step": 20080 }, { "epoch": 0.54, "learning_rate": 0.0009202697749977443, "loss": 2.2354, "step": 20081 }, { "epoch": 0.54, "learning_rate": 0.0009201830131974403, "loss": 2.4491, "step": 20082 }, { "epoch": 0.54, "learning_rate": 0.0009200962520018158, "loss": 2.6317, "step": 20083 }, { "epoch": 0.54, "learning_rate": 0.0009200094914115275, "loss": 2.3578, "step": 20084 }, { "epoch": 0.54, "learning_rate": 0.0009199227314272331, "loss": 2.7609, "step": 20085 }, { "epoch": 0.54, "learning_rate": 0.0009198359720495899, "loss": 2.456, "step": 20086 }, { "epoch": 0.54, "learning_rate": 0.0009197492132792549, "loss": 2.0869, "step": 20087 }, { "epoch": 0.54, "learning_rate": 0.0009196624551168855, "loss": 2.7899, "step": 20088 }, { "epoch": 0.54, "learning_rate": 0.0009195756975631394, "loss": 2.2641, "step": 20089 }, { "epoch": 0.54, "learning_rate": 0.0009194889406186727, "loss": 2.5181, "step": 20090 }, { "epoch": 0.54, "learning_rate": 0.0009194021842841441, "loss": 2.4227, "step": 20091 }, { "epoch": 0.54, "learning_rate": 0.0009193154285602098, "loss": 3.0571, "step": 20092 }, { "epoch": 0.54, "learning_rate": 0.0009192286734475273, "loss": 2.677, "step": 20093 }, { "epoch": 0.54, "learning_rate": 0.0009191419189467541, "loss": 2.8473, "step": 20094 }, { "epoch": 0.54, "learning_rate": 0.0009190551650585471, "loss": 2.5603, "step": 20095 }, { "epoch": 0.54, "learning_rate": 0.0009189684117835637, "loss": 2.6301, "step": 20096 }, { "epoch": 0.54, "learning_rate": 0.0009188816591224613, "loss": 2.222, "step": 20097 }, { "epoch": 0.54, "learning_rate": 0.0009187949070758968, "loss": 2.4246, "step": 20098 }, { "epoch": 0.54, "learning_rate": 0.0009187081556445276, "loss": 2.8923, "step": 20099 }, { "epoch": 0.54, "learning_rate": 0.000918621404829011, "loss": 2.8249, "step": 20100 }, { "epoch": 0.54, "learning_rate": 0.000918534654630004, "loss": 2.4448, "step": 20101 }, { "epoch": 0.54, "learning_rate": 0.0009184479050481642, "loss": 2.2952, "step": 20102 }, { "epoch": 0.54, "learning_rate": 0.0009183611560841478, "loss": 2.4841, "step": 20103 }, { "epoch": 0.54, "learning_rate": 0.000918274407738613, "loss": 2.6325, "step": 20104 }, { "epoch": 0.54, "learning_rate": 0.0009181876600122171, "loss": 2.313, "step": 20105 }, { "epoch": 0.54, "learning_rate": 0.0009181009129056164, "loss": 2.8994, "step": 20106 }, { "epoch": 0.54, "learning_rate": 0.0009180141664194684, "loss": 2.4717, "step": 20107 }, { "epoch": 0.54, "learning_rate": 0.000917927420554431, "loss": 2.7153, "step": 20108 }, { "epoch": 0.54, "learning_rate": 0.0009178406753111604, "loss": 2.3552, "step": 20109 }, { "epoch": 0.54, "learning_rate": 0.0009177539306903142, "loss": 2.1036, "step": 20110 }, { "epoch": 0.54, "learning_rate": 0.0009176671866925495, "loss": 2.322, "step": 20111 }, { "epoch": 0.54, "learning_rate": 0.0009175804433185234, "loss": 2.4884, "step": 20112 }, { "epoch": 0.54, "learning_rate": 0.0009174937005688934, "loss": 2.8112, "step": 20113 }, { "epoch": 0.54, "learning_rate": 0.000917406958444316, "loss": 2.7655, "step": 20114 }, { "epoch": 0.54, "learning_rate": 0.0009173202169454489, "loss": 2.8255, "step": 20115 }, { "epoch": 0.54, "learning_rate": 0.0009172334760729491, "loss": 2.4848, "step": 20116 }, { "epoch": 0.54, "learning_rate": 0.0009171467358274737, "loss": 2.8511, "step": 20117 }, { "epoch": 0.54, "learning_rate": 0.0009170599962096801, "loss": 2.5265, "step": 20118 }, { "epoch": 0.54, "learning_rate": 0.0009169732572202247, "loss": 2.3979, "step": 20119 }, { "epoch": 0.54, "learning_rate": 0.0009168865188597648, "loss": 2.6954, "step": 20120 }, { "epoch": 0.54, "learning_rate": 0.0009167997811289585, "loss": 2.2728, "step": 20121 }, { "epoch": 0.54, "learning_rate": 0.0009167130440284617, "loss": 2.3193, "step": 20122 }, { "epoch": 0.54, "learning_rate": 0.000916626307558932, "loss": 2.322, "step": 20123 }, { "epoch": 0.54, "learning_rate": 0.0009165395717210268, "loss": 2.5874, "step": 20124 }, { "epoch": 0.54, "learning_rate": 0.0009164528365154026, "loss": 2.406, "step": 20125 }, { "epoch": 0.54, "learning_rate": 0.000916366101942717, "loss": 2.1398, "step": 20126 }, { "epoch": 0.54, "learning_rate": 0.0009162793680036267, "loss": 2.3609, "step": 20127 }, { "epoch": 0.54, "learning_rate": 0.0009161926346987888, "loss": 2.3827, "step": 20128 }, { "epoch": 0.54, "learning_rate": 0.0009161059020288607, "loss": 2.4726, "step": 20129 }, { "epoch": 0.54, "learning_rate": 0.0009160191699944993, "loss": 2.1107, "step": 20130 }, { "epoch": 0.54, "learning_rate": 0.0009159324385963615, "loss": 2.7138, "step": 20131 }, { "epoch": 0.54, "learning_rate": 0.000915845707835105, "loss": 2.0572, "step": 20132 }, { "epoch": 0.54, "learning_rate": 0.0009157589777113857, "loss": 1.9863, "step": 20133 }, { "epoch": 0.54, "learning_rate": 0.0009156722482258616, "loss": 2.4015, "step": 20134 }, { "epoch": 0.54, "learning_rate": 0.0009155855193791897, "loss": 2.7856, "step": 20135 }, { "epoch": 0.54, "learning_rate": 0.0009154987911720266, "loss": 2.7189, "step": 20136 }, { "epoch": 0.54, "learning_rate": 0.0009154120636050297, "loss": 2.7558, "step": 20137 }, { "epoch": 0.54, "learning_rate": 0.0009153253366788556, "loss": 2.5177, "step": 20138 }, { "epoch": 0.54, "learning_rate": 0.0009152386103941618, "loss": 2.587, "step": 20139 }, { "epoch": 0.54, "learning_rate": 0.0009151518847516052, "loss": 2.2341, "step": 20140 }, { "epoch": 0.54, "learning_rate": 0.0009150651597518426, "loss": 2.6095, "step": 20141 }, { "epoch": 0.54, "learning_rate": 0.000914978435395531, "loss": 2.3377, "step": 20142 }, { "epoch": 0.54, "learning_rate": 0.000914891711683328, "loss": 2.6549, "step": 20143 }, { "epoch": 0.54, "learning_rate": 0.0009148049886158897, "loss": 2.6678, "step": 20144 }, { "epoch": 0.54, "learning_rate": 0.0009147182661938744, "loss": 2.5757, "step": 20145 }, { "epoch": 0.54, "learning_rate": 0.0009146315444179373, "loss": 2.601, "step": 20146 }, { "epoch": 0.54, "learning_rate": 0.0009145448232887367, "loss": 2.458, "step": 20147 }, { "epoch": 0.54, "learning_rate": 0.0009144581028069297, "loss": 2.4367, "step": 20148 }, { "epoch": 0.54, "learning_rate": 0.0009143713829731722, "loss": 2.5504, "step": 20149 }, { "epoch": 0.54, "learning_rate": 0.0009142846637881217, "loss": 2.4862, "step": 20150 }, { "epoch": 0.54, "learning_rate": 0.000914197945252436, "loss": 2.6983, "step": 20151 }, { "epoch": 0.54, "learning_rate": 0.0009141112273667708, "loss": 2.6298, "step": 20152 }, { "epoch": 0.54, "learning_rate": 0.0009140245101317838, "loss": 2.5004, "step": 20153 }, { "epoch": 0.54, "learning_rate": 0.0009139377935481316, "loss": 2.3587, "step": 20154 }, { "epoch": 0.54, "learning_rate": 0.0009138510776164712, "loss": 2.5144, "step": 20155 }, { "epoch": 0.54, "learning_rate": 0.0009137643623374598, "loss": 2.4603, "step": 20156 }, { "epoch": 0.54, "learning_rate": 0.0009136776477117541, "loss": 3.0783, "step": 20157 }, { "epoch": 0.54, "learning_rate": 0.000913590933740011, "loss": 2.3465, "step": 20158 }, { "epoch": 0.54, "learning_rate": 0.0009135042204228878, "loss": 2.7826, "step": 20159 }, { "epoch": 0.54, "learning_rate": 0.0009134175077610409, "loss": 2.4396, "step": 20160 }, { "epoch": 0.54, "learning_rate": 0.000913330795755128, "loss": 2.134, "step": 20161 }, { "epoch": 0.54, "learning_rate": 0.0009132440844058051, "loss": 2.5932, "step": 20162 }, { "epoch": 0.54, "learning_rate": 0.0009131573737137292, "loss": 2.9726, "step": 20163 }, { "epoch": 0.54, "learning_rate": 0.0009130706636795581, "loss": 2.2792, "step": 20164 }, { "epoch": 0.54, "learning_rate": 0.0009129839543039477, "loss": 2.2271, "step": 20165 }, { "epoch": 0.54, "learning_rate": 0.0009128972455875555, "loss": 2.4855, "step": 20166 }, { "epoch": 0.54, "learning_rate": 0.0009128105375310382, "loss": 2.6011, "step": 20167 }, { "epoch": 0.54, "learning_rate": 0.0009127238301350525, "loss": 2.2939, "step": 20168 }, { "epoch": 0.54, "learning_rate": 0.0009126371234002555, "loss": 2.2537, "step": 20169 }, { "epoch": 0.54, "learning_rate": 0.0009125504173273043, "loss": 2.7557, "step": 20170 }, { "epoch": 0.54, "learning_rate": 0.0009124637119168552, "loss": 2.9489, "step": 20171 }, { "epoch": 0.54, "learning_rate": 0.0009123770071695656, "loss": 2.4892, "step": 20172 }, { "epoch": 0.54, "learning_rate": 0.000912290303086092, "loss": 2.3748, "step": 20173 }, { "epoch": 0.54, "learning_rate": 0.0009122035996670913, "loss": 2.2524, "step": 20174 }, { "epoch": 0.54, "learning_rate": 0.0009121168969132208, "loss": 2.4925, "step": 20175 }, { "epoch": 0.54, "learning_rate": 0.0009120301948251364, "loss": 2.3036, "step": 20176 }, { "epoch": 0.54, "learning_rate": 0.0009119434934034958, "loss": 2.4407, "step": 20177 }, { "epoch": 0.54, "learning_rate": 0.0009118567926489559, "loss": 2.8583, "step": 20178 }, { "epoch": 0.54, "learning_rate": 0.0009117700925621727, "loss": 2.6096, "step": 20179 }, { "epoch": 0.54, "learning_rate": 0.0009116833931438038, "loss": 2.7887, "step": 20180 }, { "epoch": 0.54, "learning_rate": 0.0009115966943945055, "loss": 2.834, "step": 20181 }, { "epoch": 0.54, "learning_rate": 0.0009115099963149348, "loss": 3.0862, "step": 20182 }, { "epoch": 0.54, "learning_rate": 0.0009114232989057489, "loss": 2.0968, "step": 20183 }, { "epoch": 0.54, "learning_rate": 0.0009113366021676039, "loss": 2.6231, "step": 20184 }, { "epoch": 0.54, "learning_rate": 0.000911249906101157, "loss": 2.279, "step": 20185 }, { "epoch": 0.54, "learning_rate": 0.0009111632107070651, "loss": 2.451, "step": 20186 }, { "epoch": 0.54, "learning_rate": 0.0009110765159859847, "loss": 2.5616, "step": 20187 }, { "epoch": 0.54, "learning_rate": 0.000910989821938573, "loss": 2.5528, "step": 20188 }, { "epoch": 0.54, "learning_rate": 0.000910903128565486, "loss": 2.4064, "step": 20189 }, { "epoch": 0.54, "learning_rate": 0.0009108164358673812, "loss": 2.5655, "step": 20190 }, { "epoch": 0.54, "learning_rate": 0.0009107297438449154, "loss": 2.2747, "step": 20191 }, { "epoch": 0.54, "learning_rate": 0.0009106430524987448, "loss": 2.615, "step": 20192 }, { "epoch": 0.54, "learning_rate": 0.0009105563618295263, "loss": 2.6872, "step": 20193 }, { "epoch": 0.54, "learning_rate": 0.0009104696718379173, "loss": 2.6641, "step": 20194 }, { "epoch": 0.54, "learning_rate": 0.0009103829825245738, "loss": 2.4905, "step": 20195 }, { "epoch": 0.54, "learning_rate": 0.0009102962938901529, "loss": 2.2404, "step": 20196 }, { "epoch": 0.54, "learning_rate": 0.000910209605935311, "loss": 2.8681, "step": 20197 }, { "epoch": 0.54, "learning_rate": 0.0009101229186607052, "loss": 2.7356, "step": 20198 }, { "epoch": 0.54, "learning_rate": 0.0009100362320669922, "loss": 2.8638, "step": 20199 }, { "epoch": 0.54, "learning_rate": 0.0009099495461548284, "loss": 2.567, "step": 20200 }, { "epoch": 0.54, "learning_rate": 0.0009098628609248708, "loss": 2.6917, "step": 20201 }, { "epoch": 0.54, "learning_rate": 0.0009097761763777763, "loss": 2.6688, "step": 20202 }, { "epoch": 0.54, "learning_rate": 0.0009096894925142011, "loss": 2.309, "step": 20203 }, { "epoch": 0.54, "learning_rate": 0.0009096028093348025, "loss": 2.6823, "step": 20204 }, { "epoch": 0.54, "learning_rate": 0.0009095161268402365, "loss": 2.5899, "step": 20205 }, { "epoch": 0.54, "learning_rate": 0.0009094294450311599, "loss": 2.6521, "step": 20206 }, { "epoch": 0.54, "learning_rate": 0.0009093427639082303, "loss": 2.5148, "step": 20207 }, { "epoch": 0.54, "learning_rate": 0.0009092560834721034, "loss": 2.8156, "step": 20208 }, { "epoch": 0.54, "learning_rate": 0.000909169403723436, "loss": 2.3762, "step": 20209 }, { "epoch": 0.54, "learning_rate": 0.0009090827246628853, "loss": 2.4426, "step": 20210 }, { "epoch": 0.54, "learning_rate": 0.0009089960462911074, "loss": 2.262, "step": 20211 }, { "epoch": 0.54, "learning_rate": 0.000908909368608759, "loss": 2.5912, "step": 20212 }, { "epoch": 0.54, "learning_rate": 0.0009088226916164975, "loss": 2.0758, "step": 20213 }, { "epoch": 0.54, "learning_rate": 0.0009087360153149785, "loss": 2.3373, "step": 20214 }, { "epoch": 0.54, "learning_rate": 0.0009086493397048594, "loss": 2.7735, "step": 20215 }, { "epoch": 0.54, "learning_rate": 0.0009085626647867964, "loss": 2.3839, "step": 20216 }, { "epoch": 0.54, "learning_rate": 0.0009084759905614463, "loss": 2.2904, "step": 20217 }, { "epoch": 0.54, "learning_rate": 0.0009083893170294662, "loss": 2.6105, "step": 20218 }, { "epoch": 0.54, "learning_rate": 0.0009083026441915114, "loss": 2.5927, "step": 20219 }, { "epoch": 0.54, "learning_rate": 0.0009082159720482398, "loss": 2.2608, "step": 20220 }, { "epoch": 0.54, "learning_rate": 0.0009081293006003079, "loss": 2.6306, "step": 20221 }, { "epoch": 0.54, "learning_rate": 0.0009080426298483717, "loss": 2.5213, "step": 20222 }, { "epoch": 0.54, "learning_rate": 0.0009079559597930882, "loss": 1.9824, "step": 20223 }, { "epoch": 0.54, "learning_rate": 0.0009078692904351137, "loss": 2.0839, "step": 20224 }, { "epoch": 0.54, "learning_rate": 0.000907782621775105, "loss": 2.7198, "step": 20225 }, { "epoch": 0.54, "learning_rate": 0.0009076959538137188, "loss": 2.7027, "step": 20226 }, { "epoch": 0.54, "learning_rate": 0.0009076092865516114, "loss": 2.7155, "step": 20227 }, { "epoch": 0.54, "learning_rate": 0.0009075226199894397, "loss": 2.8982, "step": 20228 }, { "epoch": 0.54, "learning_rate": 0.0009074359541278601, "loss": 2.5279, "step": 20229 }, { "epoch": 0.54, "learning_rate": 0.0009073492889675289, "loss": 2.5651, "step": 20230 }, { "epoch": 0.54, "learning_rate": 0.0009072626245091035, "loss": 2.5576, "step": 20231 }, { "epoch": 0.54, "learning_rate": 0.0009071759607532393, "loss": 2.5921, "step": 20232 }, { "epoch": 0.54, "learning_rate": 0.0009070892977005935, "loss": 2.7469, "step": 20233 }, { "epoch": 0.54, "learning_rate": 0.0009070026353518231, "loss": 2.632, "step": 20234 }, { "epoch": 0.54, "learning_rate": 0.0009069159737075835, "loss": 2.7646, "step": 20235 }, { "epoch": 0.54, "learning_rate": 0.0009068293127685317, "loss": 2.5194, "step": 20236 }, { "epoch": 0.54, "learning_rate": 0.000906742652535325, "loss": 2.6391, "step": 20237 }, { "epoch": 0.54, "learning_rate": 0.000906655993008619, "loss": 2.3761, "step": 20238 }, { "epoch": 0.54, "learning_rate": 0.0009065693341890706, "loss": 2.3521, "step": 20239 }, { "epoch": 0.54, "learning_rate": 0.0009064826760773361, "loss": 2.4961, "step": 20240 }, { "epoch": 0.54, "learning_rate": 0.000906396018674072, "loss": 2.5328, "step": 20241 }, { "epoch": 0.54, "learning_rate": 0.0009063093619799352, "loss": 2.6363, "step": 20242 }, { "epoch": 0.54, "learning_rate": 0.0009062227059955818, "loss": 2.332, "step": 20243 }, { "epoch": 0.54, "learning_rate": 0.0009061360507216683, "loss": 2.2305, "step": 20244 }, { "epoch": 0.54, "learning_rate": 0.0009060493961588515, "loss": 2.5116, "step": 20245 }, { "epoch": 0.54, "learning_rate": 0.0009059627423077876, "loss": 2.751, "step": 20246 }, { "epoch": 0.54, "learning_rate": 0.000905876089169133, "loss": 2.2185, "step": 20247 }, { "epoch": 0.54, "learning_rate": 0.0009057894367435448, "loss": 2.7762, "step": 20248 }, { "epoch": 0.54, "learning_rate": 0.0009057027850316783, "loss": 2.111, "step": 20249 }, { "epoch": 0.54, "learning_rate": 0.0009056161340341914, "loss": 2.5573, "step": 20250 }, { "epoch": 0.54, "learning_rate": 0.0009055294837517393, "loss": 2.713, "step": 20251 }, { "epoch": 0.54, "learning_rate": 0.0009054428341849787, "loss": 2.7208, "step": 20252 }, { "epoch": 0.54, "learning_rate": 0.000905356185334567, "loss": 2.9283, "step": 20253 }, { "epoch": 0.54, "learning_rate": 0.0009052695372011594, "loss": 2.3436, "step": 20254 }, { "epoch": 0.54, "learning_rate": 0.0009051828897854128, "loss": 2.4421, "step": 20255 }, { "epoch": 0.54, "learning_rate": 0.0009050962430879841, "loss": 2.4544, "step": 20256 }, { "epoch": 0.54, "learning_rate": 0.0009050095971095289, "loss": 2.2465, "step": 20257 }, { "epoch": 0.54, "learning_rate": 0.0009049229518507043, "loss": 2.3584, "step": 20258 }, { "epoch": 0.54, "learning_rate": 0.0009048363073121662, "loss": 2.5909, "step": 20259 }, { "epoch": 0.54, "learning_rate": 0.0009047496634945712, "loss": 2.6621, "step": 20260 }, { "epoch": 0.54, "learning_rate": 0.0009046630203985759, "loss": 2.3015, "step": 20261 }, { "epoch": 0.54, "learning_rate": 0.0009045763780248364, "loss": 2.5661, "step": 20262 }, { "epoch": 0.54, "learning_rate": 0.0009044897363740092, "loss": 2.6739, "step": 20263 }, { "epoch": 0.54, "learning_rate": 0.000904403095446751, "loss": 2.5328, "step": 20264 }, { "epoch": 0.54, "learning_rate": 0.0009043164552437174, "loss": 2.5941, "step": 20265 }, { "epoch": 0.54, "learning_rate": 0.0009042298157655657, "loss": 2.6244, "step": 20266 }, { "epoch": 0.54, "learning_rate": 0.0009041431770129513, "loss": 2.6108, "step": 20267 }, { "epoch": 0.54, "learning_rate": 0.0009040565389865312, "loss": 2.718, "step": 20268 }, { "epoch": 0.54, "learning_rate": 0.0009039699016869618, "loss": 2.6319, "step": 20269 }, { "epoch": 0.54, "learning_rate": 0.0009038832651148991, "loss": 2.3428, "step": 20270 }, { "epoch": 0.54, "learning_rate": 0.0009037966292709994, "loss": 2.6178, "step": 20271 }, { "epoch": 0.54, "learning_rate": 0.0009037099941559196, "loss": 2.3744, "step": 20272 }, { "epoch": 0.54, "learning_rate": 0.0009036233597703154, "loss": 2.5496, "step": 20273 }, { "epoch": 0.54, "learning_rate": 0.0009035367261148437, "loss": 2.5955, "step": 20274 }, { "epoch": 0.54, "learning_rate": 0.0009034500931901602, "loss": 2.4683, "step": 20275 }, { "epoch": 0.54, "learning_rate": 0.0009033634609969215, "loss": 2.8279, "step": 20276 }, { "epoch": 0.54, "learning_rate": 0.0009032768295357845, "loss": 2.1745, "step": 20277 }, { "epoch": 0.54, "learning_rate": 0.0009031901988074042, "loss": 2.2887, "step": 20278 }, { "epoch": 0.54, "learning_rate": 0.000903103568812438, "loss": 2.6363, "step": 20279 }, { "epoch": 0.55, "learning_rate": 0.0009030169395515422, "loss": 2.6658, "step": 20280 }, { "epoch": 0.55, "learning_rate": 0.0009029303110253723, "loss": 2.2542, "step": 20281 }, { "epoch": 0.55, "learning_rate": 0.0009028436832345848, "loss": 2.4903, "step": 20282 }, { "epoch": 0.55, "learning_rate": 0.0009027570561798367, "loss": 2.5201, "step": 20283 }, { "epoch": 0.55, "learning_rate": 0.0009026704298617835, "loss": 2.3392, "step": 20284 }, { "epoch": 0.55, "learning_rate": 0.0009025838042810818, "loss": 2.3494, "step": 20285 }, { "epoch": 0.55, "learning_rate": 0.0009024971794383876, "loss": 2.1064, "step": 20286 }, { "epoch": 0.55, "learning_rate": 0.0009024105553343575, "loss": 2.2002, "step": 20287 }, { "epoch": 0.55, "learning_rate": 0.0009023239319696475, "loss": 2.6399, "step": 20288 }, { "epoch": 0.55, "learning_rate": 0.000902237309344914, "loss": 2.2129, "step": 20289 }, { "epoch": 0.55, "learning_rate": 0.000902150687460813, "loss": 2.1809, "step": 20290 }, { "epoch": 0.55, "learning_rate": 0.0009020640663180012, "loss": 2.6288, "step": 20291 }, { "epoch": 0.55, "learning_rate": 0.0009019774459171343, "loss": 2.7823, "step": 20292 }, { "epoch": 0.55, "learning_rate": 0.0009018908262588691, "loss": 2.4076, "step": 20293 }, { "epoch": 0.55, "learning_rate": 0.000901804207343861, "loss": 2.4302, "step": 20294 }, { "epoch": 0.55, "learning_rate": 0.0009017175891727666, "loss": 2.5957, "step": 20295 }, { "epoch": 0.55, "learning_rate": 0.0009016309717462428, "loss": 1.8905, "step": 20296 }, { "epoch": 0.55, "learning_rate": 0.0009015443550649447, "loss": 2.5694, "step": 20297 }, { "epoch": 0.55, "learning_rate": 0.0009014577391295289, "loss": 2.1083, "step": 20298 }, { "epoch": 0.55, "learning_rate": 0.0009013711239406519, "loss": 2.6675, "step": 20299 }, { "epoch": 0.55, "learning_rate": 0.0009012845094989694, "loss": 2.2647, "step": 20300 }, { "epoch": 0.55, "learning_rate": 0.0009011978958051381, "loss": 2.7667, "step": 20301 }, { "epoch": 0.55, "learning_rate": 0.0009011112828598136, "loss": 2.3787, "step": 20302 }, { "epoch": 0.55, "learning_rate": 0.0009010246706636525, "loss": 2.7217, "step": 20303 }, { "epoch": 0.55, "learning_rate": 0.0009009380592173107, "loss": 2.5603, "step": 20304 }, { "epoch": 0.55, "learning_rate": 0.0009008514485214445, "loss": 2.3363, "step": 20305 }, { "epoch": 0.55, "learning_rate": 0.0009007648385767099, "loss": 2.2475, "step": 20306 }, { "epoch": 0.55, "learning_rate": 0.0009006782293837636, "loss": 2.7702, "step": 20307 }, { "epoch": 0.55, "learning_rate": 0.0009005916209432606, "loss": 2.6653, "step": 20308 }, { "epoch": 0.55, "learning_rate": 0.0009005050132558584, "loss": 1.9947, "step": 20309 }, { "epoch": 0.55, "learning_rate": 0.0009004184063222119, "loss": 2.6786, "step": 20310 }, { "epoch": 0.55, "learning_rate": 0.0009003318001429779, "loss": 2.2837, "step": 20311 }, { "epoch": 0.55, "learning_rate": 0.0009002451947188125, "loss": 2.3603, "step": 20312 }, { "epoch": 0.55, "learning_rate": 0.0009001585900503715, "loss": 2.7337, "step": 20313 }, { "epoch": 0.55, "learning_rate": 0.0009000719861383111, "loss": 2.2953, "step": 20314 }, { "epoch": 0.55, "learning_rate": 0.0008999853829832877, "loss": 2.3813, "step": 20315 }, { "epoch": 0.55, "learning_rate": 0.000899898780585957, "loss": 2.8689, "step": 20316 }, { "epoch": 0.55, "learning_rate": 0.0008998121789469753, "loss": 2.8985, "step": 20317 }, { "epoch": 0.55, "learning_rate": 0.0008997255780669987, "loss": 2.1569, "step": 20318 }, { "epoch": 0.55, "learning_rate": 0.000899638977946683, "loss": 2.7576, "step": 20319 }, { "epoch": 0.55, "learning_rate": 0.0008995523785866849, "loss": 2.4702, "step": 20320 }, { "epoch": 0.55, "learning_rate": 0.0008994657799876592, "loss": 2.8687, "step": 20321 }, { "epoch": 0.55, "learning_rate": 0.0008993791821502633, "loss": 2.6619, "step": 20322 }, { "epoch": 0.55, "learning_rate": 0.000899292585075153, "loss": 2.2822, "step": 20323 }, { "epoch": 0.55, "learning_rate": 0.0008992059887629836, "loss": 2.8538, "step": 20324 }, { "epoch": 0.55, "learning_rate": 0.0008991193932144115, "loss": 2.3908, "step": 20325 }, { "epoch": 0.55, "learning_rate": 0.0008990327984300934, "loss": 2.4146, "step": 20326 }, { "epoch": 0.55, "learning_rate": 0.0008989462044106844, "loss": 2.4148, "step": 20327 }, { "epoch": 0.55, "learning_rate": 0.0008988596111568411, "loss": 2.2441, "step": 20328 }, { "epoch": 0.55, "learning_rate": 0.0008987730186692191, "loss": 2.8939, "step": 20329 }, { "epoch": 0.55, "learning_rate": 0.0008986864269484746, "loss": 2.671, "step": 20330 }, { "epoch": 0.55, "learning_rate": 0.0008985998359952637, "loss": 2.0718, "step": 20331 }, { "epoch": 0.55, "learning_rate": 0.0008985132458102423, "loss": 2.376, "step": 20332 }, { "epoch": 0.55, "learning_rate": 0.0008984266563940663, "loss": 2.7906, "step": 20333 }, { "epoch": 0.55, "learning_rate": 0.0008983400677473921, "loss": 2.1913, "step": 20334 }, { "epoch": 0.55, "learning_rate": 0.000898253479870875, "loss": 2.5075, "step": 20335 }, { "epoch": 0.55, "learning_rate": 0.000898166892765172, "loss": 2.368, "step": 20336 }, { "epoch": 0.55, "learning_rate": 0.0008980803064309377, "loss": 2.4266, "step": 20337 }, { "epoch": 0.55, "learning_rate": 0.0008979937208688286, "loss": 2.2931, "step": 20338 }, { "epoch": 0.55, "learning_rate": 0.0008979071360795017, "loss": 2.7293, "step": 20339 }, { "epoch": 0.55, "learning_rate": 0.0008978205520636115, "loss": 2.5445, "step": 20340 }, { "epoch": 0.55, "learning_rate": 0.0008977339688218147, "loss": 2.4782, "step": 20341 }, { "epoch": 0.55, "learning_rate": 0.0008976473863547672, "loss": 2.5322, "step": 20342 }, { "epoch": 0.55, "learning_rate": 0.0008975608046631245, "loss": 2.3816, "step": 20343 }, { "epoch": 0.55, "learning_rate": 0.0008974742237475431, "loss": 2.8759, "step": 20344 }, { "epoch": 0.55, "learning_rate": 0.0008973876436086783, "loss": 2.5792, "step": 20345 }, { "epoch": 0.55, "learning_rate": 0.0008973010642471867, "loss": 2.5127, "step": 20346 }, { "epoch": 0.55, "learning_rate": 0.0008972144856637238, "loss": 2.5978, "step": 20347 }, { "epoch": 0.55, "learning_rate": 0.0008971279078589454, "loss": 2.141, "step": 20348 }, { "epoch": 0.55, "learning_rate": 0.0008970413308335076, "loss": 2.8838, "step": 20349 }, { "epoch": 0.55, "learning_rate": 0.0008969547545880668, "loss": 2.8849, "step": 20350 }, { "epoch": 0.55, "learning_rate": 0.0008968681791232775, "loss": 2.4056, "step": 20351 }, { "epoch": 0.55, "learning_rate": 0.0008967816044397973, "loss": 2.449, "step": 20352 }, { "epoch": 0.55, "learning_rate": 0.0008966950305382808, "loss": 2.3425, "step": 20353 }, { "epoch": 0.55, "learning_rate": 0.000896608457419384, "loss": 2.6187, "step": 20354 }, { "epoch": 0.55, "learning_rate": 0.0008965218850837635, "loss": 2.3133, "step": 20355 }, { "epoch": 0.55, "learning_rate": 0.0008964353135320744, "loss": 2.5126, "step": 20356 }, { "epoch": 0.55, "learning_rate": 0.0008963487427649729, "loss": 2.3278, "step": 20357 }, { "epoch": 0.55, "learning_rate": 0.000896262172783115, "loss": 2.6846, "step": 20358 }, { "epoch": 0.55, "learning_rate": 0.0008961756035871561, "loss": 3.01, "step": 20359 }, { "epoch": 0.55, "learning_rate": 0.0008960890351777522, "loss": 2.2943, "step": 20360 }, { "epoch": 0.55, "learning_rate": 0.0008960024675555595, "loss": 2.5381, "step": 20361 }, { "epoch": 0.55, "learning_rate": 0.0008959159007212332, "loss": 2.4812, "step": 20362 }, { "epoch": 0.55, "learning_rate": 0.0008958293346754301, "loss": 2.3119, "step": 20363 }, { "epoch": 0.55, "learning_rate": 0.0008957427694188044, "loss": 2.9124, "step": 20364 }, { "epoch": 0.55, "learning_rate": 0.0008956562049520131, "loss": 2.9831, "step": 20365 }, { "epoch": 0.55, "learning_rate": 0.0008955696412757123, "loss": 2.3787, "step": 20366 }, { "epoch": 0.55, "learning_rate": 0.0008954830783905567, "loss": 2.5853, "step": 20367 }, { "epoch": 0.55, "learning_rate": 0.0008953965162972024, "loss": 1.9111, "step": 20368 }, { "epoch": 0.55, "learning_rate": 0.000895309954996306, "loss": 2.635, "step": 20369 }, { "epoch": 0.55, "learning_rate": 0.0008952233944885224, "loss": 2.2509, "step": 20370 }, { "epoch": 0.55, "learning_rate": 0.0008951368347745078, "loss": 2.5885, "step": 20371 }, { "epoch": 0.55, "learning_rate": 0.0008950502758549175, "loss": 2.567, "step": 20372 }, { "epoch": 0.55, "learning_rate": 0.0008949637177304075, "loss": 2.9768, "step": 20373 }, { "epoch": 0.55, "learning_rate": 0.0008948771604016339, "loss": 2.4448, "step": 20374 }, { "epoch": 0.55, "learning_rate": 0.0008947906038692519, "loss": 2.5383, "step": 20375 }, { "epoch": 0.55, "learning_rate": 0.0008947040481339175, "loss": 1.8894, "step": 20376 }, { "epoch": 0.55, "learning_rate": 0.0008946174931962865, "loss": 2.2662, "step": 20377 }, { "epoch": 0.55, "learning_rate": 0.0008945309390570146, "loss": 2.5706, "step": 20378 }, { "epoch": 0.55, "learning_rate": 0.0008944443857167577, "loss": 2.3497, "step": 20379 }, { "epoch": 0.55, "learning_rate": 0.0008943578331761708, "loss": 2.6489, "step": 20380 }, { "epoch": 0.55, "learning_rate": 0.0008942712814359098, "loss": 2.3262, "step": 20381 }, { "epoch": 0.55, "learning_rate": 0.0008941847304966314, "loss": 2.5436, "step": 20382 }, { "epoch": 0.55, "learning_rate": 0.0008940981803589902, "loss": 2.6105, "step": 20383 }, { "epoch": 0.55, "learning_rate": 0.0008940116310236421, "loss": 2.5527, "step": 20384 }, { "epoch": 0.55, "learning_rate": 0.0008939250824912433, "loss": 2.4578, "step": 20385 }, { "epoch": 0.55, "learning_rate": 0.0008938385347624488, "loss": 2.5348, "step": 20386 }, { "epoch": 0.55, "learning_rate": 0.0008937519878379148, "loss": 2.0616, "step": 20387 }, { "epoch": 0.55, "learning_rate": 0.0008936654417182966, "loss": 2.8117, "step": 20388 }, { "epoch": 0.55, "learning_rate": 0.0008935788964042499, "loss": 2.4067, "step": 20389 }, { "epoch": 0.55, "learning_rate": 0.0008934923518964308, "loss": 2.4225, "step": 20390 }, { "epoch": 0.55, "learning_rate": 0.0008934058081954944, "loss": 2.3772, "step": 20391 }, { "epoch": 0.55, "learning_rate": 0.0008933192653020963, "loss": 2.3944, "step": 20392 }, { "epoch": 0.55, "learning_rate": 0.0008932327232168929, "loss": 2.5111, "step": 20393 }, { "epoch": 0.55, "learning_rate": 0.0008931461819405387, "loss": 2.2583, "step": 20394 }, { "epoch": 0.55, "learning_rate": 0.0008930596414736902, "loss": 2.5879, "step": 20395 }, { "epoch": 0.55, "learning_rate": 0.0008929731018170031, "loss": 2.5809, "step": 20396 }, { "epoch": 0.55, "learning_rate": 0.0008928865629711322, "loss": 2.6695, "step": 20397 }, { "epoch": 0.55, "learning_rate": 0.0008928000249367338, "loss": 2.4499, "step": 20398 }, { "epoch": 0.55, "learning_rate": 0.0008927134877144632, "loss": 2.4145, "step": 20399 }, { "epoch": 0.55, "learning_rate": 0.0008926269513049758, "loss": 2.999, "step": 20400 }, { "epoch": 0.55, "learning_rate": 0.0008925404157089276, "loss": 2.5862, "step": 20401 }, { "epoch": 0.55, "learning_rate": 0.0008924538809269739, "loss": 2.5509, "step": 20402 }, { "epoch": 0.55, "learning_rate": 0.0008923673469597704, "loss": 2.3101, "step": 20403 }, { "epoch": 0.55, "learning_rate": 0.0008922808138079728, "loss": 3.0079, "step": 20404 }, { "epoch": 0.55, "learning_rate": 0.0008921942814722363, "loss": 2.8117, "step": 20405 }, { "epoch": 0.55, "learning_rate": 0.000892107749953217, "loss": 2.6211, "step": 20406 }, { "epoch": 0.55, "learning_rate": 0.0008920212192515695, "loss": 2.8241, "step": 20407 }, { "epoch": 0.55, "learning_rate": 0.0008919346893679502, "loss": 2.3584, "step": 20408 }, { "epoch": 0.55, "learning_rate": 0.0008918481603030148, "loss": 2.478, "step": 20409 }, { "epoch": 0.55, "learning_rate": 0.0008917616320574179, "loss": 2.7528, "step": 20410 }, { "epoch": 0.55, "learning_rate": 0.0008916751046318153, "loss": 2.3923, "step": 20411 }, { "epoch": 0.55, "learning_rate": 0.0008915885780268636, "loss": 2.4232, "step": 20412 }, { "epoch": 0.55, "learning_rate": 0.0008915020522432168, "loss": 2.4042, "step": 20413 }, { "epoch": 0.55, "learning_rate": 0.0008914155272815313, "loss": 2.9351, "step": 20414 }, { "epoch": 0.55, "learning_rate": 0.0008913290031424622, "loss": 2.4114, "step": 20415 }, { "epoch": 0.55, "learning_rate": 0.000891242479826665, "loss": 2.2669, "step": 20416 }, { "epoch": 0.55, "learning_rate": 0.0008911559573347957, "loss": 2.6962, "step": 20417 }, { "epoch": 0.55, "learning_rate": 0.0008910694356675091, "loss": 2.7062, "step": 20418 }, { "epoch": 0.55, "learning_rate": 0.0008909829148254612, "loss": 2.6706, "step": 20419 }, { "epoch": 0.55, "learning_rate": 0.0008908963948093072, "loss": 2.5263, "step": 20420 }, { "epoch": 0.55, "learning_rate": 0.0008908098756197024, "loss": 2.8425, "step": 20421 }, { "epoch": 0.55, "learning_rate": 0.000890723357257303, "loss": 2.5222, "step": 20422 }, { "epoch": 0.55, "learning_rate": 0.0008906368397227632, "loss": 2.1598, "step": 20423 }, { "epoch": 0.55, "learning_rate": 0.0008905503230167395, "loss": 2.3383, "step": 20424 }, { "epoch": 0.55, "learning_rate": 0.0008904638071398872, "loss": 2.5945, "step": 20425 }, { "epoch": 0.55, "learning_rate": 0.0008903772920928612, "loss": 2.5628, "step": 20426 }, { "epoch": 0.55, "learning_rate": 0.000890290777876317, "loss": 2.7217, "step": 20427 }, { "epoch": 0.55, "learning_rate": 0.000890204264490911, "loss": 2.6541, "step": 20428 }, { "epoch": 0.55, "learning_rate": 0.0008901177519372974, "loss": 2.2825, "step": 20429 }, { "epoch": 0.55, "learning_rate": 0.0008900312402161319, "loss": 2.8478, "step": 20430 }, { "epoch": 0.55, "learning_rate": 0.0008899447293280704, "loss": 2.5314, "step": 20431 }, { "epoch": 0.55, "learning_rate": 0.0008898582192737678, "loss": 2.5537, "step": 20432 }, { "epoch": 0.55, "learning_rate": 0.0008897717100538798, "loss": 2.2846, "step": 20433 }, { "epoch": 0.55, "learning_rate": 0.0008896852016690613, "loss": 2.2199, "step": 20434 }, { "epoch": 0.55, "learning_rate": 0.0008895986941199681, "loss": 2.2474, "step": 20435 }, { "epoch": 0.55, "learning_rate": 0.0008895121874072557, "loss": 2.2566, "step": 20436 }, { "epoch": 0.55, "learning_rate": 0.0008894256815315789, "loss": 3.1772, "step": 20437 }, { "epoch": 0.55, "learning_rate": 0.0008893391764935935, "loss": 2.4445, "step": 20438 }, { "epoch": 0.55, "learning_rate": 0.000889252672293955, "loss": 3.0539, "step": 20439 }, { "epoch": 0.55, "learning_rate": 0.0008891661689333179, "loss": 2.4909, "step": 20440 }, { "epoch": 0.55, "learning_rate": 0.0008890796664123387, "loss": 2.5527, "step": 20441 }, { "epoch": 0.55, "learning_rate": 0.0008889931647316717, "loss": 2.5357, "step": 20442 }, { "epoch": 0.55, "learning_rate": 0.0008889066638919726, "loss": 2.7591, "step": 20443 }, { "epoch": 0.55, "learning_rate": 0.000888820163893897, "loss": 2.1327, "step": 20444 }, { "epoch": 0.55, "learning_rate": 0.0008887336647380997, "loss": 2.2794, "step": 20445 }, { "epoch": 0.55, "learning_rate": 0.0008886471664252363, "loss": 2.6111, "step": 20446 }, { "epoch": 0.55, "learning_rate": 0.0008885606689559623, "loss": 2.7545, "step": 20447 }, { "epoch": 0.55, "learning_rate": 0.0008884741723309325, "loss": 2.5766, "step": 20448 }, { "epoch": 0.55, "learning_rate": 0.0008883876765508027, "loss": 2.4255, "step": 20449 }, { "epoch": 0.55, "learning_rate": 0.0008883011816162277, "loss": 2.2529, "step": 20450 }, { "epoch": 0.55, "learning_rate": 0.0008882146875278629, "loss": 3.0371, "step": 20451 }, { "epoch": 0.55, "learning_rate": 0.0008881281942863642, "loss": 2.0034, "step": 20452 }, { "epoch": 0.55, "learning_rate": 0.0008880417018923855, "loss": 2.496, "step": 20453 }, { "epoch": 0.55, "learning_rate": 0.0008879552103465831, "loss": 2.674, "step": 20454 }, { "epoch": 0.55, "learning_rate": 0.0008878687196496125, "loss": 2.8671, "step": 20455 }, { "epoch": 0.55, "learning_rate": 0.0008877822298021279, "loss": 2.6833, "step": 20456 }, { "epoch": 0.55, "learning_rate": 0.0008876957408047853, "loss": 2.3938, "step": 20457 }, { "epoch": 0.55, "learning_rate": 0.0008876092526582395, "loss": 2.2468, "step": 20458 }, { "epoch": 0.55, "learning_rate": 0.0008875227653631459, "loss": 2.441, "step": 20459 }, { "epoch": 0.55, "learning_rate": 0.00088743627892016, "loss": 2.2837, "step": 20460 }, { "epoch": 0.55, "learning_rate": 0.0008873497933299365, "loss": 2.8905, "step": 20461 }, { "epoch": 0.55, "learning_rate": 0.0008872633085931308, "loss": 2.6302, "step": 20462 }, { "epoch": 0.55, "learning_rate": 0.0008871768247103983, "loss": 2.5039, "step": 20463 }, { "epoch": 0.55, "learning_rate": 0.0008870903416823937, "loss": 2.5903, "step": 20464 }, { "epoch": 0.55, "learning_rate": 0.0008870038595097732, "loss": 2.1793, "step": 20465 }, { "epoch": 0.55, "learning_rate": 0.0008869173781931903, "loss": 2.7431, "step": 20466 }, { "epoch": 0.55, "learning_rate": 0.0008868308977333015, "loss": 2.2624, "step": 20467 }, { "epoch": 0.55, "learning_rate": 0.000886744418130762, "loss": 2.5637, "step": 20468 }, { "epoch": 0.55, "learning_rate": 0.000886657939386226, "loss": 2.3519, "step": 20469 }, { "epoch": 0.55, "learning_rate": 0.0008865714615003492, "loss": 2.6977, "step": 20470 }, { "epoch": 0.55, "learning_rate": 0.0008864849844737872, "loss": 2.6601, "step": 20471 }, { "epoch": 0.55, "learning_rate": 0.0008863985083071943, "loss": 2.6111, "step": 20472 }, { "epoch": 0.55, "learning_rate": 0.000886312033001226, "loss": 2.7479, "step": 20473 }, { "epoch": 0.55, "learning_rate": 0.0008862255585565376, "loss": 2.9495, "step": 20474 }, { "epoch": 0.55, "learning_rate": 0.0008861390849737838, "loss": 2.6557, "step": 20475 }, { "epoch": 0.55, "learning_rate": 0.0008860526122536202, "loss": 2.5052, "step": 20476 }, { "epoch": 0.55, "learning_rate": 0.0008859661403967014, "loss": 2.6841, "step": 20477 }, { "epoch": 0.55, "learning_rate": 0.0008858796694036827, "loss": 2.9402, "step": 20478 }, { "epoch": 0.55, "learning_rate": 0.0008857931992752195, "loss": 2.6856, "step": 20479 }, { "epoch": 0.55, "learning_rate": 0.0008857067300119663, "loss": 2.4665, "step": 20480 }, { "epoch": 0.55, "learning_rate": 0.0008856202616145786, "loss": 2.3368, "step": 20481 }, { "epoch": 0.55, "learning_rate": 0.0008855337940837116, "loss": 2.4284, "step": 20482 }, { "epoch": 0.55, "learning_rate": 0.0008854473274200196, "loss": 2.2885, "step": 20483 }, { "epoch": 0.55, "learning_rate": 0.0008853608616241588, "loss": 2.5789, "step": 20484 }, { "epoch": 0.55, "learning_rate": 0.0008852743966967832, "loss": 2.8577, "step": 20485 }, { "epoch": 0.55, "learning_rate": 0.0008851879326385483, "loss": 2.3403, "step": 20486 }, { "epoch": 0.55, "learning_rate": 0.0008851014694501091, "loss": 2.4094, "step": 20487 }, { "epoch": 0.55, "learning_rate": 0.0008850150071321206, "loss": 2.6579, "step": 20488 }, { "epoch": 0.55, "learning_rate": 0.0008849285456852379, "loss": 2.6533, "step": 20489 }, { "epoch": 0.55, "learning_rate": 0.0008848420851101159, "loss": 2.7217, "step": 20490 }, { "epoch": 0.55, "learning_rate": 0.0008847556254074098, "loss": 2.5437, "step": 20491 }, { "epoch": 0.55, "learning_rate": 0.0008846691665777744, "loss": 2.5206, "step": 20492 }, { "epoch": 0.55, "learning_rate": 0.0008845827086218647, "loss": 2.7682, "step": 20493 }, { "epoch": 0.55, "learning_rate": 0.0008844962515403359, "loss": 2.6101, "step": 20494 }, { "epoch": 0.55, "learning_rate": 0.000884409795333843, "loss": 2.3719, "step": 20495 }, { "epoch": 0.55, "learning_rate": 0.0008843233400030404, "loss": 2.4598, "step": 20496 }, { "epoch": 0.55, "learning_rate": 0.0008842368855485836, "loss": 2.8927, "step": 20497 }, { "epoch": 0.55, "learning_rate": 0.000884150431971128, "loss": 2.3878, "step": 20498 }, { "epoch": 0.55, "learning_rate": 0.0008840639792713275, "loss": 2.4745, "step": 20499 }, { "epoch": 0.55, "learning_rate": 0.0008839775274498377, "loss": 2.8538, "step": 20500 }, { "epoch": 0.55, "learning_rate": 0.0008838910765073132, "loss": 2.0842, "step": 20501 }, { "epoch": 0.55, "learning_rate": 0.0008838046264444093, "loss": 2.6071, "step": 20502 }, { "epoch": 0.55, "learning_rate": 0.0008837181772617809, "loss": 2.2785, "step": 20503 }, { "epoch": 0.55, "learning_rate": 0.0008836317289600826, "loss": 2.5349, "step": 20504 }, { "epoch": 0.55, "learning_rate": 0.0008835452815399695, "loss": 2.8619, "step": 20505 }, { "epoch": 0.55, "learning_rate": 0.0008834588350020968, "loss": 2.8741, "step": 20506 }, { "epoch": 0.55, "learning_rate": 0.0008833723893471188, "loss": 2.3779, "step": 20507 }, { "epoch": 0.55, "learning_rate": 0.0008832859445756909, "loss": 2.1359, "step": 20508 }, { "epoch": 0.55, "learning_rate": 0.0008831995006884679, "loss": 2.1005, "step": 20509 }, { "epoch": 0.55, "learning_rate": 0.0008831130576861044, "loss": 2.8198, "step": 20510 }, { "epoch": 0.55, "learning_rate": 0.0008830266155692559, "loss": 2.5787, "step": 20511 }, { "epoch": 0.55, "learning_rate": 0.0008829401743385766, "loss": 2.5004, "step": 20512 }, { "epoch": 0.55, "learning_rate": 0.0008828537339947211, "loss": 2.6204, "step": 20513 }, { "epoch": 0.55, "learning_rate": 0.0008827672945383455, "loss": 2.771, "step": 20514 }, { "epoch": 0.55, "learning_rate": 0.0008826808559701037, "loss": 2.6182, "step": 20515 }, { "epoch": 0.55, "learning_rate": 0.0008825944182906505, "loss": 2.4502, "step": 20516 }, { "epoch": 0.55, "learning_rate": 0.0008825079815006413, "loss": 2.6913, "step": 20517 }, { "epoch": 0.55, "learning_rate": 0.0008824215456007304, "loss": 2.3615, "step": 20518 }, { "epoch": 0.55, "learning_rate": 0.0008823351105915732, "loss": 2.5066, "step": 20519 }, { "epoch": 0.55, "learning_rate": 0.0008822486764738238, "loss": 2.8826, "step": 20520 }, { "epoch": 0.55, "learning_rate": 0.0008821622432481375, "loss": 2.6786, "step": 20521 }, { "epoch": 0.55, "learning_rate": 0.000882075810915169, "loss": 2.661, "step": 20522 }, { "epoch": 0.55, "learning_rate": 0.0008819893794755729, "loss": 2.68, "step": 20523 }, { "epoch": 0.55, "learning_rate": 0.0008819029489300043, "loss": 2.1437, "step": 20524 }, { "epoch": 0.55, "learning_rate": 0.0008818165192791182, "loss": 3.0774, "step": 20525 }, { "epoch": 0.55, "learning_rate": 0.0008817300905235683, "loss": 2.4612, "step": 20526 }, { "epoch": 0.55, "learning_rate": 0.0008816436626640109, "loss": 2.4408, "step": 20527 }, { "epoch": 0.55, "learning_rate": 0.0008815572357010994, "loss": 2.6475, "step": 20528 }, { "epoch": 0.55, "learning_rate": 0.000881470809635489, "loss": 2.7351, "step": 20529 }, { "epoch": 0.55, "learning_rate": 0.0008813843844678351, "loss": 2.0824, "step": 20530 }, { "epoch": 0.55, "learning_rate": 0.0008812979601987915, "loss": 2.4352, "step": 20531 }, { "epoch": 0.55, "learning_rate": 0.0008812115368290132, "loss": 2.7995, "step": 20532 }, { "epoch": 0.55, "learning_rate": 0.0008811251143591555, "loss": 2.4434, "step": 20533 }, { "epoch": 0.55, "learning_rate": 0.0008810386927898723, "loss": 2.3678, "step": 20534 }, { "epoch": 0.55, "learning_rate": 0.0008809522721218191, "loss": 2.4603, "step": 20535 }, { "epoch": 0.55, "learning_rate": 0.0008808658523556497, "loss": 2.4284, "step": 20536 }, { "epoch": 0.55, "learning_rate": 0.0008807794334920195, "loss": 2.3552, "step": 20537 }, { "epoch": 0.55, "learning_rate": 0.0008806930155315834, "loss": 2.5656, "step": 20538 }, { "epoch": 0.55, "learning_rate": 0.0008806065984749951, "loss": 2.4449, "step": 20539 }, { "epoch": 0.55, "learning_rate": 0.00088052018232291, "loss": 2.5065, "step": 20540 }, { "epoch": 0.55, "learning_rate": 0.0008804337670759832, "loss": 3.1521, "step": 20541 }, { "epoch": 0.55, "learning_rate": 0.0008803473527348681, "loss": 2.5958, "step": 20542 }, { "epoch": 0.55, "learning_rate": 0.00088026093930022, "loss": 2.5388, "step": 20543 }, { "epoch": 0.55, "learning_rate": 0.0008801745267726943, "loss": 2.4684, "step": 20544 }, { "epoch": 0.55, "learning_rate": 0.0008800881151529445, "loss": 2.7166, "step": 20545 }, { "epoch": 0.55, "learning_rate": 0.0008800017044416258, "loss": 2.2886, "step": 20546 }, { "epoch": 0.55, "learning_rate": 0.0008799152946393926, "loss": 2.4136, "step": 20547 }, { "epoch": 0.55, "learning_rate": 0.0008798288857468998, "loss": 2.8622, "step": 20548 }, { "epoch": 0.55, "learning_rate": 0.000879742477764802, "loss": 2.7484, "step": 20549 }, { "epoch": 0.55, "learning_rate": 0.0008796560706937534, "loss": 2.6463, "step": 20550 }, { "epoch": 0.55, "learning_rate": 0.000879569664534409, "loss": 2.6042, "step": 20551 }, { "epoch": 0.55, "learning_rate": 0.0008794832592874235, "loss": 2.8513, "step": 20552 }, { "epoch": 0.55, "learning_rate": 0.000879396854953451, "loss": 2.7011, "step": 20553 }, { "epoch": 0.55, "learning_rate": 0.0008793104515331468, "loss": 2.7613, "step": 20554 }, { "epoch": 0.55, "learning_rate": 0.0008792240490271646, "loss": 2.4113, "step": 20555 }, { "epoch": 0.55, "learning_rate": 0.0008791376474361592, "loss": 2.4216, "step": 20556 }, { "epoch": 0.55, "learning_rate": 0.0008790512467607861, "loss": 2.3469, "step": 20557 }, { "epoch": 0.55, "learning_rate": 0.0008789648470016987, "loss": 2.534, "step": 20558 }, { "epoch": 0.55, "learning_rate": 0.0008788784481595518, "loss": 2.7504, "step": 20559 }, { "epoch": 0.55, "learning_rate": 0.0008787920502350005, "loss": 2.0931, "step": 20560 }, { "epoch": 0.55, "learning_rate": 0.0008787056532286988, "loss": 2.5036, "step": 20561 }, { "epoch": 0.55, "learning_rate": 0.0008786192571413014, "loss": 2.2684, "step": 20562 }, { "epoch": 0.55, "learning_rate": 0.0008785328619734627, "loss": 2.4522, "step": 20563 }, { "epoch": 0.55, "learning_rate": 0.0008784464677258374, "loss": 2.7593, "step": 20564 }, { "epoch": 0.55, "learning_rate": 0.00087836007439908, "loss": 2.8663, "step": 20565 }, { "epoch": 0.55, "learning_rate": 0.0008782736819938448, "loss": 2.623, "step": 20566 }, { "epoch": 0.55, "learning_rate": 0.0008781872905107864, "loss": 2.4134, "step": 20567 }, { "epoch": 0.55, "learning_rate": 0.0008781008999505598, "loss": 2.554, "step": 20568 }, { "epoch": 0.55, "learning_rate": 0.0008780145103138182, "loss": 2.1788, "step": 20569 }, { "epoch": 0.55, "learning_rate": 0.0008779281216012176, "loss": 2.7007, "step": 20570 }, { "epoch": 0.55, "learning_rate": 0.0008778417338134113, "loss": 2.6843, "step": 20571 }, { "epoch": 0.55, "learning_rate": 0.0008777553469510542, "loss": 2.7384, "step": 20572 }, { "epoch": 0.55, "learning_rate": 0.0008776689610148009, "loss": 2.6469, "step": 20573 }, { "epoch": 0.55, "learning_rate": 0.0008775825760053054, "loss": 2.4594, "step": 20574 }, { "epoch": 0.55, "learning_rate": 0.0008774961919232225, "loss": 2.5672, "step": 20575 }, { "epoch": 0.55, "learning_rate": 0.0008774098087692069, "loss": 2.5023, "step": 20576 }, { "epoch": 0.55, "learning_rate": 0.0008773234265439123, "loss": 2.7237, "step": 20577 }, { "epoch": 0.55, "learning_rate": 0.0008772370452479934, "loss": 2.4604, "step": 20578 }, { "epoch": 0.55, "learning_rate": 0.000877150664882105, "loss": 2.5617, "step": 20579 }, { "epoch": 0.55, "learning_rate": 0.0008770642854469011, "loss": 2.6162, "step": 20580 }, { "epoch": 0.55, "learning_rate": 0.0008769779069430365, "loss": 2.5418, "step": 20581 }, { "epoch": 0.55, "learning_rate": 0.0008768915293711647, "loss": 2.7683, "step": 20582 }, { "epoch": 0.55, "learning_rate": 0.0008768051527319408, "loss": 2.3878, "step": 20583 }, { "epoch": 0.55, "learning_rate": 0.0008767187770260196, "loss": 2.6582, "step": 20584 }, { "epoch": 0.55, "learning_rate": 0.0008766324022540542, "loss": 2.3817, "step": 20585 }, { "epoch": 0.55, "learning_rate": 0.0008765460284166997, "loss": 2.5938, "step": 20586 }, { "epoch": 0.55, "learning_rate": 0.0008764596555146111, "loss": 2.9657, "step": 20587 }, { "epoch": 0.55, "learning_rate": 0.0008763732835484415, "loss": 2.1098, "step": 20588 }, { "epoch": 0.55, "learning_rate": 0.0008762869125188461, "loss": 2.6029, "step": 20589 }, { "epoch": 0.55, "learning_rate": 0.0008762005424264787, "loss": 2.7628, "step": 20590 }, { "epoch": 0.55, "learning_rate": 0.0008761141732719938, "loss": 2.3158, "step": 20591 }, { "epoch": 0.55, "learning_rate": 0.000876027805056046, "loss": 2.5342, "step": 20592 }, { "epoch": 0.55, "learning_rate": 0.0008759414377792891, "loss": 2.104, "step": 20593 }, { "epoch": 0.55, "learning_rate": 0.0008758550714423779, "loss": 2.6926, "step": 20594 }, { "epoch": 0.55, "learning_rate": 0.0008757687060459665, "loss": 2.6794, "step": 20595 }, { "epoch": 0.55, "learning_rate": 0.0008756823415907091, "loss": 2.4448, "step": 20596 }, { "epoch": 0.55, "learning_rate": 0.0008755959780772604, "loss": 2.4661, "step": 20597 }, { "epoch": 0.55, "learning_rate": 0.0008755096155062736, "loss": 2.8782, "step": 20598 }, { "epoch": 0.55, "learning_rate": 0.000875423253878404, "loss": 2.2861, "step": 20599 }, { "epoch": 0.55, "learning_rate": 0.0008753368931943061, "loss": 2.7616, "step": 20600 }, { "epoch": 0.55, "learning_rate": 0.0008752505334546331, "loss": 2.2891, "step": 20601 }, { "epoch": 0.55, "learning_rate": 0.0008751641746600395, "loss": 2.3383, "step": 20602 }, { "epoch": 0.55, "learning_rate": 0.0008750778168111805, "loss": 2.3509, "step": 20603 }, { "epoch": 0.55, "learning_rate": 0.0008749914599087091, "loss": 2.6833, "step": 20604 }, { "epoch": 0.55, "learning_rate": 0.0008749051039532803, "loss": 2.56, "step": 20605 }, { "epoch": 0.55, "learning_rate": 0.0008748187489455479, "loss": 2.8252, "step": 20606 }, { "epoch": 0.55, "learning_rate": 0.0008747323948861662, "loss": 2.7279, "step": 20607 }, { "epoch": 0.55, "learning_rate": 0.0008746460417757897, "loss": 2.709, "step": 20608 }, { "epoch": 0.55, "learning_rate": 0.0008745596896150723, "loss": 2.3216, "step": 20609 }, { "epoch": 0.55, "learning_rate": 0.0008744733384046682, "loss": 2.4418, "step": 20610 }, { "epoch": 0.55, "learning_rate": 0.0008743869881452318, "loss": 2.6965, "step": 20611 }, { "epoch": 0.55, "learning_rate": 0.0008743006388374168, "loss": 2.8212, "step": 20612 }, { "epoch": 0.55, "learning_rate": 0.0008742142904818784, "loss": 2.4575, "step": 20613 }, { "epoch": 0.55, "learning_rate": 0.0008741279430792695, "loss": 2.1001, "step": 20614 }, { "epoch": 0.55, "learning_rate": 0.0008740415966302444, "loss": 2.4027, "step": 20615 }, { "epoch": 0.55, "learning_rate": 0.0008739552511354585, "loss": 2.8494, "step": 20616 }, { "epoch": 0.55, "learning_rate": 0.0008738689065955647, "loss": 2.1995, "step": 20617 }, { "epoch": 0.55, "learning_rate": 0.0008737825630112173, "loss": 2.5601, "step": 20618 }, { "epoch": 0.55, "learning_rate": 0.0008736962203830709, "loss": 2.1462, "step": 20619 }, { "epoch": 0.55, "learning_rate": 0.0008736098787117794, "loss": 2.4463, "step": 20620 }, { "epoch": 0.55, "learning_rate": 0.0008735235379979966, "loss": 2.8568, "step": 20621 }, { "epoch": 0.55, "learning_rate": 0.0008734371982423771, "loss": 2.4167, "step": 20622 }, { "epoch": 0.55, "learning_rate": 0.0008733508594455746, "loss": 2.6022, "step": 20623 }, { "epoch": 0.55, "learning_rate": 0.0008732645216082436, "loss": 2.6013, "step": 20624 }, { "epoch": 0.55, "learning_rate": 0.0008731781847310376, "loss": 2.3017, "step": 20625 }, { "epoch": 0.55, "learning_rate": 0.000873091848814611, "loss": 3.0187, "step": 20626 }, { "epoch": 0.55, "learning_rate": 0.0008730055138596184, "loss": 2.3959, "step": 20627 }, { "epoch": 0.55, "learning_rate": 0.0008729191798667127, "loss": 2.2057, "step": 20628 }, { "epoch": 0.55, "learning_rate": 0.0008728328468365486, "loss": 2.5704, "step": 20629 }, { "epoch": 0.55, "learning_rate": 0.0008727465147697807, "loss": 3.0269, "step": 20630 }, { "epoch": 0.55, "learning_rate": 0.0008726601836670621, "loss": 2.7245, "step": 20631 }, { "epoch": 0.55, "learning_rate": 0.0008725738535290472, "loss": 2.6343, "step": 20632 }, { "epoch": 0.55, "learning_rate": 0.0008724875243563899, "loss": 2.5186, "step": 20633 }, { "epoch": 0.55, "learning_rate": 0.0008724011961497442, "loss": 2.2634, "step": 20634 }, { "epoch": 0.55, "learning_rate": 0.0008723148689097647, "loss": 2.151, "step": 20635 }, { "epoch": 0.55, "learning_rate": 0.0008722285426371044, "loss": 2.4634, "step": 20636 }, { "epoch": 0.55, "learning_rate": 0.0008721422173324179, "loss": 2.7808, "step": 20637 }, { "epoch": 0.55, "learning_rate": 0.0008720558929963594, "loss": 2.5455, "step": 20638 }, { "epoch": 0.55, "learning_rate": 0.0008719695696295824, "loss": 2.3492, "step": 20639 }, { "epoch": 0.55, "learning_rate": 0.0008718832472327414, "loss": 2.156, "step": 20640 }, { "epoch": 0.55, "learning_rate": 0.0008717969258064894, "loss": 2.5334, "step": 20641 }, { "epoch": 0.55, "learning_rate": 0.0008717106053514811, "loss": 2.349, "step": 20642 }, { "epoch": 0.55, "learning_rate": 0.000871624285868371, "loss": 2.6358, "step": 20643 }, { "epoch": 0.55, "learning_rate": 0.0008715379673578116, "loss": 2.3459, "step": 20644 }, { "epoch": 0.55, "learning_rate": 0.0008714516498204576, "loss": 2.1, "step": 20645 }, { "epoch": 0.55, "learning_rate": 0.0008713653332569635, "loss": 2.3487, "step": 20646 }, { "epoch": 0.55, "learning_rate": 0.0008712790176679822, "loss": 2.6369, "step": 20647 }, { "epoch": 0.55, "learning_rate": 0.0008711927030541683, "loss": 2.3962, "step": 20648 }, { "epoch": 0.55, "learning_rate": 0.0008711063894161752, "loss": 2.3177, "step": 20649 }, { "epoch": 0.55, "learning_rate": 0.000871020076754657, "loss": 2.4326, "step": 20650 }, { "epoch": 0.55, "learning_rate": 0.000870933765070268, "loss": 2.8499, "step": 20651 }, { "epoch": 0.55, "learning_rate": 0.0008708474543636613, "loss": 2.7534, "step": 20652 }, { "epoch": 0.56, "learning_rate": 0.0008707611446354914, "loss": 2.3962, "step": 20653 }, { "epoch": 0.56, "learning_rate": 0.0008706748358864121, "loss": 2.6258, "step": 20654 }, { "epoch": 0.56, "learning_rate": 0.0008705885281170769, "loss": 2.587, "step": 20655 }, { "epoch": 0.56, "learning_rate": 0.0008705022213281398, "loss": 2.4994, "step": 20656 }, { "epoch": 0.56, "learning_rate": 0.0008704159155202552, "loss": 2.302, "step": 20657 }, { "epoch": 0.56, "learning_rate": 0.0008703296106940759, "loss": 2.7625, "step": 20658 }, { "epoch": 0.56, "learning_rate": 0.0008702433068502568, "loss": 2.3832, "step": 20659 }, { "epoch": 0.56, "learning_rate": 0.0008701570039894509, "loss": 2.3183, "step": 20660 }, { "epoch": 0.56, "learning_rate": 0.0008700707021123122, "loss": 2.4524, "step": 20661 }, { "epoch": 0.56, "learning_rate": 0.000869984401219495, "loss": 2.7626, "step": 20662 }, { "epoch": 0.56, "learning_rate": 0.0008698981013116523, "loss": 2.6049, "step": 20663 }, { "epoch": 0.56, "learning_rate": 0.0008698118023894386, "loss": 2.5774, "step": 20664 }, { "epoch": 0.56, "learning_rate": 0.0008697255044535074, "loss": 2.5763, "step": 20665 }, { "epoch": 0.56, "learning_rate": 0.0008696392075045123, "loss": 3.0662, "step": 20666 }, { "epoch": 0.56, "learning_rate": 0.0008695529115431076, "loss": 2.853, "step": 20667 }, { "epoch": 0.56, "learning_rate": 0.0008694666165699464, "loss": 2.0861, "step": 20668 }, { "epoch": 0.56, "learning_rate": 0.0008693803225856828, "loss": 2.5044, "step": 20669 }, { "epoch": 0.56, "learning_rate": 0.0008692940295909709, "loss": 2.299, "step": 20670 }, { "epoch": 0.56, "learning_rate": 0.0008692077375864636, "loss": 2.7249, "step": 20671 }, { "epoch": 0.56, "learning_rate": 0.0008691214465728151, "loss": 2.3255, "step": 20672 }, { "epoch": 0.56, "learning_rate": 0.0008690351565506796, "loss": 2.4975, "step": 20673 }, { "epoch": 0.56, "learning_rate": 0.00086894886752071, "loss": 3.0193, "step": 20674 }, { "epoch": 0.56, "learning_rate": 0.0008688625794835605, "loss": 2.2453, "step": 20675 }, { "epoch": 0.56, "learning_rate": 0.0008687762924398845, "loss": 2.2143, "step": 20676 }, { "epoch": 0.56, "learning_rate": 0.0008686900063903358, "loss": 2.5644, "step": 20677 }, { "epoch": 0.56, "learning_rate": 0.0008686037213355683, "loss": 2.5292, "step": 20678 }, { "epoch": 0.56, "learning_rate": 0.0008685174372762354, "loss": 2.7262, "step": 20679 }, { "epoch": 0.56, "learning_rate": 0.0008684311542129908, "loss": 2.1169, "step": 20680 }, { "epoch": 0.56, "learning_rate": 0.0008683448721464884, "loss": 3.1134, "step": 20681 }, { "epoch": 0.56, "learning_rate": 0.0008682585910773817, "loss": 2.3885, "step": 20682 }, { "epoch": 0.56, "learning_rate": 0.0008681723110063247, "loss": 2.7288, "step": 20683 }, { "epoch": 0.56, "learning_rate": 0.00086808603193397, "loss": 2.324, "step": 20684 }, { "epoch": 0.56, "learning_rate": 0.0008679997538609723, "loss": 2.5113, "step": 20685 }, { "epoch": 0.56, "learning_rate": 0.0008679134767879852, "loss": 2.3537, "step": 20686 }, { "epoch": 0.56, "learning_rate": 0.0008678272007156616, "loss": 2.1899, "step": 20687 }, { "epoch": 0.56, "learning_rate": 0.0008677409256446551, "loss": 2.3245, "step": 20688 }, { "epoch": 0.56, "learning_rate": 0.0008676546515756205, "loss": 2.2642, "step": 20689 }, { "epoch": 0.56, "learning_rate": 0.0008675683785092102, "loss": 2.7067, "step": 20690 }, { "epoch": 0.56, "learning_rate": 0.0008674821064460781, "loss": 2.6312, "step": 20691 }, { "epoch": 0.56, "learning_rate": 0.0008673958353868781, "loss": 2.5119, "step": 20692 }, { "epoch": 0.56, "learning_rate": 0.0008673095653322633, "loss": 2.6542, "step": 20693 }, { "epoch": 0.56, "learning_rate": 0.0008672232962828878, "loss": 2.3751, "step": 20694 }, { "epoch": 0.56, "learning_rate": 0.0008671370282394048, "loss": 2.3522, "step": 20695 }, { "epoch": 0.56, "learning_rate": 0.0008670507612024677, "loss": 2.332, "step": 20696 }, { "epoch": 0.56, "learning_rate": 0.0008669644951727304, "loss": 2.5072, "step": 20697 }, { "epoch": 0.56, "learning_rate": 0.0008668782301508464, "loss": 2.4767, "step": 20698 }, { "epoch": 0.56, "learning_rate": 0.000866791966137469, "loss": 2.2228, "step": 20699 }, { "epoch": 0.56, "learning_rate": 0.0008667057031332521, "loss": 2.8123, "step": 20700 }, { "epoch": 0.56, "learning_rate": 0.0008666194411388484, "loss": 2.211, "step": 20701 }, { "epoch": 0.56, "learning_rate": 0.0008665331801549126, "loss": 2.1738, "step": 20702 }, { "epoch": 0.56, "learning_rate": 0.0008664469201820973, "loss": 2.4183, "step": 20703 }, { "epoch": 0.56, "learning_rate": 0.0008663606612210561, "loss": 2.4397, "step": 20704 }, { "epoch": 0.56, "learning_rate": 0.000866274403272443, "loss": 2.833, "step": 20705 }, { "epoch": 0.56, "learning_rate": 0.0008661881463369107, "loss": 2.2753, "step": 20706 }, { "epoch": 0.56, "learning_rate": 0.0008661018904151133, "loss": 3.1006, "step": 20707 }, { "epoch": 0.56, "learning_rate": 0.000866015635507704, "loss": 2.7038, "step": 20708 }, { "epoch": 0.56, "learning_rate": 0.0008659293816153362, "loss": 2.7918, "step": 20709 }, { "epoch": 0.56, "learning_rate": 0.0008658431287386636, "loss": 2.7422, "step": 20710 }, { "epoch": 0.56, "learning_rate": 0.0008657568768783394, "loss": 2.6139, "step": 20711 }, { "epoch": 0.56, "learning_rate": 0.000865670626035017, "loss": 2.6423, "step": 20712 }, { "epoch": 0.56, "learning_rate": 0.0008655843762093504, "loss": 2.5158, "step": 20713 }, { "epoch": 0.56, "learning_rate": 0.0008654981274019919, "loss": 2.8322, "step": 20714 }, { "epoch": 0.56, "learning_rate": 0.0008654118796135957, "loss": 2.0999, "step": 20715 }, { "epoch": 0.56, "learning_rate": 0.0008653256328448155, "loss": 2.4925, "step": 20716 }, { "epoch": 0.56, "learning_rate": 0.0008652393870963038, "loss": 2.5089, "step": 20717 }, { "epoch": 0.56, "learning_rate": 0.0008651531423687146, "loss": 2.4448, "step": 20718 }, { "epoch": 0.56, "learning_rate": 0.0008650668986627008, "loss": 2.7121, "step": 20719 }, { "epoch": 0.56, "learning_rate": 0.0008649806559789162, "loss": 2.9362, "step": 20720 }, { "epoch": 0.56, "learning_rate": 0.0008648944143180141, "loss": 2.9237, "step": 20721 }, { "epoch": 0.56, "learning_rate": 0.0008648081736806476, "loss": 2.9726, "step": 20722 }, { "epoch": 0.56, "learning_rate": 0.0008647219340674701, "loss": 2.5644, "step": 20723 }, { "epoch": 0.56, "learning_rate": 0.0008646356954791354, "loss": 2.56, "step": 20724 }, { "epoch": 0.56, "learning_rate": 0.0008645494579162963, "loss": 2.7997, "step": 20725 }, { "epoch": 0.56, "learning_rate": 0.0008644632213796067, "loss": 2.8534, "step": 20726 }, { "epoch": 0.56, "learning_rate": 0.0008643769858697187, "loss": 3.0661, "step": 20727 }, { "epoch": 0.56, "learning_rate": 0.0008642907513872868, "loss": 2.4379, "step": 20728 }, { "epoch": 0.56, "learning_rate": 0.0008642045179329641, "loss": 2.1979, "step": 20729 }, { "epoch": 0.56, "learning_rate": 0.0008641182855074035, "loss": 2.7467, "step": 20730 }, { "epoch": 0.56, "learning_rate": 0.0008640320541112582, "loss": 2.1603, "step": 20731 }, { "epoch": 0.56, "learning_rate": 0.0008639458237451823, "loss": 2.1115, "step": 20732 }, { "epoch": 0.56, "learning_rate": 0.0008638595944098282, "loss": 2.7222, "step": 20733 }, { "epoch": 0.56, "learning_rate": 0.0008637733661058495, "loss": 2.2507, "step": 20734 }, { "epoch": 0.56, "learning_rate": 0.0008636871388338995, "loss": 2.4147, "step": 20735 }, { "epoch": 0.56, "learning_rate": 0.0008636009125946311, "loss": 2.4051, "step": 20736 }, { "epoch": 0.56, "learning_rate": 0.0008635146873886982, "loss": 2.6445, "step": 20737 }, { "epoch": 0.56, "learning_rate": 0.0008634284632167534, "loss": 2.9644, "step": 20738 }, { "epoch": 0.56, "learning_rate": 0.00086334224007945, "loss": 2.7673, "step": 20739 }, { "epoch": 0.56, "learning_rate": 0.0008632560179774418, "loss": 2.5722, "step": 20740 }, { "epoch": 0.56, "learning_rate": 0.0008631697969113812, "loss": 1.9571, "step": 20741 }, { "epoch": 0.56, "learning_rate": 0.0008630835768819217, "loss": 2.8285, "step": 20742 }, { "epoch": 0.56, "learning_rate": 0.000862997357889717, "loss": 2.5901, "step": 20743 }, { "epoch": 0.56, "learning_rate": 0.0008629111399354192, "loss": 2.9334, "step": 20744 }, { "epoch": 0.56, "learning_rate": 0.0008628249230196828, "loss": 2.2605, "step": 20745 }, { "epoch": 0.56, "learning_rate": 0.0008627387071431598, "loss": 2.7703, "step": 20746 }, { "epoch": 0.56, "learning_rate": 0.0008626524923065038, "loss": 2.6393, "step": 20747 }, { "epoch": 0.56, "learning_rate": 0.0008625662785103681, "loss": 2.3434, "step": 20748 }, { "epoch": 0.56, "learning_rate": 0.0008624800657554057, "loss": 2.4295, "step": 20749 }, { "epoch": 0.56, "learning_rate": 0.0008623938540422696, "loss": 2.4263, "step": 20750 }, { "epoch": 0.56, "learning_rate": 0.0008623076433716132, "loss": 2.2371, "step": 20751 }, { "epoch": 0.56, "learning_rate": 0.0008622214337440893, "loss": 2.3878, "step": 20752 }, { "epoch": 0.56, "learning_rate": 0.0008621352251603515, "loss": 2.0806, "step": 20753 }, { "epoch": 0.56, "learning_rate": 0.0008620490176210522, "loss": 2.5831, "step": 20754 }, { "epoch": 0.56, "learning_rate": 0.0008619628111268451, "loss": 2.4383, "step": 20755 }, { "epoch": 0.56, "learning_rate": 0.0008618766056783832, "loss": 2.6982, "step": 20756 }, { "epoch": 0.56, "learning_rate": 0.0008617904012763191, "loss": 2.6239, "step": 20757 }, { "epoch": 0.56, "learning_rate": 0.0008617041979213064, "loss": 2.6293, "step": 20758 }, { "epoch": 0.56, "learning_rate": 0.0008616179956139982, "loss": 2.5562, "step": 20759 }, { "epoch": 0.56, "learning_rate": 0.0008615317943550469, "loss": 2.4483, "step": 20760 }, { "epoch": 0.56, "learning_rate": 0.0008614455941451064, "loss": 2.1777, "step": 20761 }, { "epoch": 0.56, "learning_rate": 0.000861359394984829, "loss": 2.3159, "step": 20762 }, { "epoch": 0.56, "learning_rate": 0.000861273196874868, "loss": 2.4283, "step": 20763 }, { "epoch": 0.56, "learning_rate": 0.0008611869998158768, "loss": 2.1361, "step": 20764 }, { "epoch": 0.56, "learning_rate": 0.0008611008038085078, "loss": 2.6743, "step": 20765 }, { "epoch": 0.56, "learning_rate": 0.0008610146088534141, "loss": 2.2839, "step": 20766 }, { "epoch": 0.56, "learning_rate": 0.0008609284149512493, "loss": 2.4337, "step": 20767 }, { "epoch": 0.56, "learning_rate": 0.0008608422221026656, "loss": 2.3807, "step": 20768 }, { "epoch": 0.56, "learning_rate": 0.0008607560303083164, "loss": 2.5092, "step": 20769 }, { "epoch": 0.56, "learning_rate": 0.0008606698395688548, "loss": 2.6091, "step": 20770 }, { "epoch": 0.56, "learning_rate": 0.0008605836498849336, "loss": 2.562, "step": 20771 }, { "epoch": 0.56, "learning_rate": 0.0008604974612572058, "loss": 2.7051, "step": 20772 }, { "epoch": 0.56, "learning_rate": 0.0008604112736863239, "loss": 2.1721, "step": 20773 }, { "epoch": 0.56, "learning_rate": 0.0008603250871729413, "loss": 2.5097, "step": 20774 }, { "epoch": 0.56, "learning_rate": 0.0008602389017177115, "loss": 2.8139, "step": 20775 }, { "epoch": 0.56, "learning_rate": 0.0008601527173212862, "loss": 2.4341, "step": 20776 }, { "epoch": 0.56, "learning_rate": 0.0008600665339843188, "loss": 2.4058, "step": 20777 }, { "epoch": 0.56, "learning_rate": 0.000859980351707463, "loss": 2.3478, "step": 20778 }, { "epoch": 0.56, "learning_rate": 0.0008598941704913703, "loss": 2.2373, "step": 20779 }, { "epoch": 0.56, "learning_rate": 0.0008598079903366948, "loss": 2.5075, "step": 20780 }, { "epoch": 0.56, "learning_rate": 0.0008597218112440886, "loss": 3.1008, "step": 20781 }, { "epoch": 0.56, "learning_rate": 0.0008596356332142049, "loss": 2.2774, "step": 20782 }, { "epoch": 0.56, "learning_rate": 0.0008595494562476968, "loss": 2.1871, "step": 20783 }, { "epoch": 0.56, "learning_rate": 0.0008594632803452167, "loss": 2.1205, "step": 20784 }, { "epoch": 0.56, "learning_rate": 0.0008593771055074175, "loss": 2.7296, "step": 20785 }, { "epoch": 0.56, "learning_rate": 0.0008592909317349526, "loss": 2.3985, "step": 20786 }, { "epoch": 0.56, "learning_rate": 0.0008592047590284742, "loss": 2.1908, "step": 20787 }, { "epoch": 0.56, "learning_rate": 0.0008591185873886357, "loss": 2.632, "step": 20788 }, { "epoch": 0.56, "learning_rate": 0.0008590324168160893, "loss": 2.6364, "step": 20789 }, { "epoch": 0.56, "learning_rate": 0.0008589462473114878, "loss": 2.4553, "step": 20790 }, { "epoch": 0.56, "learning_rate": 0.0008588600788754851, "loss": 2.1449, "step": 20791 }, { "epoch": 0.56, "learning_rate": 0.0008587739115087325, "loss": 2.5975, "step": 20792 }, { "epoch": 0.56, "learning_rate": 0.0008586877452118838, "loss": 2.7916, "step": 20793 }, { "epoch": 0.56, "learning_rate": 0.0008586015799855915, "loss": 2.362, "step": 20794 }, { "epoch": 0.56, "learning_rate": 0.0008585154158305082, "loss": 2.6791, "step": 20795 }, { "epoch": 0.56, "learning_rate": 0.000858429252747287, "loss": 2.6333, "step": 20796 }, { "epoch": 0.56, "learning_rate": 0.0008583430907365803, "loss": 2.6127, "step": 20797 }, { "epoch": 0.56, "learning_rate": 0.000858256929799041, "loss": 2.7454, "step": 20798 }, { "epoch": 0.56, "learning_rate": 0.0008581707699353221, "loss": 2.3996, "step": 20799 }, { "epoch": 0.56, "learning_rate": 0.0008580846111460759, "loss": 2.5865, "step": 20800 }, { "epoch": 0.56, "learning_rate": 0.0008579984534319552, "loss": 2.3201, "step": 20801 }, { "epoch": 0.56, "learning_rate": 0.0008579122967936133, "loss": 2.4027, "step": 20802 }, { "epoch": 0.56, "learning_rate": 0.0008578261412317018, "loss": 2.3187, "step": 20803 }, { "epoch": 0.56, "learning_rate": 0.0008577399867468743, "loss": 2.7162, "step": 20804 }, { "epoch": 0.56, "learning_rate": 0.0008576538333397836, "loss": 2.8449, "step": 20805 }, { "epoch": 0.56, "learning_rate": 0.0008575676810110816, "loss": 2.6916, "step": 20806 }, { "epoch": 0.56, "learning_rate": 0.0008574815297614216, "loss": 2.1224, "step": 20807 }, { "epoch": 0.56, "learning_rate": 0.0008573953795914558, "loss": 2.4002, "step": 20808 }, { "epoch": 0.56, "learning_rate": 0.000857309230501837, "loss": 2.4021, "step": 20809 }, { "epoch": 0.56, "learning_rate": 0.0008572230824932185, "loss": 2.6639, "step": 20810 }, { "epoch": 0.56, "learning_rate": 0.000857136935566252, "loss": 2.746, "step": 20811 }, { "epoch": 0.56, "learning_rate": 0.0008570507897215905, "loss": 2.3491, "step": 20812 }, { "epoch": 0.56, "learning_rate": 0.0008569646449598869, "loss": 2.5548, "step": 20813 }, { "epoch": 0.56, "learning_rate": 0.0008568785012817934, "loss": 2.6602, "step": 20814 }, { "epoch": 0.56, "learning_rate": 0.0008567923586879631, "loss": 2.3844, "step": 20815 }, { "epoch": 0.56, "learning_rate": 0.0008567062171790478, "loss": 2.3311, "step": 20816 }, { "epoch": 0.56, "learning_rate": 0.0008566200767557006, "loss": 2.1571, "step": 20817 }, { "epoch": 0.56, "learning_rate": 0.0008565339374185748, "loss": 2.4705, "step": 20818 }, { "epoch": 0.56, "learning_rate": 0.0008564477991683215, "loss": 3.159, "step": 20819 }, { "epoch": 0.56, "learning_rate": 0.0008563616620055939, "loss": 2.5447, "step": 20820 }, { "epoch": 0.56, "learning_rate": 0.0008562755259310454, "loss": 2.6345, "step": 20821 }, { "epoch": 0.56, "learning_rate": 0.0008561893909453274, "loss": 2.5957, "step": 20822 }, { "epoch": 0.56, "learning_rate": 0.0008561032570490929, "loss": 2.5427, "step": 20823 }, { "epoch": 0.56, "learning_rate": 0.0008560171242429944, "loss": 2.1471, "step": 20824 }, { "epoch": 0.56, "learning_rate": 0.0008559309925276843, "loss": 2.3198, "step": 20825 }, { "epoch": 0.56, "learning_rate": 0.0008558448619038155, "loss": 2.4912, "step": 20826 }, { "epoch": 0.56, "learning_rate": 0.0008557587323720399, "loss": 2.717, "step": 20827 }, { "epoch": 0.56, "learning_rate": 0.0008556726039330105, "loss": 2.6455, "step": 20828 }, { "epoch": 0.56, "learning_rate": 0.0008555864765873799, "loss": 2.2831, "step": 20829 }, { "epoch": 0.56, "learning_rate": 0.0008555003503358, "loss": 2.3605, "step": 20830 }, { "epoch": 0.56, "learning_rate": 0.0008554142251789241, "loss": 2.8281, "step": 20831 }, { "epoch": 0.56, "learning_rate": 0.0008553281011174038, "loss": 2.5242, "step": 20832 }, { "epoch": 0.56, "learning_rate": 0.0008552419781518916, "loss": 2.8278, "step": 20833 }, { "epoch": 0.56, "learning_rate": 0.000855155856283041, "loss": 2.4554, "step": 20834 }, { "epoch": 0.56, "learning_rate": 0.0008550697355115033, "loss": 2.6782, "step": 20835 }, { "epoch": 0.56, "learning_rate": 0.0008549836158379313, "loss": 2.5063, "step": 20836 }, { "epoch": 0.56, "learning_rate": 0.0008548974972629779, "loss": 2.7174, "step": 20837 }, { "epoch": 0.56, "learning_rate": 0.0008548113797872948, "loss": 2.8167, "step": 20838 }, { "epoch": 0.56, "learning_rate": 0.0008547252634115347, "loss": 2.9226, "step": 20839 }, { "epoch": 0.56, "learning_rate": 0.0008546391481363503, "loss": 1.8778, "step": 20840 }, { "epoch": 0.56, "learning_rate": 0.0008545530339623936, "loss": 2.8028, "step": 20841 }, { "epoch": 0.56, "learning_rate": 0.0008544669208903171, "loss": 2.1919, "step": 20842 }, { "epoch": 0.56, "learning_rate": 0.0008543808089207732, "loss": 2.5295, "step": 20843 }, { "epoch": 0.56, "learning_rate": 0.0008542946980544142, "loss": 2.5109, "step": 20844 }, { "epoch": 0.56, "learning_rate": 0.0008542085882918928, "loss": 2.6671, "step": 20845 }, { "epoch": 0.56, "learning_rate": 0.0008541224796338605, "loss": 2.5726, "step": 20846 }, { "epoch": 0.56, "learning_rate": 0.0008540363720809705, "loss": 2.5715, "step": 20847 }, { "epoch": 0.56, "learning_rate": 0.0008539502656338753, "loss": 2.4125, "step": 20848 }, { "epoch": 0.56, "learning_rate": 0.0008538641602932263, "loss": 2.5779, "step": 20849 }, { "epoch": 0.56, "learning_rate": 0.0008537780560596763, "loss": 3.0656, "step": 20850 }, { "epoch": 0.56, "learning_rate": 0.0008536919529338777, "loss": 2.4053, "step": 20851 }, { "epoch": 0.56, "learning_rate": 0.0008536058509164826, "loss": 2.4698, "step": 20852 }, { "epoch": 0.56, "learning_rate": 0.0008535197500081435, "loss": 2.4201, "step": 20853 }, { "epoch": 0.56, "learning_rate": 0.0008534336502095125, "loss": 2.5539, "step": 20854 }, { "epoch": 0.56, "learning_rate": 0.000853347551521242, "loss": 2.1477, "step": 20855 }, { "epoch": 0.56, "learning_rate": 0.0008532614539439843, "loss": 2.5194, "step": 20856 }, { "epoch": 0.56, "learning_rate": 0.0008531753574783916, "loss": 2.8551, "step": 20857 }, { "epoch": 0.56, "learning_rate": 0.0008530892621251164, "loss": 2.5885, "step": 20858 }, { "epoch": 0.56, "learning_rate": 0.0008530031678848101, "loss": 2.6358, "step": 20859 }, { "epoch": 0.56, "learning_rate": 0.0008529170747581256, "loss": 2.7464, "step": 20860 }, { "epoch": 0.56, "learning_rate": 0.0008528309827457156, "loss": 2.4447, "step": 20861 }, { "epoch": 0.56, "learning_rate": 0.0008527448918482313, "loss": 2.1122, "step": 20862 }, { "epoch": 0.56, "learning_rate": 0.0008526588020663252, "loss": 2.825, "step": 20863 }, { "epoch": 0.56, "learning_rate": 0.0008525727134006502, "loss": 2.3745, "step": 20864 }, { "epoch": 0.56, "learning_rate": 0.0008524866258518578, "loss": 2.5525, "step": 20865 }, { "epoch": 0.56, "learning_rate": 0.0008524005394206002, "loss": 2.2759, "step": 20866 }, { "epoch": 0.56, "learning_rate": 0.0008523144541075299, "loss": 2.4707, "step": 20867 }, { "epoch": 0.56, "learning_rate": 0.0008522283699132986, "loss": 2.5409, "step": 20868 }, { "epoch": 0.56, "learning_rate": 0.000852142286838559, "loss": 2.2009, "step": 20869 }, { "epoch": 0.56, "learning_rate": 0.0008520562048839629, "loss": 3.1089, "step": 20870 }, { "epoch": 0.56, "learning_rate": 0.0008519701240501625, "loss": 3.0754, "step": 20871 }, { "epoch": 0.56, "learning_rate": 0.0008518840443378102, "loss": 2.8889, "step": 20872 }, { "epoch": 0.56, "learning_rate": 0.0008517979657475576, "loss": 3.0128, "step": 20873 }, { "epoch": 0.56, "learning_rate": 0.0008517118882800576, "loss": 2.7899, "step": 20874 }, { "epoch": 0.56, "learning_rate": 0.0008516258119359614, "loss": 2.4364, "step": 20875 }, { "epoch": 0.56, "learning_rate": 0.0008515397367159212, "loss": 2.5235, "step": 20876 }, { "epoch": 0.56, "learning_rate": 0.0008514536626205902, "loss": 2.0807, "step": 20877 }, { "epoch": 0.56, "learning_rate": 0.0008513675896506192, "loss": 2.6013, "step": 20878 }, { "epoch": 0.56, "learning_rate": 0.0008512815178066609, "loss": 2.0803, "step": 20879 }, { "epoch": 0.56, "learning_rate": 0.0008511954470893673, "loss": 2.5472, "step": 20880 }, { "epoch": 0.56, "learning_rate": 0.0008511093774993902, "loss": 2.8293, "step": 20881 }, { "epoch": 0.56, "learning_rate": 0.0008510233090373819, "loss": 2.9155, "step": 20882 }, { "epoch": 0.56, "learning_rate": 0.0008509372417039946, "loss": 1.9316, "step": 20883 }, { "epoch": 0.56, "learning_rate": 0.0008508511754998797, "loss": 2.377, "step": 20884 }, { "epoch": 0.56, "learning_rate": 0.00085076511042569, "loss": 2.7045, "step": 20885 }, { "epoch": 0.56, "learning_rate": 0.000850679046482077, "loss": 2.0982, "step": 20886 }, { "epoch": 0.56, "learning_rate": 0.0008505929836696926, "loss": 2.5596, "step": 20887 }, { "epoch": 0.56, "learning_rate": 0.0008505069219891896, "loss": 2.3118, "step": 20888 }, { "epoch": 0.56, "learning_rate": 0.000850420861441219, "loss": 2.3056, "step": 20889 }, { "epoch": 0.56, "learning_rate": 0.0008503348020264332, "loss": 2.6965, "step": 20890 }, { "epoch": 0.56, "learning_rate": 0.0008502487437454846, "loss": 2.6224, "step": 20891 }, { "epoch": 0.56, "learning_rate": 0.0008501626865990244, "loss": 2.5467, "step": 20892 }, { "epoch": 0.56, "learning_rate": 0.0008500766305877052, "loss": 2.6241, "step": 20893 }, { "epoch": 0.56, "learning_rate": 0.0008499905757121782, "loss": 2.7641, "step": 20894 }, { "epoch": 0.56, "learning_rate": 0.0008499045219730959, "loss": 2.5637, "step": 20895 }, { "epoch": 0.56, "learning_rate": 0.0008498184693711102, "loss": 2.9139, "step": 20896 }, { "epoch": 0.56, "learning_rate": 0.0008497324179068729, "loss": 2.5834, "step": 20897 }, { "epoch": 0.56, "learning_rate": 0.0008496463675810358, "loss": 2.3269, "step": 20898 }, { "epoch": 0.56, "learning_rate": 0.0008495603183942512, "loss": 2.3936, "step": 20899 }, { "epoch": 0.56, "learning_rate": 0.0008494742703471707, "loss": 2.4952, "step": 20900 }, { "epoch": 0.56, "learning_rate": 0.0008493882234404464, "loss": 2.5672, "step": 20901 }, { "epoch": 0.56, "learning_rate": 0.0008493021776747294, "loss": 2.1106, "step": 20902 }, { "epoch": 0.56, "learning_rate": 0.0008492161330506724, "loss": 2.6233, "step": 20903 }, { "epoch": 0.56, "learning_rate": 0.0008491300895689275, "loss": 2.5072, "step": 20904 }, { "epoch": 0.56, "learning_rate": 0.0008490440472301455, "loss": 2.6768, "step": 20905 }, { "epoch": 0.56, "learning_rate": 0.0008489580060349786, "loss": 2.3996, "step": 20906 }, { "epoch": 0.56, "learning_rate": 0.0008488719659840797, "loss": 2.3584, "step": 20907 }, { "epoch": 0.56, "learning_rate": 0.0008487859270780992, "loss": 2.6528, "step": 20908 }, { "epoch": 0.56, "learning_rate": 0.0008486998893176898, "loss": 2.7058, "step": 20909 }, { "epoch": 0.56, "learning_rate": 0.0008486138527035025, "loss": 2.7791, "step": 20910 }, { "epoch": 0.56, "learning_rate": 0.0008485278172361898, "loss": 2.6784, "step": 20911 }, { "epoch": 0.56, "learning_rate": 0.0008484417829164035, "loss": 2.5662, "step": 20912 }, { "epoch": 0.56, "learning_rate": 0.0008483557497447949, "loss": 2.5845, "step": 20913 }, { "epoch": 0.56, "learning_rate": 0.000848269717722016, "loss": 2.6817, "step": 20914 }, { "epoch": 0.56, "learning_rate": 0.0008481836868487188, "loss": 2.2321, "step": 20915 }, { "epoch": 0.56, "learning_rate": 0.0008480976571255546, "loss": 2.6616, "step": 20916 }, { "epoch": 0.56, "learning_rate": 0.0008480116285531755, "loss": 2.401, "step": 20917 }, { "epoch": 0.56, "learning_rate": 0.0008479256011322335, "loss": 2.362, "step": 20918 }, { "epoch": 0.56, "learning_rate": 0.0008478395748633794, "loss": 2.552, "step": 20919 }, { "epoch": 0.56, "learning_rate": 0.000847753549747266, "loss": 1.9338, "step": 20920 }, { "epoch": 0.56, "learning_rate": 0.0008476675257845441, "loss": 2.9309, "step": 20921 }, { "epoch": 0.56, "learning_rate": 0.0008475815029758655, "loss": 2.3715, "step": 20922 }, { "epoch": 0.56, "learning_rate": 0.0008474954813218829, "loss": 2.3129, "step": 20923 }, { "epoch": 0.56, "learning_rate": 0.0008474094608232469, "loss": 2.6713, "step": 20924 }, { "epoch": 0.56, "learning_rate": 0.0008473234414806094, "loss": 2.5986, "step": 20925 }, { "epoch": 0.56, "learning_rate": 0.0008472374232946226, "loss": 2.6683, "step": 20926 }, { "epoch": 0.56, "learning_rate": 0.0008471514062659374, "loss": 2.4266, "step": 20927 }, { "epoch": 0.56, "learning_rate": 0.0008470653903952061, "loss": 2.6462, "step": 20928 }, { "epoch": 0.56, "learning_rate": 0.0008469793756830799, "loss": 2.6432, "step": 20929 }, { "epoch": 0.56, "learning_rate": 0.0008468933621302106, "loss": 2.4715, "step": 20930 }, { "epoch": 0.56, "learning_rate": 0.0008468073497372499, "loss": 2.492, "step": 20931 }, { "epoch": 0.56, "learning_rate": 0.0008467213385048492, "loss": 2.6944, "step": 20932 }, { "epoch": 0.56, "learning_rate": 0.0008466353284336604, "loss": 2.8432, "step": 20933 }, { "epoch": 0.56, "learning_rate": 0.000846549319524335, "loss": 2.4617, "step": 20934 }, { "epoch": 0.56, "learning_rate": 0.0008464633117775241, "loss": 2.7356, "step": 20935 }, { "epoch": 0.56, "learning_rate": 0.0008463773051938803, "loss": 2.7139, "step": 20936 }, { "epoch": 0.56, "learning_rate": 0.0008462912997740542, "loss": 2.7344, "step": 20937 }, { "epoch": 0.56, "learning_rate": 0.0008462052955186977, "loss": 2.5701, "step": 20938 }, { "epoch": 0.56, "learning_rate": 0.0008461192924284625, "loss": 2.6562, "step": 20939 }, { "epoch": 0.56, "learning_rate": 0.0008460332905039999, "loss": 2.4635, "step": 20940 }, { "epoch": 0.56, "learning_rate": 0.0008459472897459616, "loss": 2.2382, "step": 20941 }, { "epoch": 0.56, "learning_rate": 0.0008458612901549993, "loss": 2.9201, "step": 20942 }, { "epoch": 0.56, "learning_rate": 0.0008457752917317641, "loss": 2.4842, "step": 20943 }, { "epoch": 0.56, "learning_rate": 0.0008456892944769078, "loss": 2.4487, "step": 20944 }, { "epoch": 0.56, "learning_rate": 0.0008456032983910817, "loss": 3.0471, "step": 20945 }, { "epoch": 0.56, "learning_rate": 0.0008455173034749374, "loss": 2.557, "step": 20946 }, { "epoch": 0.56, "learning_rate": 0.0008454313097291269, "loss": 2.6412, "step": 20947 }, { "epoch": 0.56, "learning_rate": 0.0008453453171543003, "loss": 2.4765, "step": 20948 }, { "epoch": 0.56, "learning_rate": 0.0008452593257511103, "loss": 2.4899, "step": 20949 }, { "epoch": 0.56, "learning_rate": 0.0008451733355202085, "loss": 2.5428, "step": 20950 }, { "epoch": 0.56, "learning_rate": 0.0008450873464622453, "loss": 2.3035, "step": 20951 }, { "epoch": 0.56, "learning_rate": 0.0008450013585778724, "loss": 2.9061, "step": 20952 }, { "epoch": 0.56, "learning_rate": 0.0008449153718677421, "loss": 2.9407, "step": 20953 }, { "epoch": 0.56, "learning_rate": 0.0008448293863325049, "loss": 2.8618, "step": 20954 }, { "epoch": 0.56, "learning_rate": 0.0008447434019728127, "loss": 2.2339, "step": 20955 }, { "epoch": 0.56, "learning_rate": 0.0008446574187893166, "loss": 2.9466, "step": 20956 }, { "epoch": 0.56, "learning_rate": 0.000844571436782668, "loss": 2.246, "step": 20957 }, { "epoch": 0.56, "learning_rate": 0.0008444854559535187, "loss": 2.6854, "step": 20958 }, { "epoch": 0.56, "learning_rate": 0.0008443994763025196, "loss": 2.6273, "step": 20959 }, { "epoch": 0.56, "learning_rate": 0.0008443134978303221, "loss": 2.6828, "step": 20960 }, { "epoch": 0.56, "learning_rate": 0.000844227520537578, "loss": 2.8787, "step": 20961 }, { "epoch": 0.56, "learning_rate": 0.0008441415444249381, "loss": 2.6739, "step": 20962 }, { "epoch": 0.56, "learning_rate": 0.0008440555694930545, "loss": 2.3512, "step": 20963 }, { "epoch": 0.56, "learning_rate": 0.0008439695957425776, "loss": 2.6747, "step": 20964 }, { "epoch": 0.56, "learning_rate": 0.0008438836231741589, "loss": 2.7306, "step": 20965 }, { "epoch": 0.56, "learning_rate": 0.0008437976517884507, "loss": 2.4182, "step": 20966 }, { "epoch": 0.56, "learning_rate": 0.000843711681586103, "loss": 1.929, "step": 20967 }, { "epoch": 0.56, "learning_rate": 0.0008436257125677677, "loss": 3.0551, "step": 20968 }, { "epoch": 0.56, "learning_rate": 0.0008435397447340963, "loss": 3.0524, "step": 20969 }, { "epoch": 0.56, "learning_rate": 0.0008434537780857395, "loss": 2.4236, "step": 20970 }, { "epoch": 0.56, "learning_rate": 0.0008433678126233492, "loss": 2.562, "step": 20971 }, { "epoch": 0.56, "learning_rate": 0.0008432818483475761, "loss": 2.4658, "step": 20972 }, { "epoch": 0.56, "learning_rate": 0.0008431958852590717, "loss": 2.2215, "step": 20973 }, { "epoch": 0.56, "learning_rate": 0.0008431099233584874, "loss": 2.2265, "step": 20974 }, { "epoch": 0.56, "learning_rate": 0.0008430239626464742, "loss": 2.7875, "step": 20975 }, { "epoch": 0.56, "learning_rate": 0.0008429380031236833, "loss": 2.2464, "step": 20976 }, { "epoch": 0.56, "learning_rate": 0.0008428520447907664, "loss": 2.7112, "step": 20977 }, { "epoch": 0.56, "learning_rate": 0.0008427660876483737, "loss": 2.457, "step": 20978 }, { "epoch": 0.56, "learning_rate": 0.0008426801316971577, "loss": 2.6676, "step": 20979 }, { "epoch": 0.56, "learning_rate": 0.0008425941769377684, "loss": 2.77, "step": 20980 }, { "epoch": 0.56, "learning_rate": 0.0008425082233708576, "loss": 2.596, "step": 20981 }, { "epoch": 0.56, "learning_rate": 0.0008424222709970763, "loss": 2.2697, "step": 20982 }, { "epoch": 0.56, "learning_rate": 0.0008423363198170757, "loss": 2.5927, "step": 20983 }, { "epoch": 0.56, "learning_rate": 0.0008422503698315069, "loss": 2.3587, "step": 20984 }, { "epoch": 0.56, "learning_rate": 0.0008421644210410213, "loss": 3.0278, "step": 20985 }, { "epoch": 0.56, "learning_rate": 0.0008420784734462696, "loss": 2.5862, "step": 20986 }, { "epoch": 0.56, "learning_rate": 0.0008419925270479035, "loss": 2.5872, "step": 20987 }, { "epoch": 0.56, "learning_rate": 0.0008419065818465734, "loss": 2.8697, "step": 20988 }, { "epoch": 0.56, "learning_rate": 0.0008418206378429309, "loss": 2.4104, "step": 20989 }, { "epoch": 0.56, "learning_rate": 0.0008417346950376272, "loss": 2.3482, "step": 20990 }, { "epoch": 0.56, "learning_rate": 0.0008416487534313126, "loss": 2.6372, "step": 20991 }, { "epoch": 0.56, "learning_rate": 0.0008415628130246391, "loss": 2.4213, "step": 20992 }, { "epoch": 0.56, "learning_rate": 0.0008414768738182576, "loss": 2.5059, "step": 20993 }, { "epoch": 0.56, "learning_rate": 0.0008413909358128186, "loss": 2.6635, "step": 20994 }, { "epoch": 0.56, "learning_rate": 0.0008413049990089735, "loss": 2.578, "step": 20995 }, { "epoch": 0.56, "learning_rate": 0.0008412190634073738, "loss": 2.0818, "step": 20996 }, { "epoch": 0.56, "learning_rate": 0.0008411331290086697, "loss": 2.7459, "step": 20997 }, { "epoch": 0.56, "learning_rate": 0.0008410471958135129, "loss": 2.4752, "step": 20998 }, { "epoch": 0.56, "learning_rate": 0.0008409612638225537, "loss": 2.3867, "step": 20999 }, { "epoch": 0.56, "learning_rate": 0.0008408753330364437, "loss": 2.6755, "step": 21000 }, { "epoch": 0.56, "learning_rate": 0.0008407894034558339, "loss": 2.6298, "step": 21001 }, { "epoch": 0.56, "learning_rate": 0.0008407034750813749, "loss": 2.2291, "step": 21002 }, { "epoch": 0.56, "learning_rate": 0.000840617547913718, "loss": 2.7314, "step": 21003 }, { "epoch": 0.56, "learning_rate": 0.0008405316219535141, "loss": 2.6062, "step": 21004 }, { "epoch": 0.56, "learning_rate": 0.0008404456972014141, "loss": 2.5242, "step": 21005 }, { "epoch": 0.56, "learning_rate": 0.0008403597736580693, "loss": 2.526, "step": 21006 }, { "epoch": 0.56, "learning_rate": 0.0008402738513241298, "loss": 2.6453, "step": 21007 }, { "epoch": 0.56, "learning_rate": 0.0008401879302002469, "loss": 2.4527, "step": 21008 }, { "epoch": 0.56, "learning_rate": 0.0008401020102870723, "loss": 2.5747, "step": 21009 }, { "epoch": 0.56, "learning_rate": 0.0008400160915852559, "loss": 2.3568, "step": 21010 }, { "epoch": 0.56, "learning_rate": 0.000839930174095449, "loss": 2.1154, "step": 21011 }, { "epoch": 0.56, "learning_rate": 0.0008398442578183027, "loss": 2.9787, "step": 21012 }, { "epoch": 0.56, "learning_rate": 0.0008397583427544673, "loss": 2.5444, "step": 21013 }, { "epoch": 0.56, "learning_rate": 0.0008396724289045944, "loss": 2.5764, "step": 21014 }, { "epoch": 0.56, "learning_rate": 0.0008395865162693344, "loss": 2.6113, "step": 21015 }, { "epoch": 0.56, "learning_rate": 0.0008395006048493381, "loss": 2.6996, "step": 21016 }, { "epoch": 0.56, "learning_rate": 0.0008394146946452568, "loss": 2.5355, "step": 21017 }, { "epoch": 0.56, "learning_rate": 0.0008393287856577408, "loss": 2.4644, "step": 21018 }, { "epoch": 0.56, "learning_rate": 0.0008392428778874413, "loss": 2.9061, "step": 21019 }, { "epoch": 0.56, "learning_rate": 0.0008391569713350093, "loss": 2.6154, "step": 21020 }, { "epoch": 0.56, "learning_rate": 0.0008390710660010947, "loss": 2.4497, "step": 21021 }, { "epoch": 0.56, "learning_rate": 0.0008389851618863497, "loss": 2.5117, "step": 21022 }, { "epoch": 0.56, "learning_rate": 0.0008388992589914238, "loss": 2.6602, "step": 21023 }, { "epoch": 0.56, "learning_rate": 0.0008388133573169683, "loss": 2.3596, "step": 21024 }, { "epoch": 0.57, "learning_rate": 0.0008387274568636343, "loss": 2.1945, "step": 21025 }, { "epoch": 0.57, "learning_rate": 0.0008386415576320719, "loss": 2.7975, "step": 21026 }, { "epoch": 0.57, "learning_rate": 0.0008385556596229324, "loss": 2.9245, "step": 21027 }, { "epoch": 0.57, "learning_rate": 0.0008384697628368665, "loss": 2.5058, "step": 21028 }, { "epoch": 0.57, "learning_rate": 0.0008383838672745245, "loss": 2.4224, "step": 21029 }, { "epoch": 0.57, "learning_rate": 0.0008382979729365575, "loss": 2.821, "step": 21030 }, { "epoch": 0.57, "learning_rate": 0.0008382120798236163, "loss": 2.6176, "step": 21031 }, { "epoch": 0.57, "learning_rate": 0.0008381261879363513, "loss": 2.8513, "step": 21032 }, { "epoch": 0.57, "learning_rate": 0.0008380402972754138, "loss": 2.5071, "step": 21033 }, { "epoch": 0.57, "learning_rate": 0.0008379544078414533, "loss": 1.8492, "step": 21034 }, { "epoch": 0.57, "learning_rate": 0.0008378685196351217, "loss": 2.4444, "step": 21035 }, { "epoch": 0.57, "learning_rate": 0.0008377826326570694, "loss": 2.4702, "step": 21036 }, { "epoch": 0.57, "learning_rate": 0.0008376967469079465, "loss": 2.8093, "step": 21037 }, { "epoch": 0.57, "learning_rate": 0.0008376108623884038, "loss": 2.6042, "step": 21038 }, { "epoch": 0.57, "learning_rate": 0.0008375249790990929, "loss": 2.3792, "step": 21039 }, { "epoch": 0.57, "learning_rate": 0.0008374390970406632, "loss": 2.579, "step": 21040 }, { "epoch": 0.57, "learning_rate": 0.0008373532162137662, "loss": 2.8965, "step": 21041 }, { "epoch": 0.57, "learning_rate": 0.0008372673366190518, "loss": 2.2747, "step": 21042 }, { "epoch": 0.57, "learning_rate": 0.0008371814582571709, "loss": 2.9332, "step": 21043 }, { "epoch": 0.57, "learning_rate": 0.0008370955811287745, "loss": 2.4579, "step": 21044 }, { "epoch": 0.57, "learning_rate": 0.0008370097052345126, "loss": 2.7391, "step": 21045 }, { "epoch": 0.57, "learning_rate": 0.0008369238305750361, "loss": 2.7588, "step": 21046 }, { "epoch": 0.57, "learning_rate": 0.0008368379571509956, "loss": 2.1751, "step": 21047 }, { "epoch": 0.57, "learning_rate": 0.0008367520849630414, "loss": 2.7649, "step": 21048 }, { "epoch": 0.57, "learning_rate": 0.0008366662140118247, "loss": 2.7448, "step": 21049 }, { "epoch": 0.57, "learning_rate": 0.000836580344297995, "loss": 2.5141, "step": 21050 }, { "epoch": 0.57, "learning_rate": 0.0008364944758222033, "loss": 2.2457, "step": 21051 }, { "epoch": 0.57, "learning_rate": 0.0008364086085851008, "loss": 2.6224, "step": 21052 }, { "epoch": 0.57, "learning_rate": 0.0008363227425873371, "loss": 2.6956, "step": 21053 }, { "epoch": 0.57, "learning_rate": 0.0008362368778295629, "loss": 2.5964, "step": 21054 }, { "epoch": 0.57, "learning_rate": 0.0008361510143124291, "loss": 2.2904, "step": 21055 }, { "epoch": 0.57, "learning_rate": 0.0008360651520365859, "loss": 2.8375, "step": 21056 }, { "epoch": 0.57, "learning_rate": 0.0008359792910026838, "loss": 2.6485, "step": 21057 }, { "epoch": 0.57, "learning_rate": 0.000835893431211373, "loss": 2.291, "step": 21058 }, { "epoch": 0.57, "learning_rate": 0.0008358075726633043, "loss": 2.2081, "step": 21059 }, { "epoch": 0.57, "learning_rate": 0.0008357217153591284, "loss": 2.1458, "step": 21060 }, { "epoch": 0.57, "learning_rate": 0.000835635859299495, "loss": 2.3269, "step": 21061 }, { "epoch": 0.57, "learning_rate": 0.0008355500044850551, "loss": 2.3581, "step": 21062 }, { "epoch": 0.57, "learning_rate": 0.0008354641509164594, "loss": 2.3941, "step": 21063 }, { "epoch": 0.57, "learning_rate": 0.0008353782985943573, "loss": 2.8834, "step": 21064 }, { "epoch": 0.57, "learning_rate": 0.0008352924475193998, "loss": 2.2776, "step": 21065 }, { "epoch": 0.57, "learning_rate": 0.0008352065976922377, "loss": 2.704, "step": 21066 }, { "epoch": 0.57, "learning_rate": 0.0008351207491135206, "loss": 2.7313, "step": 21067 }, { "epoch": 0.57, "learning_rate": 0.0008350349017838995, "loss": 2.0061, "step": 21068 }, { "epoch": 0.57, "learning_rate": 0.0008349490557040243, "loss": 2.0219, "step": 21069 }, { "epoch": 0.57, "learning_rate": 0.0008348632108745453, "loss": 2.5136, "step": 21070 }, { "epoch": 0.57, "learning_rate": 0.0008347773672961135, "loss": 2.3882, "step": 21071 }, { "epoch": 0.57, "learning_rate": 0.0008346915249693787, "loss": 2.5985, "step": 21072 }, { "epoch": 0.57, "learning_rate": 0.0008346056838949912, "loss": 2.9115, "step": 21073 }, { "epoch": 0.57, "learning_rate": 0.0008345198440736017, "loss": 2.2774, "step": 21074 }, { "epoch": 0.57, "learning_rate": 0.0008344340055058601, "loss": 2.3399, "step": 21075 }, { "epoch": 0.57, "learning_rate": 0.0008343481681924172, "loss": 2.5432, "step": 21076 }, { "epoch": 0.57, "learning_rate": 0.0008342623321339225, "loss": 2.711, "step": 21077 }, { "epoch": 0.57, "learning_rate": 0.0008341764973310269, "loss": 2.6303, "step": 21078 }, { "epoch": 0.57, "learning_rate": 0.0008340906637843808, "loss": 2.4264, "step": 21079 }, { "epoch": 0.57, "learning_rate": 0.0008340048314946338, "loss": 2.4551, "step": 21080 }, { "epoch": 0.57, "learning_rate": 0.0008339190004624364, "loss": 2.4356, "step": 21081 }, { "epoch": 0.57, "learning_rate": 0.0008338331706884396, "loss": 2.2866, "step": 21082 }, { "epoch": 0.57, "learning_rate": 0.0008337473421732924, "loss": 2.7744, "step": 21083 }, { "epoch": 0.57, "learning_rate": 0.0008336615149176459, "loss": 2.5032, "step": 21084 }, { "epoch": 0.57, "learning_rate": 0.0008335756889221499, "loss": 2.4812, "step": 21085 }, { "epoch": 0.57, "learning_rate": 0.0008334898641874546, "loss": 2.7065, "step": 21086 }, { "epoch": 0.57, "learning_rate": 0.0008334040407142107, "loss": 2.6311, "step": 21087 }, { "epoch": 0.57, "learning_rate": 0.0008333182185030676, "loss": 2.3757, "step": 21088 }, { "epoch": 0.57, "learning_rate": 0.0008332323975546761, "loss": 2.3726, "step": 21089 }, { "epoch": 0.57, "learning_rate": 0.0008331465778696861, "loss": 2.2231, "step": 21090 }, { "epoch": 0.57, "learning_rate": 0.0008330607594487479, "loss": 2.7222, "step": 21091 }, { "epoch": 0.57, "learning_rate": 0.0008329749422925117, "loss": 2.4856, "step": 21092 }, { "epoch": 0.57, "learning_rate": 0.0008328891264016269, "loss": 2.329, "step": 21093 }, { "epoch": 0.57, "learning_rate": 0.0008328033117767444, "loss": 2.849, "step": 21094 }, { "epoch": 0.57, "learning_rate": 0.0008327174984185145, "loss": 2.9535, "step": 21095 }, { "epoch": 0.57, "learning_rate": 0.0008326316863275867, "loss": 2.4797, "step": 21096 }, { "epoch": 0.57, "learning_rate": 0.0008325458755046109, "loss": 2.8021, "step": 21097 }, { "epoch": 0.57, "learning_rate": 0.0008324600659502384, "loss": 1.7697, "step": 21098 }, { "epoch": 0.57, "learning_rate": 0.0008323742576651178, "loss": 2.668, "step": 21099 }, { "epoch": 0.57, "learning_rate": 0.0008322884506499001, "loss": 2.6633, "step": 21100 }, { "epoch": 0.57, "learning_rate": 0.0008322026449052353, "loss": 2.7628, "step": 21101 }, { "epoch": 0.57, "learning_rate": 0.000832116840431773, "loss": 2.3847, "step": 21102 }, { "epoch": 0.57, "learning_rate": 0.0008320310372301638, "loss": 2.6586, "step": 21103 }, { "epoch": 0.57, "learning_rate": 0.0008319452353010571, "loss": 2.7287, "step": 21104 }, { "epoch": 0.57, "learning_rate": 0.0008318594346451032, "loss": 2.3534, "step": 21105 }, { "epoch": 0.57, "learning_rate": 0.0008317736352629525, "loss": 2.9112, "step": 21106 }, { "epoch": 0.57, "learning_rate": 0.0008316878371552545, "loss": 2.3418, "step": 21107 }, { "epoch": 0.57, "learning_rate": 0.0008316020403226592, "loss": 2.7553, "step": 21108 }, { "epoch": 0.57, "learning_rate": 0.0008315162447658173, "loss": 2.4756, "step": 21109 }, { "epoch": 0.57, "learning_rate": 0.0008314304504853776, "loss": 2.8285, "step": 21110 }, { "epoch": 0.57, "learning_rate": 0.0008313446574819912, "loss": 2.0258, "step": 21111 }, { "epoch": 0.57, "learning_rate": 0.0008312588657563071, "loss": 2.4747, "step": 21112 }, { "epoch": 0.57, "learning_rate": 0.0008311730753089757, "loss": 2.4428, "step": 21113 }, { "epoch": 0.57, "learning_rate": 0.0008310872861406471, "loss": 2.482, "step": 21114 }, { "epoch": 0.57, "learning_rate": 0.0008310014982519708, "loss": 2.5079, "step": 21115 }, { "epoch": 0.57, "learning_rate": 0.0008309157116435969, "loss": 2.4652, "step": 21116 }, { "epoch": 0.57, "learning_rate": 0.0008308299263161756, "loss": 2.2141, "step": 21117 }, { "epoch": 0.57, "learning_rate": 0.0008307441422703563, "loss": 2.0696, "step": 21118 }, { "epoch": 0.57, "learning_rate": 0.0008306583595067893, "loss": 2.422, "step": 21119 }, { "epoch": 0.57, "learning_rate": 0.0008305725780261242, "loss": 2.6804, "step": 21120 }, { "epoch": 0.57, "learning_rate": 0.0008304867978290109, "loss": 2.1432, "step": 21121 }, { "epoch": 0.57, "learning_rate": 0.0008304010189160997, "loss": 2.7669, "step": 21122 }, { "epoch": 0.57, "learning_rate": 0.0008303152412880394, "loss": 2.616, "step": 21123 }, { "epoch": 0.57, "learning_rate": 0.0008302294649454808, "loss": 2.8066, "step": 21124 }, { "epoch": 0.57, "learning_rate": 0.0008301436898890737, "loss": 2.2351, "step": 21125 }, { "epoch": 0.57, "learning_rate": 0.0008300579161194673, "loss": 2.4679, "step": 21126 }, { "epoch": 0.57, "learning_rate": 0.000829972143637312, "loss": 2.5146, "step": 21127 }, { "epoch": 0.57, "learning_rate": 0.0008298863724432572, "loss": 2.6911, "step": 21128 }, { "epoch": 0.57, "learning_rate": 0.0008298006025379527, "loss": 2.3413, "step": 21129 }, { "epoch": 0.57, "learning_rate": 0.0008297148339220486, "loss": 2.4117, "step": 21130 }, { "epoch": 0.57, "learning_rate": 0.0008296290665961943, "loss": 2.4568, "step": 21131 }, { "epoch": 0.57, "learning_rate": 0.0008295433005610398, "loss": 2.3665, "step": 21132 }, { "epoch": 0.57, "learning_rate": 0.0008294575358172349, "loss": 2.6965, "step": 21133 }, { "epoch": 0.57, "learning_rate": 0.0008293717723654291, "loss": 2.6651, "step": 21134 }, { "epoch": 0.57, "learning_rate": 0.0008292860102062725, "loss": 2.5008, "step": 21135 }, { "epoch": 0.57, "learning_rate": 0.0008292002493404141, "loss": 2.0824, "step": 21136 }, { "epoch": 0.57, "learning_rate": 0.0008291144897685041, "loss": 2.1616, "step": 21137 }, { "epoch": 0.57, "learning_rate": 0.0008290287314911928, "loss": 2.5941, "step": 21138 }, { "epoch": 0.57, "learning_rate": 0.0008289429745091287, "loss": 2.67, "step": 21139 }, { "epoch": 0.57, "learning_rate": 0.0008288572188229619, "loss": 2.6267, "step": 21140 }, { "epoch": 0.57, "learning_rate": 0.0008287714644333429, "loss": 2.6683, "step": 21141 }, { "epoch": 0.57, "learning_rate": 0.0008286857113409202, "loss": 2.3962, "step": 21142 }, { "epoch": 0.57, "learning_rate": 0.0008285999595463438, "loss": 2.5018, "step": 21143 }, { "epoch": 0.57, "learning_rate": 0.0008285142090502639, "loss": 2.4956, "step": 21144 }, { "epoch": 0.57, "learning_rate": 0.0008284284598533293, "loss": 2.6578, "step": 21145 }, { "epoch": 0.57, "learning_rate": 0.0008283427119561903, "loss": 2.6075, "step": 21146 }, { "epoch": 0.57, "learning_rate": 0.000828256965359496, "loss": 2.7962, "step": 21147 }, { "epoch": 0.57, "learning_rate": 0.0008281712200638962, "loss": 2.52, "step": 21148 }, { "epoch": 0.57, "learning_rate": 0.0008280854760700408, "loss": 2.4954, "step": 21149 }, { "epoch": 0.57, "learning_rate": 0.0008279997333785788, "loss": 2.5392, "step": 21150 }, { "epoch": 0.57, "learning_rate": 0.0008279139919901602, "loss": 2.0279, "step": 21151 }, { "epoch": 0.57, "learning_rate": 0.0008278282519054347, "loss": 2.9083, "step": 21152 }, { "epoch": 0.57, "learning_rate": 0.0008277425131250511, "loss": 2.5992, "step": 21153 }, { "epoch": 0.57, "learning_rate": 0.0008276567756496599, "loss": 2.5625, "step": 21154 }, { "epoch": 0.57, "learning_rate": 0.0008275710394799098, "loss": 2.6538, "step": 21155 }, { "epoch": 0.57, "learning_rate": 0.0008274853046164508, "loss": 2.3938, "step": 21156 }, { "epoch": 0.57, "learning_rate": 0.0008273995710599322, "loss": 2.4614, "step": 21157 }, { "epoch": 0.57, "learning_rate": 0.0008273138388110036, "loss": 2.6954, "step": 21158 }, { "epoch": 0.57, "learning_rate": 0.0008272281078703145, "loss": 2.5192, "step": 21159 }, { "epoch": 0.57, "learning_rate": 0.0008271423782385146, "loss": 2.2941, "step": 21160 }, { "epoch": 0.57, "learning_rate": 0.0008270566499162528, "loss": 2.5542, "step": 21161 }, { "epoch": 0.57, "learning_rate": 0.0008269709229041792, "loss": 2.5891, "step": 21162 }, { "epoch": 0.57, "learning_rate": 0.0008268851972029426, "loss": 2.3679, "step": 21163 }, { "epoch": 0.57, "learning_rate": 0.000826799472813193, "loss": 2.5473, "step": 21164 }, { "epoch": 0.57, "learning_rate": 0.0008267137497355799, "loss": 2.312, "step": 21165 }, { "epoch": 0.57, "learning_rate": 0.0008266280279707518, "loss": 2.2854, "step": 21166 }, { "epoch": 0.57, "learning_rate": 0.0008265423075193592, "loss": 2.6195, "step": 21167 }, { "epoch": 0.57, "learning_rate": 0.0008264565883820512, "loss": 3.2265, "step": 21168 }, { "epoch": 0.57, "learning_rate": 0.0008263708705594769, "loss": 2.3114, "step": 21169 }, { "epoch": 0.57, "learning_rate": 0.0008262851540522859, "loss": 2.4955, "step": 21170 }, { "epoch": 0.57, "learning_rate": 0.0008261994388611274, "loss": 2.5132, "step": 21171 }, { "epoch": 0.57, "learning_rate": 0.0008261137249866507, "loss": 2.7871, "step": 21172 }, { "epoch": 0.57, "learning_rate": 0.0008260280124295057, "loss": 2.0651, "step": 21173 }, { "epoch": 0.57, "learning_rate": 0.0008259423011903411, "loss": 2.4971, "step": 21174 }, { "epoch": 0.57, "learning_rate": 0.0008258565912698065, "loss": 2.3699, "step": 21175 }, { "epoch": 0.57, "learning_rate": 0.0008257708826685515, "loss": 2.5669, "step": 21176 }, { "epoch": 0.57, "learning_rate": 0.0008256851753872249, "loss": 2.42, "step": 21177 }, { "epoch": 0.57, "learning_rate": 0.0008255994694264762, "loss": 2.6725, "step": 21178 }, { "epoch": 0.57, "learning_rate": 0.0008255137647869551, "loss": 2.6874, "step": 21179 }, { "epoch": 0.57, "learning_rate": 0.0008254280614693101, "loss": 2.8814, "step": 21180 }, { "epoch": 0.57, "learning_rate": 0.0008253423594741916, "loss": 2.6214, "step": 21181 }, { "epoch": 0.57, "learning_rate": 0.0008252566588022475, "loss": 2.3228, "step": 21182 }, { "epoch": 0.57, "learning_rate": 0.0008251709594541274, "loss": 2.9692, "step": 21183 }, { "epoch": 0.57, "learning_rate": 0.0008250852614304818, "loss": 2.86, "step": 21184 }, { "epoch": 0.57, "learning_rate": 0.0008249995647319583, "loss": 2.5107, "step": 21185 }, { "epoch": 0.57, "learning_rate": 0.0008249138693592069, "loss": 2.6678, "step": 21186 }, { "epoch": 0.57, "learning_rate": 0.0008248281753128771, "loss": 2.8745, "step": 21187 }, { "epoch": 0.57, "learning_rate": 0.0008247424825936174, "loss": 2.2227, "step": 21188 }, { "epoch": 0.57, "learning_rate": 0.0008246567912020775, "loss": 2.3836, "step": 21189 }, { "epoch": 0.57, "learning_rate": 0.0008245711011389061, "loss": 2.5062, "step": 21190 }, { "epoch": 0.57, "learning_rate": 0.0008244854124047528, "loss": 2.2266, "step": 21191 }, { "epoch": 0.57, "learning_rate": 0.0008243997250002668, "loss": 2.7222, "step": 21192 }, { "epoch": 0.57, "learning_rate": 0.0008243140389260969, "loss": 2.6055, "step": 21193 }, { "epoch": 0.57, "learning_rate": 0.0008242283541828924, "loss": 2.8981, "step": 21194 }, { "epoch": 0.57, "learning_rate": 0.000824142670771303, "loss": 2.6278, "step": 21195 }, { "epoch": 0.57, "learning_rate": 0.0008240569886919766, "loss": 2.435, "step": 21196 }, { "epoch": 0.57, "learning_rate": 0.0008239713079455635, "loss": 2.6408, "step": 21197 }, { "epoch": 0.57, "learning_rate": 0.0008238856285327121, "loss": 2.6904, "step": 21198 }, { "epoch": 0.57, "learning_rate": 0.0008237999504540715, "loss": 2.9866, "step": 21199 }, { "epoch": 0.57, "learning_rate": 0.0008237142737102913, "loss": 2.3166, "step": 21200 }, { "epoch": 0.57, "learning_rate": 0.00082362859830202, "loss": 2.6063, "step": 21201 }, { "epoch": 0.57, "learning_rate": 0.0008235429242299068, "loss": 2.455, "step": 21202 }, { "epoch": 0.57, "learning_rate": 0.0008234572514946013, "loss": 2.4358, "step": 21203 }, { "epoch": 0.57, "learning_rate": 0.0008233715800967516, "loss": 2.766, "step": 21204 }, { "epoch": 0.57, "learning_rate": 0.0008232859100370075, "loss": 2.6162, "step": 21205 }, { "epoch": 0.57, "learning_rate": 0.0008232002413160178, "loss": 2.2836, "step": 21206 }, { "epoch": 0.57, "learning_rate": 0.0008231145739344312, "loss": 2.6296, "step": 21207 }, { "epoch": 0.57, "learning_rate": 0.0008230289078928976, "loss": 2.4945, "step": 21208 }, { "epoch": 0.57, "learning_rate": 0.0008229432431920646, "loss": 2.4994, "step": 21209 }, { "epoch": 0.57, "learning_rate": 0.0008228575798325821, "loss": 2.5067, "step": 21210 }, { "epoch": 0.57, "learning_rate": 0.0008227719178150994, "loss": 2.6527, "step": 21211 }, { "epoch": 0.57, "learning_rate": 0.0008226862571402645, "loss": 2.7677, "step": 21212 }, { "epoch": 0.57, "learning_rate": 0.0008226005978087266, "loss": 2.6064, "step": 21213 }, { "epoch": 0.57, "learning_rate": 0.0008225149398211355, "loss": 2.3721, "step": 21214 }, { "epoch": 0.57, "learning_rate": 0.0008224292831781391, "loss": 2.3947, "step": 21215 }, { "epoch": 0.57, "learning_rate": 0.000822343627880387, "loss": 2.2343, "step": 21216 }, { "epoch": 0.57, "learning_rate": 0.0008222579739285274, "loss": 2.5796, "step": 21217 }, { "epoch": 0.57, "learning_rate": 0.0008221723213232097, "loss": 2.1728, "step": 21218 }, { "epoch": 0.57, "learning_rate": 0.0008220866700650829, "loss": 2.5994, "step": 21219 }, { "epoch": 0.57, "learning_rate": 0.0008220010201547955, "loss": 2.515, "step": 21220 }, { "epoch": 0.57, "learning_rate": 0.0008219153715929966, "loss": 2.3542, "step": 21221 }, { "epoch": 0.57, "learning_rate": 0.0008218297243803351, "loss": 2.2709, "step": 21222 }, { "epoch": 0.57, "learning_rate": 0.0008217440785174596, "loss": 2.8132, "step": 21223 }, { "epoch": 0.57, "learning_rate": 0.0008216584340050195, "loss": 2.5526, "step": 21224 }, { "epoch": 0.57, "learning_rate": 0.0008215727908436628, "loss": 2.4404, "step": 21225 }, { "epoch": 0.57, "learning_rate": 0.0008214871490340386, "loss": 2.6083, "step": 21226 }, { "epoch": 0.57, "learning_rate": 0.0008214015085767964, "loss": 2.5853, "step": 21227 }, { "epoch": 0.57, "learning_rate": 0.000821315869472584, "loss": 2.7735, "step": 21228 }, { "epoch": 0.57, "learning_rate": 0.0008212302317220506, "loss": 2.4226, "step": 21229 }, { "epoch": 0.57, "learning_rate": 0.0008211445953258453, "loss": 2.5802, "step": 21230 }, { "epoch": 0.57, "learning_rate": 0.0008210589602846163, "loss": 2.25, "step": 21231 }, { "epoch": 0.57, "learning_rate": 0.0008209733265990129, "loss": 2.8866, "step": 21232 }, { "epoch": 0.57, "learning_rate": 0.0008208876942696834, "loss": 2.7201, "step": 21233 }, { "epoch": 0.57, "learning_rate": 0.0008208020632972766, "loss": 2.353, "step": 21234 }, { "epoch": 0.57, "learning_rate": 0.0008207164336824415, "loss": 2.2218, "step": 21235 }, { "epoch": 0.57, "learning_rate": 0.0008206308054258265, "loss": 2.7084, "step": 21236 }, { "epoch": 0.57, "learning_rate": 0.0008205451785280806, "loss": 2.6302, "step": 21237 }, { "epoch": 0.57, "learning_rate": 0.0008204595529898525, "loss": 2.3818, "step": 21238 }, { "epoch": 0.57, "learning_rate": 0.0008203739288117902, "loss": 2.6809, "step": 21239 }, { "epoch": 0.57, "learning_rate": 0.0008202883059945436, "loss": 2.6049, "step": 21240 }, { "epoch": 0.57, "learning_rate": 0.0008202026845387602, "loss": 2.3839, "step": 21241 }, { "epoch": 0.57, "learning_rate": 0.000820117064445089, "loss": 2.0528, "step": 21242 }, { "epoch": 0.57, "learning_rate": 0.0008200314457141793, "loss": 2.2777, "step": 21243 }, { "epoch": 0.57, "learning_rate": 0.0008199458283466787, "loss": 2.17, "step": 21244 }, { "epoch": 0.57, "learning_rate": 0.0008198602123432363, "loss": 2.1761, "step": 21245 }, { "epoch": 0.57, "learning_rate": 0.000819774597704501, "loss": 2.4586, "step": 21246 }, { "epoch": 0.57, "learning_rate": 0.000819688984431121, "loss": 2.583, "step": 21247 }, { "epoch": 0.57, "learning_rate": 0.0008196033725237448, "loss": 2.6412, "step": 21248 }, { "epoch": 0.57, "learning_rate": 0.0008195177619830217, "loss": 2.2723, "step": 21249 }, { "epoch": 0.57, "learning_rate": 0.0008194321528095993, "loss": 2.5428, "step": 21250 }, { "epoch": 0.57, "learning_rate": 0.0008193465450041272, "loss": 2.3608, "step": 21251 }, { "epoch": 0.57, "learning_rate": 0.0008192609385672527, "loss": 2.4361, "step": 21252 }, { "epoch": 0.57, "learning_rate": 0.0008191753334996253, "loss": 2.5433, "step": 21253 }, { "epoch": 0.57, "learning_rate": 0.0008190897298018936, "loss": 2.7186, "step": 21254 }, { "epoch": 0.57, "learning_rate": 0.0008190041274747051, "loss": 2.4267, "step": 21255 }, { "epoch": 0.57, "learning_rate": 0.0008189185265187091, "loss": 2.5504, "step": 21256 }, { "epoch": 0.57, "learning_rate": 0.0008188329269345545, "loss": 2.4346, "step": 21257 }, { "epoch": 0.57, "learning_rate": 0.000818747328722889, "loss": 2.4765, "step": 21258 }, { "epoch": 0.57, "learning_rate": 0.0008186617318843613, "loss": 2.4911, "step": 21259 }, { "epoch": 0.57, "learning_rate": 0.0008185761364196199, "loss": 2.5063, "step": 21260 }, { "epoch": 0.57, "learning_rate": 0.0008184905423293129, "loss": 2.1669, "step": 21261 }, { "epoch": 0.57, "learning_rate": 0.0008184049496140896, "loss": 2.4963, "step": 21262 }, { "epoch": 0.57, "learning_rate": 0.0008183193582745977, "loss": 2.5092, "step": 21263 }, { "epoch": 0.57, "learning_rate": 0.0008182337683114857, "loss": 2.8694, "step": 21264 }, { "epoch": 0.57, "learning_rate": 0.0008181481797254026, "loss": 2.2999, "step": 21265 }, { "epoch": 0.57, "learning_rate": 0.0008180625925169961, "loss": 2.5344, "step": 21266 }, { "epoch": 0.57, "learning_rate": 0.0008179770066869152, "loss": 2.7087, "step": 21267 }, { "epoch": 0.57, "learning_rate": 0.0008178914222358075, "loss": 1.8977, "step": 21268 }, { "epoch": 0.57, "learning_rate": 0.0008178058391643218, "loss": 2.8685, "step": 21269 }, { "epoch": 0.57, "learning_rate": 0.000817720257473107, "loss": 2.8474, "step": 21270 }, { "epoch": 0.57, "learning_rate": 0.0008176346771628107, "loss": 2.25, "step": 21271 }, { "epoch": 0.57, "learning_rate": 0.0008175490982340811, "loss": 2.5332, "step": 21272 }, { "epoch": 0.57, "learning_rate": 0.0008174635206875675, "loss": 2.8038, "step": 21273 }, { "epoch": 0.57, "learning_rate": 0.0008173779445239173, "loss": 2.4287, "step": 21274 }, { "epoch": 0.57, "learning_rate": 0.0008172923697437794, "loss": 2.1472, "step": 21275 }, { "epoch": 0.57, "learning_rate": 0.0008172067963478016, "loss": 2.2822, "step": 21276 }, { "epoch": 0.57, "learning_rate": 0.0008171212243366324, "loss": 2.355, "step": 21277 }, { "epoch": 0.57, "learning_rate": 0.0008170356537109203, "loss": 2.3907, "step": 21278 }, { "epoch": 0.57, "learning_rate": 0.0008169500844713132, "loss": 2.6201, "step": 21279 }, { "epoch": 0.57, "learning_rate": 0.0008168645166184594, "loss": 1.9702, "step": 21280 }, { "epoch": 0.57, "learning_rate": 0.0008167789501530076, "loss": 2.6648, "step": 21281 }, { "epoch": 0.57, "learning_rate": 0.0008166933850756056, "loss": 2.7669, "step": 21282 }, { "epoch": 0.57, "learning_rate": 0.0008166078213869021, "loss": 2.4176, "step": 21283 }, { "epoch": 0.57, "learning_rate": 0.0008165222590875445, "loss": 2.7734, "step": 21284 }, { "epoch": 0.57, "learning_rate": 0.0008164366981781812, "loss": 2.5666, "step": 21285 }, { "epoch": 0.57, "learning_rate": 0.0008163511386594614, "loss": 2.171, "step": 21286 }, { "epoch": 0.57, "learning_rate": 0.000816265580532032, "loss": 2.3566, "step": 21287 }, { "epoch": 0.57, "learning_rate": 0.0008161800237965419, "loss": 2.1179, "step": 21288 }, { "epoch": 0.57, "learning_rate": 0.0008160944684536391, "loss": 2.4262, "step": 21289 }, { "epoch": 0.57, "learning_rate": 0.0008160089145039716, "loss": 2.8537, "step": 21290 }, { "epoch": 0.57, "learning_rate": 0.0008159233619481876, "loss": 2.6635, "step": 21291 }, { "epoch": 0.57, "learning_rate": 0.0008158378107869357, "loss": 2.4411, "step": 21292 }, { "epoch": 0.57, "learning_rate": 0.0008157522610208632, "loss": 2.3116, "step": 21293 }, { "epoch": 0.57, "learning_rate": 0.000815666712650619, "loss": 2.1148, "step": 21294 }, { "epoch": 0.57, "learning_rate": 0.0008155811656768505, "loss": 2.2188, "step": 21295 }, { "epoch": 0.57, "learning_rate": 0.0008154956201002062, "loss": 2.7381, "step": 21296 }, { "epoch": 0.57, "learning_rate": 0.0008154100759213345, "loss": 2.7017, "step": 21297 }, { "epoch": 0.57, "learning_rate": 0.0008153245331408823, "loss": 2.8095, "step": 21298 }, { "epoch": 0.57, "learning_rate": 0.0008152389917594988, "loss": 2.351, "step": 21299 }, { "epoch": 0.57, "learning_rate": 0.0008151534517778319, "loss": 2.8142, "step": 21300 }, { "epoch": 0.57, "learning_rate": 0.0008150679131965292, "loss": 2.4278, "step": 21301 }, { "epoch": 0.57, "learning_rate": 0.000814982376016239, "loss": 2.2294, "step": 21302 }, { "epoch": 0.57, "learning_rate": 0.0008148968402376092, "loss": 3.0577, "step": 21303 }, { "epoch": 0.57, "learning_rate": 0.0008148113058612876, "loss": 2.2829, "step": 21304 }, { "epoch": 0.57, "learning_rate": 0.0008147257728879228, "loss": 2.7428, "step": 21305 }, { "epoch": 0.57, "learning_rate": 0.0008146402413181621, "loss": 2.2524, "step": 21306 }, { "epoch": 0.57, "learning_rate": 0.0008145547111526539, "loss": 2.3395, "step": 21307 }, { "epoch": 0.57, "learning_rate": 0.0008144691823920463, "loss": 2.2949, "step": 21308 }, { "epoch": 0.57, "learning_rate": 0.0008143836550369868, "loss": 2.2696, "step": 21309 }, { "epoch": 0.57, "learning_rate": 0.0008142981290881238, "loss": 2.5453, "step": 21310 }, { "epoch": 0.57, "learning_rate": 0.0008142126045461045, "loss": 2.5088, "step": 21311 }, { "epoch": 0.57, "learning_rate": 0.0008141270814115773, "loss": 2.6217, "step": 21312 }, { "epoch": 0.57, "learning_rate": 0.0008140415596851907, "loss": 2.449, "step": 21313 }, { "epoch": 0.57, "learning_rate": 0.0008139560393675916, "loss": 2.5447, "step": 21314 }, { "epoch": 0.57, "learning_rate": 0.000813870520459428, "loss": 2.614, "step": 21315 }, { "epoch": 0.57, "learning_rate": 0.0008137850029613488, "loss": 2.4476, "step": 21316 }, { "epoch": 0.57, "learning_rate": 0.0008136994868740004, "loss": 2.2739, "step": 21317 }, { "epoch": 0.57, "learning_rate": 0.0008136139721980319, "loss": 2.3543, "step": 21318 }, { "epoch": 0.57, "learning_rate": 0.0008135284589340904, "loss": 2.418, "step": 21319 }, { "epoch": 0.57, "learning_rate": 0.0008134429470828238, "loss": 2.9118, "step": 21320 }, { "epoch": 0.57, "learning_rate": 0.0008133574366448803, "loss": 2.6796, "step": 21321 }, { "epoch": 0.57, "learning_rate": 0.0008132719276209073, "loss": 2.7776, "step": 21322 }, { "epoch": 0.57, "learning_rate": 0.0008131864200115528, "loss": 2.4849, "step": 21323 }, { "epoch": 0.57, "learning_rate": 0.0008131009138174648, "loss": 2.7923, "step": 21324 }, { "epoch": 0.57, "learning_rate": 0.0008130154090392908, "loss": 2.6773, "step": 21325 }, { "epoch": 0.57, "learning_rate": 0.0008129299056776785, "loss": 2.2008, "step": 21326 }, { "epoch": 0.57, "learning_rate": 0.0008128444037332762, "loss": 2.2767, "step": 21327 }, { "epoch": 0.57, "learning_rate": 0.0008127589032067307, "loss": 2.4644, "step": 21328 }, { "epoch": 0.57, "learning_rate": 0.0008126734040986907, "loss": 2.7533, "step": 21329 }, { "epoch": 0.57, "learning_rate": 0.0008125879064098033, "loss": 2.7672, "step": 21330 }, { "epoch": 0.57, "learning_rate": 0.0008125024101407162, "loss": 2.5071, "step": 21331 }, { "epoch": 0.57, "learning_rate": 0.0008124169152920777, "loss": 2.467, "step": 21332 }, { "epoch": 0.57, "learning_rate": 0.0008123314218645349, "loss": 2.653, "step": 21333 }, { "epoch": 0.57, "learning_rate": 0.0008122459298587357, "loss": 2.2079, "step": 21334 }, { "epoch": 0.57, "learning_rate": 0.000812160439275328, "loss": 2.7628, "step": 21335 }, { "epoch": 0.57, "learning_rate": 0.0008120749501149588, "loss": 2.4236, "step": 21336 }, { "epoch": 0.57, "learning_rate": 0.0008119894623782766, "loss": 2.9143, "step": 21337 }, { "epoch": 0.57, "learning_rate": 0.0008119039760659283, "loss": 2.6045, "step": 21338 }, { "epoch": 0.57, "learning_rate": 0.0008118184911785619, "loss": 2.613, "step": 21339 }, { "epoch": 0.57, "learning_rate": 0.0008117330077168254, "loss": 2.3901, "step": 21340 }, { "epoch": 0.57, "learning_rate": 0.0008116475256813654, "loss": 2.3077, "step": 21341 }, { "epoch": 0.57, "learning_rate": 0.0008115620450728301, "loss": 2.4532, "step": 21342 }, { "epoch": 0.57, "learning_rate": 0.0008114765658918675, "loss": 2.3705, "step": 21343 }, { "epoch": 0.57, "learning_rate": 0.0008113910881391244, "loss": 2.5675, "step": 21344 }, { "epoch": 0.57, "learning_rate": 0.000811305611815249, "loss": 2.1715, "step": 21345 }, { "epoch": 0.57, "learning_rate": 0.0008112201369208882, "loss": 2.3173, "step": 21346 }, { "epoch": 0.57, "learning_rate": 0.00081113466345669, "loss": 2.4751, "step": 21347 }, { "epoch": 0.57, "learning_rate": 0.0008110491914233019, "loss": 2.653, "step": 21348 }, { "epoch": 0.57, "learning_rate": 0.0008109637208213713, "loss": 2.1934, "step": 21349 }, { "epoch": 0.57, "learning_rate": 0.0008108782516515456, "loss": 2.9573, "step": 21350 }, { "epoch": 0.57, "learning_rate": 0.0008107927839144728, "loss": 2.4492, "step": 21351 }, { "epoch": 0.57, "learning_rate": 0.0008107073176107998, "loss": 2.6768, "step": 21352 }, { "epoch": 0.57, "learning_rate": 0.0008106218527411746, "loss": 2.3134, "step": 21353 }, { "epoch": 0.57, "learning_rate": 0.0008105363893062439, "loss": 2.7152, "step": 21354 }, { "epoch": 0.57, "learning_rate": 0.0008104509273066557, "loss": 2.746, "step": 21355 }, { "epoch": 0.57, "learning_rate": 0.000810365466743058, "loss": 2.4373, "step": 21356 }, { "epoch": 0.57, "learning_rate": 0.000810280007616097, "loss": 2.6056, "step": 21357 }, { "epoch": 0.57, "learning_rate": 0.0008101945499264207, "loss": 2.462, "step": 21358 }, { "epoch": 0.57, "learning_rate": 0.0008101090936746771, "loss": 2.6699, "step": 21359 }, { "epoch": 0.57, "learning_rate": 0.0008100236388615126, "loss": 2.1359, "step": 21360 }, { "epoch": 0.57, "learning_rate": 0.0008099381854875751, "loss": 2.4809, "step": 21361 }, { "epoch": 0.57, "learning_rate": 0.0008098527335535122, "loss": 2.7882, "step": 21362 }, { "epoch": 0.57, "learning_rate": 0.0008097672830599707, "loss": 2.4007, "step": 21363 }, { "epoch": 0.57, "learning_rate": 0.0008096818340075986, "loss": 2.6441, "step": 21364 }, { "epoch": 0.57, "learning_rate": 0.0008095963863970426, "loss": 2.2646, "step": 21365 }, { "epoch": 0.57, "learning_rate": 0.0008095109402289502, "loss": 2.206, "step": 21366 }, { "epoch": 0.57, "learning_rate": 0.0008094254955039692, "loss": 2.4921, "step": 21367 }, { "epoch": 0.57, "learning_rate": 0.0008093400522227464, "loss": 2.4903, "step": 21368 }, { "epoch": 0.57, "learning_rate": 0.0008092546103859293, "loss": 2.4314, "step": 21369 }, { "epoch": 0.57, "learning_rate": 0.0008091691699941654, "loss": 2.443, "step": 21370 }, { "epoch": 0.57, "learning_rate": 0.0008090837310481014, "loss": 2.6482, "step": 21371 }, { "epoch": 0.57, "learning_rate": 0.0008089982935483854, "loss": 2.2663, "step": 21372 }, { "epoch": 0.57, "learning_rate": 0.0008089128574956637, "loss": 2.104, "step": 21373 }, { "epoch": 0.57, "learning_rate": 0.0008088274228905841, "loss": 2.6291, "step": 21374 }, { "epoch": 0.57, "learning_rate": 0.000808741989733794, "loss": 2.5653, "step": 21375 }, { "epoch": 0.57, "learning_rate": 0.0008086565580259401, "loss": 2.0015, "step": 21376 }, { "epoch": 0.57, "learning_rate": 0.0008085711277676699, "loss": 2.6401, "step": 21377 }, { "epoch": 0.57, "learning_rate": 0.000808485698959631, "loss": 2.6721, "step": 21378 }, { "epoch": 0.57, "learning_rate": 0.0008084002716024697, "loss": 2.5365, "step": 21379 }, { "epoch": 0.57, "learning_rate": 0.0008083148456968341, "loss": 2.6351, "step": 21380 }, { "epoch": 0.57, "learning_rate": 0.0008082294212433707, "loss": 2.2474, "step": 21381 }, { "epoch": 0.57, "learning_rate": 0.000808143998242727, "loss": 2.6675, "step": 21382 }, { "epoch": 0.57, "learning_rate": 0.0008080585766955504, "loss": 2.427, "step": 21383 }, { "epoch": 0.57, "learning_rate": 0.0008079731566024871, "loss": 2.5836, "step": 21384 }, { "epoch": 0.57, "learning_rate": 0.0008078877379641851, "loss": 3.0226, "step": 21385 }, { "epoch": 0.57, "learning_rate": 0.0008078023207812915, "loss": 2.2497, "step": 21386 }, { "epoch": 0.57, "learning_rate": 0.0008077169050544529, "loss": 2.3573, "step": 21387 }, { "epoch": 0.57, "learning_rate": 0.0008076314907843169, "loss": 2.6125, "step": 21388 }, { "epoch": 0.57, "learning_rate": 0.00080754607797153, "loss": 1.8125, "step": 21389 }, { "epoch": 0.57, "learning_rate": 0.0008074606666167396, "loss": 2.2251, "step": 21390 }, { "epoch": 0.57, "learning_rate": 0.000807375256720593, "loss": 2.4452, "step": 21391 }, { "epoch": 0.57, "learning_rate": 0.0008072898482837369, "loss": 2.6547, "step": 21392 }, { "epoch": 0.57, "learning_rate": 0.0008072044413068184, "loss": 2.4552, "step": 21393 }, { "epoch": 0.57, "learning_rate": 0.0008071190357904847, "loss": 2.2992, "step": 21394 }, { "epoch": 0.57, "learning_rate": 0.0008070336317353826, "loss": 2.6089, "step": 21395 }, { "epoch": 0.57, "learning_rate": 0.0008069482291421596, "loss": 2.9719, "step": 21396 }, { "epoch": 0.58, "learning_rate": 0.0008068628280114616, "loss": 2.3572, "step": 21397 }, { "epoch": 0.58, "learning_rate": 0.0008067774283439367, "loss": 2.5676, "step": 21398 }, { "epoch": 0.58, "learning_rate": 0.0008066920301402316, "loss": 2.4972, "step": 21399 }, { "epoch": 0.58, "learning_rate": 0.0008066066334009929, "loss": 2.5896, "step": 21400 }, { "epoch": 0.58, "learning_rate": 0.0008065212381268674, "loss": 2.3618, "step": 21401 }, { "epoch": 0.58, "learning_rate": 0.0008064358443185031, "loss": 2.4688, "step": 21402 }, { "epoch": 0.58, "learning_rate": 0.0008063504519765459, "loss": 2.3258, "step": 21403 }, { "epoch": 0.58, "learning_rate": 0.0008062650611016431, "loss": 2.555, "step": 21404 }, { "epoch": 0.58, "learning_rate": 0.0008061796716944416, "loss": 2.5574, "step": 21405 }, { "epoch": 0.58, "learning_rate": 0.0008060942837555882, "loss": 2.8611, "step": 21406 }, { "epoch": 0.58, "learning_rate": 0.0008060088972857299, "loss": 2.2133, "step": 21407 }, { "epoch": 0.58, "learning_rate": 0.0008059235122855134, "loss": 2.734, "step": 21408 }, { "epoch": 0.58, "learning_rate": 0.0008058381287555856, "loss": 2.4893, "step": 21409 }, { "epoch": 0.58, "learning_rate": 0.0008057527466965937, "loss": 2.2278, "step": 21410 }, { "epoch": 0.58, "learning_rate": 0.000805667366109184, "loss": 2.5448, "step": 21411 }, { "epoch": 0.58, "learning_rate": 0.0008055819869940037, "loss": 2.3986, "step": 21412 }, { "epoch": 0.58, "learning_rate": 0.0008054966093516998, "loss": 2.5436, "step": 21413 }, { "epoch": 0.58, "learning_rate": 0.0008054112331829182, "loss": 2.6836, "step": 21414 }, { "epoch": 0.58, "learning_rate": 0.0008053258584883071, "loss": 2.279, "step": 21415 }, { "epoch": 0.58, "learning_rate": 0.0008052404852685119, "loss": 3.0478, "step": 21416 }, { "epoch": 0.58, "learning_rate": 0.0008051551135241801, "loss": 2.9072, "step": 21417 }, { "epoch": 0.58, "learning_rate": 0.0008050697432559584, "loss": 2.6739, "step": 21418 }, { "epoch": 0.58, "learning_rate": 0.0008049843744644933, "loss": 2.5631, "step": 21419 }, { "epoch": 0.58, "learning_rate": 0.0008048990071504316, "loss": 2.4384, "step": 21420 }, { "epoch": 0.58, "learning_rate": 0.0008048136413144205, "loss": 2.6303, "step": 21421 }, { "epoch": 0.58, "learning_rate": 0.0008047282769571061, "loss": 2.2493, "step": 21422 }, { "epoch": 0.58, "learning_rate": 0.0008046429140791357, "loss": 2.5019, "step": 21423 }, { "epoch": 0.58, "learning_rate": 0.0008045575526811553, "loss": 2.2979, "step": 21424 }, { "epoch": 0.58, "learning_rate": 0.000804472192763812, "loss": 2.1448, "step": 21425 }, { "epoch": 0.58, "learning_rate": 0.0008043868343277526, "loss": 2.3581, "step": 21426 }, { "epoch": 0.58, "learning_rate": 0.0008043014773736234, "loss": 2.4793, "step": 21427 }, { "epoch": 0.58, "learning_rate": 0.0008042161219020712, "loss": 2.1307, "step": 21428 }, { "epoch": 0.58, "learning_rate": 0.0008041307679137429, "loss": 2.2846, "step": 21429 }, { "epoch": 0.58, "learning_rate": 0.0008040454154092844, "loss": 2.2731, "step": 21430 }, { "epoch": 0.58, "learning_rate": 0.0008039600643893435, "loss": 2.4423, "step": 21431 }, { "epoch": 0.58, "learning_rate": 0.0008038747148545656, "loss": 2.7893, "step": 21432 }, { "epoch": 0.58, "learning_rate": 0.0008037893668055979, "loss": 2.5679, "step": 21433 }, { "epoch": 0.58, "learning_rate": 0.000803704020243087, "loss": 2.1566, "step": 21434 }, { "epoch": 0.58, "learning_rate": 0.0008036186751676791, "loss": 2.3533, "step": 21435 }, { "epoch": 0.58, "learning_rate": 0.0008035333315800211, "loss": 2.8462, "step": 21436 }, { "epoch": 0.58, "learning_rate": 0.0008034479894807596, "loss": 2.9942, "step": 21437 }, { "epoch": 0.58, "learning_rate": 0.0008033626488705408, "loss": 2.3733, "step": 21438 }, { "epoch": 0.58, "learning_rate": 0.0008032773097500115, "loss": 2.6523, "step": 21439 }, { "epoch": 0.58, "learning_rate": 0.0008031919721198182, "loss": 2.7225, "step": 21440 }, { "epoch": 0.58, "learning_rate": 0.0008031066359806072, "loss": 2.2967, "step": 21441 }, { "epoch": 0.58, "learning_rate": 0.0008030213013330255, "loss": 2.9559, "step": 21442 }, { "epoch": 0.58, "learning_rate": 0.0008029359681777186, "loss": 2.1284, "step": 21443 }, { "epoch": 0.58, "learning_rate": 0.0008028506365153337, "loss": 2.4593, "step": 21444 }, { "epoch": 0.58, "learning_rate": 0.0008027653063465177, "loss": 2.4803, "step": 21445 }, { "epoch": 0.58, "learning_rate": 0.000802679977671916, "loss": 2.6714, "step": 21446 }, { "epoch": 0.58, "learning_rate": 0.0008025946504921753, "loss": 2.4567, "step": 21447 }, { "epoch": 0.58, "learning_rate": 0.0008025093248079429, "loss": 2.5589, "step": 21448 }, { "epoch": 0.58, "learning_rate": 0.0008024240006198641, "loss": 2.4414, "step": 21449 }, { "epoch": 0.58, "learning_rate": 0.000802338677928586, "loss": 2.8359, "step": 21450 }, { "epoch": 0.58, "learning_rate": 0.0008022533567347544, "loss": 2.3299, "step": 21451 }, { "epoch": 0.58, "learning_rate": 0.0008021680370390161, "loss": 2.135, "step": 21452 }, { "epoch": 0.58, "learning_rate": 0.0008020827188420176, "loss": 2.6465, "step": 21453 }, { "epoch": 0.58, "learning_rate": 0.0008019974021444047, "loss": 2.1342, "step": 21454 }, { "epoch": 0.58, "learning_rate": 0.0008019120869468243, "loss": 2.2545, "step": 21455 }, { "epoch": 0.58, "learning_rate": 0.0008018267732499225, "loss": 2.0683, "step": 21456 }, { "epoch": 0.58, "learning_rate": 0.0008017414610543457, "loss": 2.5941, "step": 21457 }, { "epoch": 0.58, "learning_rate": 0.0008016561503607402, "loss": 2.7697, "step": 21458 }, { "epoch": 0.58, "learning_rate": 0.0008015708411697521, "loss": 2.7672, "step": 21459 }, { "epoch": 0.58, "learning_rate": 0.0008014855334820275, "loss": 3.051, "step": 21460 }, { "epoch": 0.58, "learning_rate": 0.0008014002272982137, "loss": 2.7515, "step": 21461 }, { "epoch": 0.58, "learning_rate": 0.0008013149226189559, "loss": 2.427, "step": 21462 }, { "epoch": 0.58, "learning_rate": 0.0008012296194449007, "loss": 2.4842, "step": 21463 }, { "epoch": 0.58, "learning_rate": 0.0008011443177766946, "loss": 2.79, "step": 21464 }, { "epoch": 0.58, "learning_rate": 0.0008010590176149833, "loss": 1.8817, "step": 21465 }, { "epoch": 0.58, "learning_rate": 0.0008009737189604135, "loss": 2.396, "step": 21466 }, { "epoch": 0.58, "learning_rate": 0.000800888421813631, "loss": 2.1622, "step": 21467 }, { "epoch": 0.58, "learning_rate": 0.0008008031261752823, "loss": 2.3983, "step": 21468 }, { "epoch": 0.58, "learning_rate": 0.0008007178320460137, "loss": 2.2421, "step": 21469 }, { "epoch": 0.58, "learning_rate": 0.000800632539426471, "loss": 2.6249, "step": 21470 }, { "epoch": 0.58, "learning_rate": 0.0008005472483173005, "loss": 2.2517, "step": 21471 }, { "epoch": 0.58, "learning_rate": 0.0008004619587191488, "loss": 3.0239, "step": 21472 }, { "epoch": 0.58, "learning_rate": 0.0008003766706326609, "loss": 2.579, "step": 21473 }, { "epoch": 0.58, "learning_rate": 0.000800291384058484, "loss": 2.5578, "step": 21474 }, { "epoch": 0.58, "learning_rate": 0.0008002060989972644, "loss": 2.8335, "step": 21475 }, { "epoch": 0.58, "learning_rate": 0.0008001208154496471, "loss": 2.6289, "step": 21476 }, { "epoch": 0.58, "learning_rate": 0.000800035533416279, "loss": 2.7302, "step": 21477 }, { "epoch": 0.58, "learning_rate": 0.0007999502528978057, "loss": 2.6164, "step": 21478 }, { "epoch": 0.58, "learning_rate": 0.0007998649738948736, "loss": 1.9753, "step": 21479 }, { "epoch": 0.58, "learning_rate": 0.0007997796964081288, "loss": 2.5517, "step": 21480 }, { "epoch": 0.58, "learning_rate": 0.000799694420438217, "loss": 2.5814, "step": 21481 }, { "epoch": 0.58, "learning_rate": 0.0007996091459857845, "loss": 2.3233, "step": 21482 }, { "epoch": 0.58, "learning_rate": 0.0007995238730514776, "loss": 3.0818, "step": 21483 }, { "epoch": 0.58, "learning_rate": 0.0007994386016359417, "loss": 2.8183, "step": 21484 }, { "epoch": 0.58, "learning_rate": 0.0007993533317398234, "loss": 2.7463, "step": 21485 }, { "epoch": 0.58, "learning_rate": 0.0007992680633637679, "loss": 2.4864, "step": 21486 }, { "epoch": 0.58, "learning_rate": 0.0007991827965084218, "loss": 2.448, "step": 21487 }, { "epoch": 0.58, "learning_rate": 0.0007990975311744314, "loss": 2.4697, "step": 21488 }, { "epoch": 0.58, "learning_rate": 0.0007990122673624417, "loss": 2.6075, "step": 21489 }, { "epoch": 0.58, "learning_rate": 0.000798927005073099, "loss": 3.111, "step": 21490 }, { "epoch": 0.58, "learning_rate": 0.0007988417443070499, "loss": 2.5444, "step": 21491 }, { "epoch": 0.58, "learning_rate": 0.0007987564850649395, "loss": 2.4158, "step": 21492 }, { "epoch": 0.58, "learning_rate": 0.0007986712273474142, "loss": 2.4909, "step": 21493 }, { "epoch": 0.58, "learning_rate": 0.0007985859711551193, "loss": 2.7398, "step": 21494 }, { "epoch": 0.58, "learning_rate": 0.0007985007164887011, "loss": 2.6712, "step": 21495 }, { "epoch": 0.58, "learning_rate": 0.0007984154633488058, "loss": 2.3238, "step": 21496 }, { "epoch": 0.58, "learning_rate": 0.0007983302117360786, "loss": 2.5788, "step": 21497 }, { "epoch": 0.58, "learning_rate": 0.0007982449616511657, "loss": 2.7152, "step": 21498 }, { "epoch": 0.58, "learning_rate": 0.0007981597130947132, "loss": 2.615, "step": 21499 }, { "epoch": 0.58, "learning_rate": 0.0007980744660673662, "loss": 2.1778, "step": 21500 }, { "epoch": 0.58, "learning_rate": 0.0007979892205697716, "loss": 2.6317, "step": 21501 }, { "epoch": 0.58, "learning_rate": 0.000797903976602574, "loss": 2.6476, "step": 21502 }, { "epoch": 0.58, "learning_rate": 0.0007978187341664194, "loss": 2.5643, "step": 21503 }, { "epoch": 0.58, "learning_rate": 0.0007977334932619548, "loss": 2.032, "step": 21504 }, { "epoch": 0.58, "learning_rate": 0.0007976482538898245, "loss": 2.6299, "step": 21505 }, { "epoch": 0.58, "learning_rate": 0.000797563016050675, "loss": 2.4295, "step": 21506 }, { "epoch": 0.58, "learning_rate": 0.000797477779745152, "loss": 2.8753, "step": 21507 }, { "epoch": 0.58, "learning_rate": 0.000797392544973901, "loss": 2.3035, "step": 21508 }, { "epoch": 0.58, "learning_rate": 0.0007973073117375678, "loss": 2.7073, "step": 21509 }, { "epoch": 0.58, "learning_rate": 0.0007972220800367984, "loss": 2.3386, "step": 21510 }, { "epoch": 0.58, "learning_rate": 0.000797136849872238, "loss": 2.4072, "step": 21511 }, { "epoch": 0.58, "learning_rate": 0.0007970516212445329, "loss": 2.5716, "step": 21512 }, { "epoch": 0.58, "learning_rate": 0.0007969663941543282, "loss": 2.1638, "step": 21513 }, { "epoch": 0.58, "learning_rate": 0.0007968811686022697, "loss": 2.3891, "step": 21514 }, { "epoch": 0.58, "learning_rate": 0.0007967959445890035, "loss": 2.63, "step": 21515 }, { "epoch": 0.58, "learning_rate": 0.0007967107221151744, "loss": 2.5247, "step": 21516 }, { "epoch": 0.58, "learning_rate": 0.0007966255011814287, "loss": 2.6501, "step": 21517 }, { "epoch": 0.58, "learning_rate": 0.0007965402817884124, "loss": 2.5985, "step": 21518 }, { "epoch": 0.58, "learning_rate": 0.0007964550639367698, "loss": 2.4752, "step": 21519 }, { "epoch": 0.58, "learning_rate": 0.0007963698476271477, "loss": 2.2865, "step": 21520 }, { "epoch": 0.58, "learning_rate": 0.0007962846328601911, "loss": 2.8306, "step": 21521 }, { "epoch": 0.58, "learning_rate": 0.0007961994196365455, "loss": 2.0667, "step": 21522 }, { "epoch": 0.58, "learning_rate": 0.0007961142079568569, "loss": 2.4659, "step": 21523 }, { "epoch": 0.58, "learning_rate": 0.0007960289978217705, "loss": 2.4973, "step": 21524 }, { "epoch": 0.58, "learning_rate": 0.0007959437892319319, "loss": 2.5495, "step": 21525 }, { "epoch": 0.58, "learning_rate": 0.0007958585821879869, "loss": 2.4782, "step": 21526 }, { "epoch": 0.58, "learning_rate": 0.0007957733766905805, "loss": 2.6802, "step": 21527 }, { "epoch": 0.58, "learning_rate": 0.0007956881727403589, "loss": 2.6612, "step": 21528 }, { "epoch": 0.58, "learning_rate": 0.0007956029703379666, "loss": 2.1202, "step": 21529 }, { "epoch": 0.58, "learning_rate": 0.0007955177694840499, "loss": 2.21, "step": 21530 }, { "epoch": 0.58, "learning_rate": 0.0007954325701792544, "loss": 2.7716, "step": 21531 }, { "epoch": 0.58, "learning_rate": 0.0007953473724242248, "loss": 2.209, "step": 21532 }, { "epoch": 0.58, "learning_rate": 0.0007952621762196066, "loss": 2.6077, "step": 21533 }, { "epoch": 0.58, "learning_rate": 0.0007951769815660462, "loss": 2.2882, "step": 21534 }, { "epoch": 0.58, "learning_rate": 0.0007950917884641881, "loss": 2.3316, "step": 21535 }, { "epoch": 0.58, "learning_rate": 0.0007950065969146781, "loss": 1.9197, "step": 21536 }, { "epoch": 0.58, "learning_rate": 0.0007949214069181611, "loss": 1.7751, "step": 21537 }, { "epoch": 0.58, "learning_rate": 0.000794836218475283, "loss": 2.4683, "step": 21538 }, { "epoch": 0.58, "learning_rate": 0.0007947510315866892, "loss": 2.4961, "step": 21539 }, { "epoch": 0.58, "learning_rate": 0.0007946658462530249, "loss": 2.5186, "step": 21540 }, { "epoch": 0.58, "learning_rate": 0.0007945806624749352, "loss": 2.8407, "step": 21541 }, { "epoch": 0.58, "learning_rate": 0.0007944954802530659, "loss": 2.5441, "step": 21542 }, { "epoch": 0.58, "learning_rate": 0.000794410299588062, "loss": 2.4875, "step": 21543 }, { "epoch": 0.58, "learning_rate": 0.0007943251204805692, "loss": 2.3495, "step": 21544 }, { "epoch": 0.58, "learning_rate": 0.0007942399429312321, "loss": 3.2388, "step": 21545 }, { "epoch": 0.58, "learning_rate": 0.0007941547669406963, "loss": 2.7508, "step": 21546 }, { "epoch": 0.58, "learning_rate": 0.0007940695925096079, "loss": 2.6095, "step": 21547 }, { "epoch": 0.58, "learning_rate": 0.0007939844196386108, "loss": 2.49, "step": 21548 }, { "epoch": 0.58, "learning_rate": 0.0007938992483283511, "loss": 2.4662, "step": 21549 }, { "epoch": 0.58, "learning_rate": 0.0007938140785794739, "loss": 2.4447, "step": 21550 }, { "epoch": 0.58, "learning_rate": 0.0007937289103926242, "loss": 2.3643, "step": 21551 }, { "epoch": 0.58, "learning_rate": 0.0007936437437684473, "loss": 2.252, "step": 21552 }, { "epoch": 0.58, "learning_rate": 0.000793558578707589, "loss": 2.6098, "step": 21553 }, { "epoch": 0.58, "learning_rate": 0.0007934734152106936, "loss": 2.2953, "step": 21554 }, { "epoch": 0.58, "learning_rate": 0.0007933882532784069, "loss": 2.4337, "step": 21555 }, { "epoch": 0.58, "learning_rate": 0.0007933030929113737, "loss": 2.5733, "step": 21556 }, { "epoch": 0.58, "learning_rate": 0.0007932179341102394, "loss": 2.6161, "step": 21557 }, { "epoch": 0.58, "learning_rate": 0.0007931327768756493, "loss": 2.5374, "step": 21558 }, { "epoch": 0.58, "learning_rate": 0.0007930476212082477, "loss": 2.5689, "step": 21559 }, { "epoch": 0.58, "learning_rate": 0.0007929624671086805, "loss": 2.5623, "step": 21560 }, { "epoch": 0.58, "learning_rate": 0.0007928773145775931, "loss": 2.5204, "step": 21561 }, { "epoch": 0.58, "learning_rate": 0.0007927921636156299, "loss": 2.7082, "step": 21562 }, { "epoch": 0.58, "learning_rate": 0.0007927070142234363, "loss": 2.3705, "step": 21563 }, { "epoch": 0.58, "learning_rate": 0.0007926218664016569, "loss": 2.682, "step": 21564 }, { "epoch": 0.58, "learning_rate": 0.0007925367201509374, "loss": 2.6792, "step": 21565 }, { "epoch": 0.58, "learning_rate": 0.0007924515754719227, "loss": 2.4731, "step": 21566 }, { "epoch": 0.58, "learning_rate": 0.0007923664323652576, "loss": 2.3551, "step": 21567 }, { "epoch": 0.58, "learning_rate": 0.0007922812908315873, "loss": 2.3288, "step": 21568 }, { "epoch": 0.58, "learning_rate": 0.000792196150871557, "loss": 2.5939, "step": 21569 }, { "epoch": 0.58, "learning_rate": 0.0007921110124858113, "loss": 2.3885, "step": 21570 }, { "epoch": 0.58, "learning_rate": 0.0007920258756749959, "loss": 2.5652, "step": 21571 }, { "epoch": 0.58, "learning_rate": 0.0007919407404397545, "loss": 2.5314, "step": 21572 }, { "epoch": 0.58, "learning_rate": 0.0007918556067807332, "loss": 2.473, "step": 21573 }, { "epoch": 0.58, "learning_rate": 0.000791770474698577, "loss": 2.4155, "step": 21574 }, { "epoch": 0.58, "learning_rate": 0.0007916853441939298, "loss": 2.6887, "step": 21575 }, { "epoch": 0.58, "learning_rate": 0.0007916002152674373, "loss": 2.6134, "step": 21576 }, { "epoch": 0.58, "learning_rate": 0.0007915150879197448, "loss": 2.5823, "step": 21577 }, { "epoch": 0.58, "learning_rate": 0.0007914299621514963, "loss": 2.0909, "step": 21578 }, { "epoch": 0.58, "learning_rate": 0.0007913448379633374, "loss": 2.3511, "step": 21579 }, { "epoch": 0.58, "learning_rate": 0.0007912597153559124, "loss": 2.066, "step": 21580 }, { "epoch": 0.58, "learning_rate": 0.0007911745943298666, "loss": 2.3917, "step": 21581 }, { "epoch": 0.58, "learning_rate": 0.0007910894748858449, "loss": 2.5671, "step": 21582 }, { "epoch": 0.58, "learning_rate": 0.0007910043570244917, "loss": 2.6655, "step": 21583 }, { "epoch": 0.58, "learning_rate": 0.0007909192407464521, "loss": 1.9979, "step": 21584 }, { "epoch": 0.58, "learning_rate": 0.0007908341260523713, "loss": 2.5626, "step": 21585 }, { "epoch": 0.58, "learning_rate": 0.0007907490129428935, "loss": 2.7138, "step": 21586 }, { "epoch": 0.58, "learning_rate": 0.0007906639014186637, "loss": 2.4204, "step": 21587 }, { "epoch": 0.58, "learning_rate": 0.000790578791480327, "loss": 3.0368, "step": 21588 }, { "epoch": 0.58, "learning_rate": 0.0007904936831285279, "loss": 2.5545, "step": 21589 }, { "epoch": 0.58, "learning_rate": 0.0007904085763639114, "loss": 2.5653, "step": 21590 }, { "epoch": 0.58, "learning_rate": 0.0007903234711871217, "loss": 2.766, "step": 21591 }, { "epoch": 0.58, "learning_rate": 0.0007902383675988038, "loss": 2.6762, "step": 21592 }, { "epoch": 0.58, "learning_rate": 0.000790153265599603, "loss": 2.5532, "step": 21593 }, { "epoch": 0.58, "learning_rate": 0.0007900681651901631, "loss": 2.2129, "step": 21594 }, { "epoch": 0.58, "learning_rate": 0.0007899830663711294, "loss": 2.8219, "step": 21595 }, { "epoch": 0.58, "learning_rate": 0.0007898979691431465, "loss": 2.6861, "step": 21596 }, { "epoch": 0.58, "learning_rate": 0.000789812873506859, "loss": 2.1483, "step": 21597 }, { "epoch": 0.58, "learning_rate": 0.0007897277794629116, "loss": 2.4907, "step": 21598 }, { "epoch": 0.58, "learning_rate": 0.0007896426870119489, "loss": 2.521, "step": 21599 }, { "epoch": 0.58, "learning_rate": 0.0007895575961546154, "loss": 2.0072, "step": 21600 }, { "epoch": 0.58, "learning_rate": 0.0007894725068915562, "loss": 2.9562, "step": 21601 }, { "epoch": 0.58, "learning_rate": 0.0007893874192234156, "loss": 2.3287, "step": 21602 }, { "epoch": 0.58, "learning_rate": 0.0007893023331508382, "loss": 2.7174, "step": 21603 }, { "epoch": 0.58, "learning_rate": 0.000789217248674469, "loss": 2.3993, "step": 21604 }, { "epoch": 0.58, "learning_rate": 0.0007891321657949517, "loss": 2.3282, "step": 21605 }, { "epoch": 0.58, "learning_rate": 0.000789047084512932, "loss": 2.5015, "step": 21606 }, { "epoch": 0.58, "learning_rate": 0.0007889620048290533, "loss": 2.2362, "step": 21607 }, { "epoch": 0.58, "learning_rate": 0.0007888769267439609, "loss": 2.4187, "step": 21608 }, { "epoch": 0.58, "learning_rate": 0.0007887918502582994, "loss": 2.7475, "step": 21609 }, { "epoch": 0.58, "learning_rate": 0.0007887067753727128, "loss": 2.326, "step": 21610 }, { "epoch": 0.58, "learning_rate": 0.0007886217020878457, "loss": 2.8161, "step": 21611 }, { "epoch": 0.58, "learning_rate": 0.0007885366304043434, "loss": 2.7671, "step": 21612 }, { "epoch": 0.58, "learning_rate": 0.0007884515603228492, "loss": 2.6237, "step": 21613 }, { "epoch": 0.58, "learning_rate": 0.0007883664918440085, "loss": 2.2442, "step": 21614 }, { "epoch": 0.58, "learning_rate": 0.0007882814249684653, "loss": 2.0061, "step": 21615 }, { "epoch": 0.58, "learning_rate": 0.0007881963596968642, "loss": 2.3349, "step": 21616 }, { "epoch": 0.58, "learning_rate": 0.00078811129602985, "loss": 2.9492, "step": 21617 }, { "epoch": 0.58, "learning_rate": 0.0007880262339680659, "loss": 2.6343, "step": 21618 }, { "epoch": 0.58, "learning_rate": 0.0007879411735121576, "loss": 2.5051, "step": 21619 }, { "epoch": 0.58, "learning_rate": 0.0007878561146627694, "loss": 2.73, "step": 21620 }, { "epoch": 0.58, "learning_rate": 0.0007877710574205449, "loss": 2.7891, "step": 21621 }, { "epoch": 0.58, "learning_rate": 0.0007876860017861287, "loss": 1.8772, "step": 21622 }, { "epoch": 0.58, "learning_rate": 0.0007876009477601661, "loss": 2.5623, "step": 21623 }, { "epoch": 0.58, "learning_rate": 0.0007875158953433004, "loss": 2.4408, "step": 21624 }, { "epoch": 0.58, "learning_rate": 0.0007874308445361763, "loss": 2.3682, "step": 21625 }, { "epoch": 0.58, "learning_rate": 0.000787345795339438, "loss": 2.4276, "step": 21626 }, { "epoch": 0.58, "learning_rate": 0.0007872607477537299, "loss": 2.7235, "step": 21627 }, { "epoch": 0.58, "learning_rate": 0.0007871757017796966, "loss": 2.4033, "step": 21628 }, { "epoch": 0.58, "learning_rate": 0.0007870906574179819, "loss": 2.7978, "step": 21629 }, { "epoch": 0.58, "learning_rate": 0.0007870056146692304, "loss": 2.5157, "step": 21630 }, { "epoch": 0.58, "learning_rate": 0.0007869205735340864, "loss": 2.5706, "step": 21631 }, { "epoch": 0.58, "learning_rate": 0.0007868355340131939, "loss": 2.6808, "step": 21632 }, { "epoch": 0.58, "learning_rate": 0.0007867504961071977, "loss": 2.6054, "step": 21633 }, { "epoch": 0.58, "learning_rate": 0.0007866654598167411, "loss": 2.7512, "step": 21634 }, { "epoch": 0.58, "learning_rate": 0.0007865804251424686, "loss": 2.6794, "step": 21635 }, { "epoch": 0.58, "learning_rate": 0.0007864953920850253, "loss": 2.5648, "step": 21636 }, { "epoch": 0.58, "learning_rate": 0.0007864103606450545, "loss": 2.6517, "step": 21637 }, { "epoch": 0.58, "learning_rate": 0.0007863253308232004, "loss": 2.8676, "step": 21638 }, { "epoch": 0.58, "learning_rate": 0.0007862403026201077, "loss": 2.3047, "step": 21639 }, { "epoch": 0.58, "learning_rate": 0.00078615527603642, "loss": 2.3955, "step": 21640 }, { "epoch": 0.58, "learning_rate": 0.000786070251072782, "loss": 2.403, "step": 21641 }, { "epoch": 0.58, "learning_rate": 0.0007859852277298372, "loss": 2.7045, "step": 21642 }, { "epoch": 0.58, "learning_rate": 0.0007859002060082301, "loss": 2.4591, "step": 21643 }, { "epoch": 0.58, "learning_rate": 0.0007858151859086051, "loss": 2.5781, "step": 21644 }, { "epoch": 0.58, "learning_rate": 0.0007857301674316055, "loss": 2.2434, "step": 21645 }, { "epoch": 0.58, "learning_rate": 0.000785645150577876, "loss": 2.7429, "step": 21646 }, { "epoch": 0.58, "learning_rate": 0.0007855601353480609, "loss": 2.459, "step": 21647 }, { "epoch": 0.58, "learning_rate": 0.0007854751217428033, "loss": 2.4226, "step": 21648 }, { "epoch": 0.58, "learning_rate": 0.0007853901097627484, "loss": 2.6267, "step": 21649 }, { "epoch": 0.58, "learning_rate": 0.0007853050994085393, "loss": 2.2802, "step": 21650 }, { "epoch": 0.58, "learning_rate": 0.0007852200906808203, "loss": 2.0055, "step": 21651 }, { "epoch": 0.58, "learning_rate": 0.0007851350835802357, "loss": 2.4775, "step": 21652 }, { "epoch": 0.58, "learning_rate": 0.0007850500781074291, "loss": 2.4007, "step": 21653 }, { "epoch": 0.58, "learning_rate": 0.0007849650742630447, "loss": 2.0412, "step": 21654 }, { "epoch": 0.58, "learning_rate": 0.0007848800720477267, "loss": 2.403, "step": 21655 }, { "epoch": 0.58, "learning_rate": 0.0007847950714621186, "loss": 3.0576, "step": 21656 }, { "epoch": 0.58, "learning_rate": 0.0007847100725068646, "loss": 2.599, "step": 21657 }, { "epoch": 0.58, "learning_rate": 0.0007846250751826086, "loss": 2.8259, "step": 21658 }, { "epoch": 0.58, "learning_rate": 0.0007845400794899944, "loss": 2.4941, "step": 21659 }, { "epoch": 0.58, "learning_rate": 0.0007844550854296666, "loss": 2.6757, "step": 21660 }, { "epoch": 0.58, "learning_rate": 0.0007843700930022678, "loss": 2.5636, "step": 21661 }, { "epoch": 0.58, "learning_rate": 0.0007842851022084429, "loss": 2.2295, "step": 21662 }, { "epoch": 0.58, "learning_rate": 0.0007842001130488359, "loss": 2.7082, "step": 21663 }, { "epoch": 0.58, "learning_rate": 0.0007841151255240897, "loss": 2.3385, "step": 21664 }, { "epoch": 0.58, "learning_rate": 0.0007840301396348486, "loss": 2.5425, "step": 21665 }, { "epoch": 0.58, "learning_rate": 0.0007839451553817572, "loss": 2.3987, "step": 21666 }, { "epoch": 0.58, "learning_rate": 0.0007838601727654582, "loss": 2.6327, "step": 21667 }, { "epoch": 0.58, "learning_rate": 0.0007837751917865963, "loss": 2.5307, "step": 21668 }, { "epoch": 0.58, "learning_rate": 0.0007836902124458145, "loss": 2.8111, "step": 21669 }, { "epoch": 0.58, "learning_rate": 0.000783605234743757, "loss": 2.2192, "step": 21670 }, { "epoch": 0.58, "learning_rate": 0.0007835202586810678, "loss": 2.1629, "step": 21671 }, { "epoch": 0.58, "learning_rate": 0.0007834352842583901, "loss": 2.7697, "step": 21672 }, { "epoch": 0.58, "learning_rate": 0.0007833503114763681, "loss": 2.3035, "step": 21673 }, { "epoch": 0.58, "learning_rate": 0.0007832653403356455, "loss": 2.3617, "step": 21674 }, { "epoch": 0.58, "learning_rate": 0.0007831803708368658, "loss": 2.6255, "step": 21675 }, { "epoch": 0.58, "learning_rate": 0.0007830954029806734, "loss": 2.4431, "step": 21676 }, { "epoch": 0.58, "learning_rate": 0.0007830104367677108, "loss": 2.3569, "step": 21677 }, { "epoch": 0.58, "learning_rate": 0.0007829254721986222, "loss": 2.565, "step": 21678 }, { "epoch": 0.58, "learning_rate": 0.000782840509274052, "loss": 2.3262, "step": 21679 }, { "epoch": 0.58, "learning_rate": 0.000782755547994643, "loss": 2.459, "step": 21680 }, { "epoch": 0.58, "learning_rate": 0.000782670588361039, "loss": 2.819, "step": 21681 }, { "epoch": 0.58, "learning_rate": 0.0007825856303738841, "loss": 2.4569, "step": 21682 }, { "epoch": 0.58, "learning_rate": 0.0007825006740338212, "loss": 2.3374, "step": 21683 }, { "epoch": 0.58, "learning_rate": 0.0007824157193414947, "loss": 2.3935, "step": 21684 }, { "epoch": 0.58, "learning_rate": 0.0007823307662975475, "loss": 3.0162, "step": 21685 }, { "epoch": 0.58, "learning_rate": 0.0007822458149026235, "loss": 2.3449, "step": 21686 }, { "epoch": 0.58, "learning_rate": 0.0007821608651573665, "loss": 2.6695, "step": 21687 }, { "epoch": 0.58, "learning_rate": 0.0007820759170624196, "loss": 2.9062, "step": 21688 }, { "epoch": 0.58, "learning_rate": 0.0007819909706184268, "loss": 2.4906, "step": 21689 }, { "epoch": 0.58, "learning_rate": 0.0007819060258260315, "loss": 2.5793, "step": 21690 }, { "epoch": 0.58, "learning_rate": 0.0007818210826858767, "loss": 2.6388, "step": 21691 }, { "epoch": 0.58, "learning_rate": 0.0007817361411986071, "loss": 2.4813, "step": 21692 }, { "epoch": 0.58, "learning_rate": 0.0007816512013648648, "loss": 2.4534, "step": 21693 }, { "epoch": 0.58, "learning_rate": 0.0007815662631852942, "loss": 2.35, "step": 21694 }, { "epoch": 0.58, "learning_rate": 0.0007814813266605387, "loss": 2.3401, "step": 21695 }, { "epoch": 0.58, "learning_rate": 0.0007813963917912413, "loss": 2.6126, "step": 21696 }, { "epoch": 0.58, "learning_rate": 0.0007813114585780459, "loss": 2.2822, "step": 21697 }, { "epoch": 0.58, "learning_rate": 0.000781226527021596, "loss": 2.3549, "step": 21698 }, { "epoch": 0.58, "learning_rate": 0.0007811415971225344, "loss": 2.1514, "step": 21699 }, { "epoch": 0.58, "learning_rate": 0.0007810566688815051, "loss": 2.4558, "step": 21700 }, { "epoch": 0.58, "learning_rate": 0.0007809717422991515, "loss": 2.2937, "step": 21701 }, { "epoch": 0.58, "learning_rate": 0.0007808868173761165, "loss": 2.6623, "step": 21702 }, { "epoch": 0.58, "learning_rate": 0.0007808018941130444, "loss": 3.0648, "step": 21703 }, { "epoch": 0.58, "learning_rate": 0.0007807169725105772, "loss": 2.5581, "step": 21704 }, { "epoch": 0.58, "learning_rate": 0.0007806320525693593, "loss": 2.5575, "step": 21705 }, { "epoch": 0.58, "learning_rate": 0.0007805471342900341, "loss": 2.0923, "step": 21706 }, { "epoch": 0.58, "learning_rate": 0.0007804622176732442, "loss": 2.5765, "step": 21707 }, { "epoch": 0.58, "learning_rate": 0.0007803773027196332, "loss": 2.6954, "step": 21708 }, { "epoch": 0.58, "learning_rate": 0.000780292389429845, "loss": 2.5649, "step": 21709 }, { "epoch": 0.58, "learning_rate": 0.0007802074778045219, "loss": 2.8086, "step": 21710 }, { "epoch": 0.58, "learning_rate": 0.0007801225678443079, "loss": 2.4612, "step": 21711 }, { "epoch": 0.58, "learning_rate": 0.0007800376595498459, "loss": 2.8109, "step": 21712 }, { "epoch": 0.58, "learning_rate": 0.0007799527529217792, "loss": 2.5012, "step": 21713 }, { "epoch": 0.58, "learning_rate": 0.0007798678479607513, "loss": 2.1549, "step": 21714 }, { "epoch": 0.58, "learning_rate": 0.000779782944667405, "loss": 2.7024, "step": 21715 }, { "epoch": 0.58, "learning_rate": 0.0007796980430423838, "loss": 2.4555, "step": 21716 }, { "epoch": 0.58, "learning_rate": 0.0007796131430863309, "loss": 2.7861, "step": 21717 }, { "epoch": 0.58, "learning_rate": 0.0007795282447998894, "loss": 2.6972, "step": 21718 }, { "epoch": 0.58, "learning_rate": 0.0007794433481837029, "loss": 2.3374, "step": 21719 }, { "epoch": 0.58, "learning_rate": 0.0007793584532384137, "loss": 2.3143, "step": 21720 }, { "epoch": 0.58, "learning_rate": 0.0007792735599646652, "loss": 2.1647, "step": 21721 }, { "epoch": 0.58, "learning_rate": 0.0007791886683631013, "loss": 2.2083, "step": 21722 }, { "epoch": 0.58, "learning_rate": 0.0007791037784343642, "loss": 2.313, "step": 21723 }, { "epoch": 0.58, "learning_rate": 0.0007790188901790975, "loss": 2.3163, "step": 21724 }, { "epoch": 0.58, "learning_rate": 0.0007789340035979442, "loss": 1.8751, "step": 21725 }, { "epoch": 0.58, "learning_rate": 0.0007788491186915473, "loss": 2.4834, "step": 21726 }, { "epoch": 0.58, "learning_rate": 0.0007787642354605501, "loss": 2.0511, "step": 21727 }, { "epoch": 0.58, "learning_rate": 0.0007786793539055953, "loss": 2.6745, "step": 21728 }, { "epoch": 0.58, "learning_rate": 0.000778594474027326, "loss": 2.5189, "step": 21729 }, { "epoch": 0.58, "learning_rate": 0.0007785095958263859, "loss": 2.4246, "step": 21730 }, { "epoch": 0.58, "learning_rate": 0.0007784247193034171, "loss": 2.6596, "step": 21731 }, { "epoch": 0.58, "learning_rate": 0.0007783398444590631, "loss": 2.4761, "step": 21732 }, { "epoch": 0.58, "learning_rate": 0.0007782549712939671, "loss": 2.687, "step": 21733 }, { "epoch": 0.58, "learning_rate": 0.0007781700998087712, "loss": 2.8084, "step": 21734 }, { "epoch": 0.58, "learning_rate": 0.0007780852300041192, "loss": 2.5932, "step": 21735 }, { "epoch": 0.58, "learning_rate": 0.0007780003618806543, "loss": 3.1197, "step": 21736 }, { "epoch": 0.58, "learning_rate": 0.0007779154954390184, "loss": 2.6626, "step": 21737 }, { "epoch": 0.58, "learning_rate": 0.0007778306306798554, "loss": 2.5253, "step": 21738 }, { "epoch": 0.58, "learning_rate": 0.0007777457676038075, "loss": 2.4964, "step": 21739 }, { "epoch": 0.58, "learning_rate": 0.0007776609062115178, "loss": 2.9284, "step": 21740 }, { "epoch": 0.58, "learning_rate": 0.0007775760465036298, "loss": 2.6125, "step": 21741 }, { "epoch": 0.58, "learning_rate": 0.0007774911884807856, "loss": 2.5272, "step": 21742 }, { "epoch": 0.58, "learning_rate": 0.0007774063321436284, "loss": 2.5483, "step": 21743 }, { "epoch": 0.58, "learning_rate": 0.0007773214774928011, "loss": 2.5957, "step": 21744 }, { "epoch": 0.58, "learning_rate": 0.0007772366245289464, "loss": 2.3104, "step": 21745 }, { "epoch": 0.58, "learning_rate": 0.0007771517732527075, "loss": 2.2716, "step": 21746 }, { "epoch": 0.58, "learning_rate": 0.0007770669236647264, "loss": 2.6225, "step": 21747 }, { "epoch": 0.58, "learning_rate": 0.0007769820757656467, "loss": 2.7927, "step": 21748 }, { "epoch": 0.58, "learning_rate": 0.0007768972295561112, "loss": 2.594, "step": 21749 }, { "epoch": 0.58, "learning_rate": 0.0007768123850367621, "loss": 2.7501, "step": 21750 }, { "epoch": 0.58, "learning_rate": 0.0007767275422082421, "loss": 2.2813, "step": 21751 }, { "epoch": 0.58, "learning_rate": 0.0007766427010711952, "loss": 2.7431, "step": 21752 }, { "epoch": 0.58, "learning_rate": 0.0007765578616262626, "loss": 1.9359, "step": 21753 }, { "epoch": 0.58, "learning_rate": 0.000776473023874088, "loss": 2.4864, "step": 21754 }, { "epoch": 0.58, "learning_rate": 0.0007763881878153136, "loss": 2.5738, "step": 21755 }, { "epoch": 0.58, "learning_rate": 0.0007763033534505824, "loss": 2.1582, "step": 21756 }, { "epoch": 0.58, "learning_rate": 0.000776218520780537, "loss": 2.4181, "step": 21757 }, { "epoch": 0.58, "learning_rate": 0.00077613368980582, "loss": 2.4433, "step": 21758 }, { "epoch": 0.58, "learning_rate": 0.0007760488605270742, "loss": 2.3373, "step": 21759 }, { "epoch": 0.58, "learning_rate": 0.0007759640329449423, "loss": 2.7074, "step": 21760 }, { "epoch": 0.58, "learning_rate": 0.0007758792070600666, "loss": 2.348, "step": 21761 }, { "epoch": 0.58, "learning_rate": 0.0007757943828730904, "loss": 2.733, "step": 21762 }, { "epoch": 0.58, "learning_rate": 0.0007757095603846553, "loss": 2.8627, "step": 21763 }, { "epoch": 0.58, "learning_rate": 0.0007756247395954047, "loss": 2.919, "step": 21764 }, { "epoch": 0.58, "learning_rate": 0.0007755399205059814, "loss": 2.5591, "step": 21765 }, { "epoch": 0.58, "learning_rate": 0.000775455103117027, "loss": 2.3091, "step": 21766 }, { "epoch": 0.58, "learning_rate": 0.0007753702874291845, "loss": 2.3492, "step": 21767 }, { "epoch": 0.58, "learning_rate": 0.000775285473443097, "loss": 2.3388, "step": 21768 }, { "epoch": 0.59, "learning_rate": 0.0007752006611594064, "loss": 2.963, "step": 21769 }, { "epoch": 0.59, "learning_rate": 0.0007751158505787553, "loss": 2.6789, "step": 21770 }, { "epoch": 0.59, "learning_rate": 0.0007750310417017864, "loss": 2.7872, "step": 21771 }, { "epoch": 0.59, "learning_rate": 0.000774946234529142, "loss": 2.4324, "step": 21772 }, { "epoch": 0.59, "learning_rate": 0.0007748614290614648, "loss": 2.5063, "step": 21773 }, { "epoch": 0.59, "learning_rate": 0.000774776625299397, "loss": 2.5939, "step": 21774 }, { "epoch": 0.59, "learning_rate": 0.0007746918232435814, "loss": 2.9265, "step": 21775 }, { "epoch": 0.59, "learning_rate": 0.0007746070228946602, "loss": 2.273, "step": 21776 }, { "epoch": 0.59, "learning_rate": 0.0007745222242532759, "loss": 3.0378, "step": 21777 }, { "epoch": 0.59, "learning_rate": 0.0007744374273200708, "loss": 2.1042, "step": 21778 }, { "epoch": 0.59, "learning_rate": 0.0007743526320956879, "loss": 2.2354, "step": 21779 }, { "epoch": 0.59, "learning_rate": 0.0007742678385807684, "loss": 2.3027, "step": 21780 }, { "epoch": 0.59, "learning_rate": 0.0007741830467759562, "loss": 2.4905, "step": 21781 }, { "epoch": 0.59, "learning_rate": 0.0007740982566818924, "loss": 2.6223, "step": 21782 }, { "epoch": 0.59, "learning_rate": 0.0007740134682992197, "loss": 2.5321, "step": 21783 }, { "epoch": 0.59, "learning_rate": 0.0007739286816285807, "loss": 2.6268, "step": 21784 }, { "epoch": 0.59, "learning_rate": 0.0007738438966706176, "loss": 3.1036, "step": 21785 }, { "epoch": 0.59, "learning_rate": 0.0007737591134259726, "loss": 2.7726, "step": 21786 }, { "epoch": 0.59, "learning_rate": 0.0007736743318952884, "loss": 2.3007, "step": 21787 }, { "epoch": 0.59, "learning_rate": 0.0007735895520792067, "loss": 2.197, "step": 21788 }, { "epoch": 0.59, "learning_rate": 0.0007735047739783703, "loss": 2.65, "step": 21789 }, { "epoch": 0.59, "learning_rate": 0.0007734199975934211, "loss": 2.3349, "step": 21790 }, { "epoch": 0.59, "learning_rate": 0.0007733352229250014, "loss": 2.2427, "step": 21791 }, { "epoch": 0.59, "learning_rate": 0.000773250449973754, "loss": 2.7615, "step": 21792 }, { "epoch": 0.59, "learning_rate": 0.0007731656787403199, "loss": 2.1057, "step": 21793 }, { "epoch": 0.59, "learning_rate": 0.0007730809092253425, "loss": 2.4724, "step": 21794 }, { "epoch": 0.59, "learning_rate": 0.0007729961414294637, "loss": 2.7517, "step": 21795 }, { "epoch": 0.59, "learning_rate": 0.0007729113753533254, "loss": 2.5127, "step": 21796 }, { "epoch": 0.59, "learning_rate": 0.00077282661099757, "loss": 2.9541, "step": 21797 }, { "epoch": 0.59, "learning_rate": 0.0007727418483628394, "loss": 2.7906, "step": 21798 }, { "epoch": 0.59, "learning_rate": 0.0007726570874497759, "loss": 2.7826, "step": 21799 }, { "epoch": 0.59, "learning_rate": 0.0007725723282590219, "loss": 2.698, "step": 21800 }, { "epoch": 0.59, "learning_rate": 0.000772487570791219, "loss": 2.5653, "step": 21801 }, { "epoch": 0.59, "learning_rate": 0.0007724028150470098, "loss": 2.2846, "step": 21802 }, { "epoch": 0.59, "learning_rate": 0.0007723180610270361, "loss": 2.2999, "step": 21803 }, { "epoch": 0.59, "learning_rate": 0.00077223330873194, "loss": 2.3017, "step": 21804 }, { "epoch": 0.59, "learning_rate": 0.0007721485581623639, "loss": 2.63, "step": 21805 }, { "epoch": 0.59, "learning_rate": 0.0007720638093189491, "loss": 3.2223, "step": 21806 }, { "epoch": 0.59, "learning_rate": 0.0007719790622023383, "loss": 2.7318, "step": 21807 }, { "epoch": 0.59, "learning_rate": 0.000771894316813174, "loss": 2.7753, "step": 21808 }, { "epoch": 0.59, "learning_rate": 0.0007718095731520969, "loss": 2.8078, "step": 21809 }, { "epoch": 0.59, "learning_rate": 0.0007717248312197496, "loss": 2.3967, "step": 21810 }, { "epoch": 0.59, "learning_rate": 0.0007716400910167747, "loss": 2.783, "step": 21811 }, { "epoch": 0.59, "learning_rate": 0.0007715553525438133, "loss": 2.0481, "step": 21812 }, { "epoch": 0.59, "learning_rate": 0.0007714706158015077, "loss": 2.6392, "step": 21813 }, { "epoch": 0.59, "learning_rate": 0.0007713858807905, "loss": 2.3267, "step": 21814 }, { "epoch": 0.59, "learning_rate": 0.0007713011475114317, "loss": 2.3983, "step": 21815 }, { "epoch": 0.59, "learning_rate": 0.0007712164159649455, "loss": 2.0993, "step": 21816 }, { "epoch": 0.59, "learning_rate": 0.0007711316861516824, "loss": 2.6052, "step": 21817 }, { "epoch": 0.59, "learning_rate": 0.0007710469580722848, "loss": 2.3043, "step": 21818 }, { "epoch": 0.59, "learning_rate": 0.0007709622317273947, "loss": 2.7382, "step": 21819 }, { "epoch": 0.59, "learning_rate": 0.0007708775071176536, "loss": 2.4331, "step": 21820 }, { "epoch": 0.59, "learning_rate": 0.0007707927842437035, "loss": 2.374, "step": 21821 }, { "epoch": 0.59, "learning_rate": 0.0007707080631061867, "loss": 2.5205, "step": 21822 }, { "epoch": 0.59, "learning_rate": 0.000770623343705744, "loss": 2.709, "step": 21823 }, { "epoch": 0.59, "learning_rate": 0.0007705386260430186, "loss": 2.3604, "step": 21824 }, { "epoch": 0.59, "learning_rate": 0.000770453910118651, "loss": 2.5916, "step": 21825 }, { "epoch": 0.59, "learning_rate": 0.0007703691959332836, "loss": 2.6915, "step": 21826 }, { "epoch": 0.59, "learning_rate": 0.0007702844834875582, "loss": 2.5535, "step": 21827 }, { "epoch": 0.59, "learning_rate": 0.0007701997727821164, "loss": 2.8306, "step": 21828 }, { "epoch": 0.59, "learning_rate": 0.0007701150638176, "loss": 2.8321, "step": 21829 }, { "epoch": 0.59, "learning_rate": 0.000770030356594651, "loss": 2.4492, "step": 21830 }, { "epoch": 0.59, "learning_rate": 0.0007699456511139107, "loss": 2.3164, "step": 21831 }, { "epoch": 0.59, "learning_rate": 0.0007698609473760212, "loss": 2.9019, "step": 21832 }, { "epoch": 0.59, "learning_rate": 0.0007697762453816238, "loss": 2.5991, "step": 21833 }, { "epoch": 0.59, "learning_rate": 0.0007696915451313604, "loss": 2.1741, "step": 21834 }, { "epoch": 0.59, "learning_rate": 0.0007696068466258732, "loss": 2.3959, "step": 21835 }, { "epoch": 0.59, "learning_rate": 0.0007695221498658026, "loss": 2.7122, "step": 21836 }, { "epoch": 0.59, "learning_rate": 0.0007694374548517913, "loss": 2.6626, "step": 21837 }, { "epoch": 0.59, "learning_rate": 0.0007693527615844809, "loss": 2.7771, "step": 21838 }, { "epoch": 0.59, "learning_rate": 0.0007692680700645124, "loss": 2.2734, "step": 21839 }, { "epoch": 0.59, "learning_rate": 0.0007691833802925278, "loss": 2.8521, "step": 21840 }, { "epoch": 0.59, "learning_rate": 0.0007690986922691687, "loss": 2.4851, "step": 21841 }, { "epoch": 0.59, "learning_rate": 0.0007690140059950766, "loss": 2.3072, "step": 21842 }, { "epoch": 0.59, "learning_rate": 0.0007689293214708931, "loss": 2.3286, "step": 21843 }, { "epoch": 0.59, "learning_rate": 0.0007688446386972598, "loss": 2.6339, "step": 21844 }, { "epoch": 0.59, "learning_rate": 0.000768759957674818, "loss": 2.8715, "step": 21845 }, { "epoch": 0.59, "learning_rate": 0.0007686752784042095, "loss": 3.0641, "step": 21846 }, { "epoch": 0.59, "learning_rate": 0.0007685906008860758, "loss": 2.1703, "step": 21847 }, { "epoch": 0.59, "learning_rate": 0.0007685059251210583, "loss": 2.5903, "step": 21848 }, { "epoch": 0.59, "learning_rate": 0.0007684212511097987, "loss": 2.3656, "step": 21849 }, { "epoch": 0.59, "learning_rate": 0.0007683365788529379, "loss": 2.9625, "step": 21850 }, { "epoch": 0.59, "learning_rate": 0.0007682519083511185, "loss": 2.434, "step": 21851 }, { "epoch": 0.59, "learning_rate": 0.0007681672396049805, "loss": 2.2678, "step": 21852 }, { "epoch": 0.59, "learning_rate": 0.000768082572615166, "loss": 3.0345, "step": 21853 }, { "epoch": 0.59, "learning_rate": 0.0007679979073823172, "loss": 2.5747, "step": 21854 }, { "epoch": 0.59, "learning_rate": 0.0007679132439070741, "loss": 2.4197, "step": 21855 }, { "epoch": 0.59, "learning_rate": 0.0007678285821900789, "loss": 2.2574, "step": 21856 }, { "epoch": 0.59, "learning_rate": 0.0007677439222319731, "loss": 2.367, "step": 21857 }, { "epoch": 0.59, "learning_rate": 0.0007676592640333974, "loss": 2.2944, "step": 21858 }, { "epoch": 0.59, "learning_rate": 0.0007675746075949941, "loss": 2.5986, "step": 21859 }, { "epoch": 0.59, "learning_rate": 0.0007674899529174035, "loss": 2.2842, "step": 21860 }, { "epoch": 0.59, "learning_rate": 0.0007674053000012677, "loss": 2.2016, "step": 21861 }, { "epoch": 0.59, "learning_rate": 0.0007673206488472278, "loss": 2.3691, "step": 21862 }, { "epoch": 0.59, "learning_rate": 0.000767235999455925, "loss": 2.2716, "step": 21863 }, { "epoch": 0.59, "learning_rate": 0.0007671513518280005, "loss": 2.6841, "step": 21864 }, { "epoch": 0.59, "learning_rate": 0.0007670667059640964, "loss": 1.9619, "step": 21865 }, { "epoch": 0.59, "learning_rate": 0.0007669820618648525, "loss": 2.3668, "step": 21866 }, { "epoch": 0.59, "learning_rate": 0.0007668974195309114, "loss": 2.3715, "step": 21867 }, { "epoch": 0.59, "learning_rate": 0.0007668127789629134, "loss": 2.4409, "step": 21868 }, { "epoch": 0.59, "learning_rate": 0.0007667281401615002, "loss": 2.5351, "step": 21869 }, { "epoch": 0.59, "learning_rate": 0.000766643503127313, "loss": 2.652, "step": 21870 }, { "epoch": 0.59, "learning_rate": 0.0007665588678609927, "loss": 2.3464, "step": 21871 }, { "epoch": 0.59, "learning_rate": 0.0007664742343631807, "loss": 2.142, "step": 21872 }, { "epoch": 0.59, "learning_rate": 0.0007663896026345184, "loss": 2.3157, "step": 21873 }, { "epoch": 0.59, "learning_rate": 0.0007663049726756464, "loss": 2.7243, "step": 21874 }, { "epoch": 0.59, "learning_rate": 0.0007662203444872064, "loss": 2.5798, "step": 21875 }, { "epoch": 0.59, "learning_rate": 0.0007661357180698392, "loss": 2.3116, "step": 21876 }, { "epoch": 0.59, "learning_rate": 0.0007660510934241857, "loss": 2.5521, "step": 21877 }, { "epoch": 0.59, "learning_rate": 0.0007659664705508879, "loss": 2.4539, "step": 21878 }, { "epoch": 0.59, "learning_rate": 0.0007658818494505857, "loss": 2.3786, "step": 21879 }, { "epoch": 0.59, "learning_rate": 0.0007657972301239209, "loss": 2.6374, "step": 21880 }, { "epoch": 0.59, "learning_rate": 0.0007657126125715348, "loss": 2.2053, "step": 21881 }, { "epoch": 0.59, "learning_rate": 0.0007656279967940677, "loss": 2.4914, "step": 21882 }, { "epoch": 0.59, "learning_rate": 0.0007655433827921607, "loss": 2.722, "step": 21883 }, { "epoch": 0.59, "learning_rate": 0.0007654587705664558, "loss": 2.2854, "step": 21884 }, { "epoch": 0.59, "learning_rate": 0.0007653741601175929, "loss": 2.2576, "step": 21885 }, { "epoch": 0.59, "learning_rate": 0.0007652895514462136, "loss": 2.8671, "step": 21886 }, { "epoch": 0.59, "learning_rate": 0.0007652049445529585, "loss": 2.9859, "step": 21887 }, { "epoch": 0.59, "learning_rate": 0.0007651203394384689, "loss": 2.3244, "step": 21888 }, { "epoch": 0.59, "learning_rate": 0.0007650357361033857, "loss": 2.7059, "step": 21889 }, { "epoch": 0.59, "learning_rate": 0.0007649511345483494, "loss": 2.8093, "step": 21890 }, { "epoch": 0.59, "learning_rate": 0.0007648665347740015, "loss": 2.3857, "step": 21891 }, { "epoch": 0.59, "learning_rate": 0.0007647819367809827, "loss": 2.4949, "step": 21892 }, { "epoch": 0.59, "learning_rate": 0.0007646973405699339, "loss": 2.872, "step": 21893 }, { "epoch": 0.59, "learning_rate": 0.0007646127461414964, "loss": 2.7391, "step": 21894 }, { "epoch": 0.59, "learning_rate": 0.00076452815349631, "loss": 2.6706, "step": 21895 }, { "epoch": 0.59, "learning_rate": 0.0007644435626350161, "loss": 2.7289, "step": 21896 }, { "epoch": 0.59, "learning_rate": 0.0007643589735582565, "loss": 2.2681, "step": 21897 }, { "epoch": 0.59, "learning_rate": 0.0007642743862666706, "loss": 2.5003, "step": 21898 }, { "epoch": 0.59, "learning_rate": 0.0007641898007608997, "loss": 2.5623, "step": 21899 }, { "epoch": 0.59, "learning_rate": 0.0007641052170415851, "loss": 2.827, "step": 21900 }, { "epoch": 0.59, "learning_rate": 0.0007640206351093668, "loss": 2.5662, "step": 21901 }, { "epoch": 0.59, "learning_rate": 0.0007639360549648864, "loss": 2.0015, "step": 21902 }, { "epoch": 0.59, "learning_rate": 0.0007638514766087839, "loss": 2.5658, "step": 21903 }, { "epoch": 0.59, "learning_rate": 0.0007637669000417005, "loss": 2.2838, "step": 21904 }, { "epoch": 0.59, "learning_rate": 0.0007636823252642769, "loss": 2.7295, "step": 21905 }, { "epoch": 0.59, "learning_rate": 0.0007635977522771535, "loss": 2.3269, "step": 21906 }, { "epoch": 0.59, "learning_rate": 0.0007635131810809715, "loss": 2.5639, "step": 21907 }, { "epoch": 0.59, "learning_rate": 0.0007634286116763717, "loss": 2.6952, "step": 21908 }, { "epoch": 0.59, "learning_rate": 0.0007633440440639937, "loss": 2.6977, "step": 21909 }, { "epoch": 0.59, "learning_rate": 0.0007632594782444797, "loss": 2.7285, "step": 21910 }, { "epoch": 0.59, "learning_rate": 0.000763174914218469, "loss": 2.3701, "step": 21911 }, { "epoch": 0.59, "learning_rate": 0.000763090351986603, "loss": 2.353, "step": 21912 }, { "epoch": 0.59, "learning_rate": 0.0007630057915495221, "loss": 2.3354, "step": 21913 }, { "epoch": 0.59, "learning_rate": 0.0007629212329078669, "loss": 2.9391, "step": 21914 }, { "epoch": 0.59, "learning_rate": 0.000762836676062278, "loss": 3.0715, "step": 21915 }, { "epoch": 0.59, "learning_rate": 0.0007627521210133964, "loss": 2.3872, "step": 21916 }, { "epoch": 0.59, "learning_rate": 0.0007626675677618619, "loss": 2.6762, "step": 21917 }, { "epoch": 0.59, "learning_rate": 0.0007625830163083155, "loss": 2.938, "step": 21918 }, { "epoch": 0.59, "learning_rate": 0.0007624984666533979, "loss": 2.662, "step": 21919 }, { "epoch": 0.59, "learning_rate": 0.0007624139187977493, "loss": 2.1746, "step": 21920 }, { "epoch": 0.59, "learning_rate": 0.0007623293727420106, "loss": 2.351, "step": 21921 }, { "epoch": 0.59, "learning_rate": 0.0007622448284868219, "loss": 2.5521, "step": 21922 }, { "epoch": 0.59, "learning_rate": 0.000762160286032824, "loss": 2.7508, "step": 21923 }, { "epoch": 0.59, "learning_rate": 0.0007620757453806574, "loss": 2.625, "step": 21924 }, { "epoch": 0.59, "learning_rate": 0.000761991206530962, "loss": 2.9583, "step": 21925 }, { "epoch": 0.59, "learning_rate": 0.0007619066694843788, "loss": 2.1254, "step": 21926 }, { "epoch": 0.59, "learning_rate": 0.0007618221342415484, "loss": 2.5593, "step": 21927 }, { "epoch": 0.59, "learning_rate": 0.0007617376008031107, "loss": 2.6954, "step": 21928 }, { "epoch": 0.59, "learning_rate": 0.0007616530691697065, "loss": 2.1163, "step": 21929 }, { "epoch": 0.59, "learning_rate": 0.0007615685393419758, "loss": 2.2257, "step": 21930 }, { "epoch": 0.59, "learning_rate": 0.0007614840113205592, "loss": 2.4765, "step": 21931 }, { "epoch": 0.59, "learning_rate": 0.0007613994851060973, "loss": 2.6929, "step": 21932 }, { "epoch": 0.59, "learning_rate": 0.00076131496069923, "loss": 2.4661, "step": 21933 }, { "epoch": 0.59, "learning_rate": 0.000761230438100598, "loss": 1.9783, "step": 21934 }, { "epoch": 0.59, "learning_rate": 0.0007611459173108416, "loss": 2.2781, "step": 21935 }, { "epoch": 0.59, "learning_rate": 0.000761061398330601, "loss": 2.2556, "step": 21936 }, { "epoch": 0.59, "learning_rate": 0.0007609768811605166, "loss": 2.5197, "step": 21937 }, { "epoch": 0.59, "learning_rate": 0.0007608923658012284, "loss": 2.3001, "step": 21938 }, { "epoch": 0.59, "learning_rate": 0.0007608078522533768, "loss": 2.2502, "step": 21939 }, { "epoch": 0.59, "learning_rate": 0.0007607233405176028, "loss": 2.4256, "step": 21940 }, { "epoch": 0.59, "learning_rate": 0.0007606388305945453, "loss": 2.3439, "step": 21941 }, { "epoch": 0.59, "learning_rate": 0.0007605543224848452, "loss": 2.6257, "step": 21942 }, { "epoch": 0.59, "learning_rate": 0.0007604698161891433, "loss": 2.7174, "step": 21943 }, { "epoch": 0.59, "learning_rate": 0.0007603853117080789, "loss": 2.4668, "step": 21944 }, { "epoch": 0.59, "learning_rate": 0.0007603008090422927, "loss": 2.4606, "step": 21945 }, { "epoch": 0.59, "learning_rate": 0.0007602163081924245, "loss": 2.5582, "step": 21946 }, { "epoch": 0.59, "learning_rate": 0.0007601318091591148, "loss": 2.1134, "step": 21947 }, { "epoch": 0.59, "learning_rate": 0.0007600473119430037, "loss": 2.7904, "step": 21948 }, { "epoch": 0.59, "learning_rate": 0.0007599628165447311, "loss": 2.4047, "step": 21949 }, { "epoch": 0.59, "learning_rate": 0.0007598783229649372, "loss": 2.5785, "step": 21950 }, { "epoch": 0.59, "learning_rate": 0.0007597938312042625, "loss": 2.5166, "step": 21951 }, { "epoch": 0.59, "learning_rate": 0.0007597093412633466, "loss": 2.4994, "step": 21952 }, { "epoch": 0.59, "learning_rate": 0.0007596248531428301, "loss": 2.1705, "step": 21953 }, { "epoch": 0.59, "learning_rate": 0.0007595403668433525, "loss": 2.6802, "step": 21954 }, { "epoch": 0.59, "learning_rate": 0.0007594558823655536, "loss": 2.4927, "step": 21955 }, { "epoch": 0.59, "learning_rate": 0.0007593713997100748, "loss": 2.6959, "step": 21956 }, { "epoch": 0.59, "learning_rate": 0.0007592869188775547, "loss": 2.5067, "step": 21957 }, { "epoch": 0.59, "learning_rate": 0.0007592024398686339, "loss": 2.6013, "step": 21958 }, { "epoch": 0.59, "learning_rate": 0.0007591179626839526, "loss": 2.2809, "step": 21959 }, { "epoch": 0.59, "learning_rate": 0.0007590334873241503, "loss": 2.4112, "step": 21960 }, { "epoch": 0.59, "learning_rate": 0.0007589490137898673, "loss": 2.5688, "step": 21961 }, { "epoch": 0.59, "learning_rate": 0.0007588645420817437, "loss": 2.5387, "step": 21962 }, { "epoch": 0.59, "learning_rate": 0.0007587800722004188, "loss": 2.4261, "step": 21963 }, { "epoch": 0.59, "learning_rate": 0.0007586956041465334, "loss": 2.7635, "step": 21964 }, { "epoch": 0.59, "learning_rate": 0.0007586111379207267, "loss": 2.7413, "step": 21965 }, { "epoch": 0.59, "learning_rate": 0.0007585266735236388, "loss": 3.0048, "step": 21966 }, { "epoch": 0.59, "learning_rate": 0.0007584422109559101, "loss": 2.289, "step": 21967 }, { "epoch": 0.59, "learning_rate": 0.0007583577502181793, "loss": 2.4309, "step": 21968 }, { "epoch": 0.59, "learning_rate": 0.0007582732913110873, "loss": 2.3399, "step": 21969 }, { "epoch": 0.59, "learning_rate": 0.0007581888342352741, "loss": 2.6242, "step": 21970 }, { "epoch": 0.59, "learning_rate": 0.0007581043789913785, "loss": 2.3626, "step": 21971 }, { "epoch": 0.59, "learning_rate": 0.0007580199255800411, "loss": 2.5943, "step": 21972 }, { "epoch": 0.59, "learning_rate": 0.0007579354740019014, "loss": 2.4464, "step": 21973 }, { "epoch": 0.59, "learning_rate": 0.0007578510242575991, "loss": 2.2087, "step": 21974 }, { "epoch": 0.59, "learning_rate": 0.0007577665763477745, "loss": 2.5018, "step": 21975 }, { "epoch": 0.59, "learning_rate": 0.0007576821302730667, "loss": 2.9289, "step": 21976 }, { "epoch": 0.59, "learning_rate": 0.0007575976860341158, "loss": 2.7423, "step": 21977 }, { "epoch": 0.59, "learning_rate": 0.0007575132436315617, "loss": 2.5383, "step": 21978 }, { "epoch": 0.59, "learning_rate": 0.0007574288030660438, "loss": 2.4088, "step": 21979 }, { "epoch": 0.59, "learning_rate": 0.0007573443643382023, "loss": 2.7784, "step": 21980 }, { "epoch": 0.59, "learning_rate": 0.0007572599274486757, "loss": 2.5963, "step": 21981 }, { "epoch": 0.59, "learning_rate": 0.0007571754923981049, "loss": 2.6293, "step": 21982 }, { "epoch": 0.59, "learning_rate": 0.0007570910591871295, "loss": 2.8421, "step": 21983 }, { "epoch": 0.59, "learning_rate": 0.0007570066278163885, "loss": 2.559, "step": 21984 }, { "epoch": 0.59, "learning_rate": 0.0007569221982865216, "loss": 3.0063, "step": 21985 }, { "epoch": 0.59, "learning_rate": 0.000756837770598169, "loss": 2.7156, "step": 21986 }, { "epoch": 0.59, "learning_rate": 0.0007567533447519699, "loss": 2.5151, "step": 21987 }, { "epoch": 0.59, "learning_rate": 0.000756668920748564, "loss": 2.2941, "step": 21988 }, { "epoch": 0.59, "learning_rate": 0.0007565844985885908, "loss": 2.3774, "step": 21989 }, { "epoch": 0.59, "learning_rate": 0.0007565000782726899, "loss": 2.4003, "step": 21990 }, { "epoch": 0.59, "learning_rate": 0.000756415659801501, "loss": 2.6629, "step": 21991 }, { "epoch": 0.59, "learning_rate": 0.0007563312431756633, "loss": 2.4343, "step": 21992 }, { "epoch": 0.59, "learning_rate": 0.0007562468283958166, "loss": 2.3966, "step": 21993 }, { "epoch": 0.59, "learning_rate": 0.0007561624154626004, "loss": 2.5436, "step": 21994 }, { "epoch": 0.59, "learning_rate": 0.0007560780043766541, "loss": 2.6341, "step": 21995 }, { "epoch": 0.59, "learning_rate": 0.0007559935951386173, "loss": 2.8887, "step": 21996 }, { "epoch": 0.59, "learning_rate": 0.0007559091877491296, "loss": 2.6128, "step": 21997 }, { "epoch": 0.59, "learning_rate": 0.0007558247822088298, "loss": 2.5993, "step": 21998 }, { "epoch": 0.59, "learning_rate": 0.0007557403785183583, "loss": 2.5843, "step": 21999 }, { "epoch": 0.59, "learning_rate": 0.0007556559766783537, "loss": 2.391, "step": 22000 }, { "epoch": 0.59, "learning_rate": 0.0007555715766894556, "loss": 2.6138, "step": 22001 }, { "epoch": 0.59, "learning_rate": 0.0007554871785523039, "loss": 2.2823, "step": 22002 }, { "epoch": 0.59, "learning_rate": 0.0007554027822675374, "loss": 2.635, "step": 22003 }, { "epoch": 0.59, "learning_rate": 0.0007553183878357956, "loss": 2.653, "step": 22004 }, { "epoch": 0.59, "learning_rate": 0.0007552339952577182, "loss": 2.8281, "step": 22005 }, { "epoch": 0.59, "learning_rate": 0.000755149604533944, "loss": 2.1426, "step": 22006 }, { "epoch": 0.59, "learning_rate": 0.000755065215665113, "loss": 2.4497, "step": 22007 }, { "epoch": 0.59, "learning_rate": 0.0007549808286518637, "loss": 2.3934, "step": 22008 }, { "epoch": 0.59, "learning_rate": 0.0007548964434948361, "loss": 2.6919, "step": 22009 }, { "epoch": 0.59, "learning_rate": 0.0007548120601946696, "loss": 2.6568, "step": 22010 }, { "epoch": 0.59, "learning_rate": 0.0007547276787520024, "loss": 2.5928, "step": 22011 }, { "epoch": 0.59, "learning_rate": 0.0007546432991674746, "loss": 2.8443, "step": 22012 }, { "epoch": 0.59, "learning_rate": 0.0007545589214417257, "loss": 2.2205, "step": 22013 }, { "epoch": 0.59, "learning_rate": 0.0007544745455753942, "loss": 2.2132, "step": 22014 }, { "epoch": 0.59, "learning_rate": 0.0007543901715691198, "loss": 2.2374, "step": 22015 }, { "epoch": 0.59, "learning_rate": 0.0007543057994235414, "loss": 2.1407, "step": 22016 }, { "epoch": 0.59, "learning_rate": 0.0007542214291392983, "loss": 2.3192, "step": 22017 }, { "epoch": 0.59, "learning_rate": 0.0007541370607170299, "loss": 2.4468, "step": 22018 }, { "epoch": 0.59, "learning_rate": 0.0007540526941573751, "loss": 2.2937, "step": 22019 }, { "epoch": 0.59, "learning_rate": 0.000753968329460973, "loss": 2.7043, "step": 22020 }, { "epoch": 0.59, "learning_rate": 0.000753883966628463, "loss": 2.3268, "step": 22021 }, { "epoch": 0.59, "learning_rate": 0.000753799605660484, "loss": 2.7865, "step": 22022 }, { "epoch": 0.59, "learning_rate": 0.0007537152465576755, "loss": 2.8361, "step": 22023 }, { "epoch": 0.59, "learning_rate": 0.0007536308893206757, "loss": 2.1805, "step": 22024 }, { "epoch": 0.59, "learning_rate": 0.0007535465339501244, "loss": 2.1777, "step": 22025 }, { "epoch": 0.59, "learning_rate": 0.000753462180446661, "loss": 2.1045, "step": 22026 }, { "epoch": 0.59, "learning_rate": 0.0007533778288109234, "loss": 2.2204, "step": 22027 }, { "epoch": 0.59, "learning_rate": 0.0007532934790435513, "loss": 2.4236, "step": 22028 }, { "epoch": 0.59, "learning_rate": 0.0007532091311451841, "loss": 2.7681, "step": 22029 }, { "epoch": 0.59, "learning_rate": 0.0007531247851164602, "loss": 2.667, "step": 22030 }, { "epoch": 0.59, "learning_rate": 0.0007530404409580188, "loss": 2.4268, "step": 22031 }, { "epoch": 0.59, "learning_rate": 0.0007529560986704989, "loss": 2.8574, "step": 22032 }, { "epoch": 0.59, "learning_rate": 0.0007528717582545392, "loss": 2.2469, "step": 22033 }, { "epoch": 0.59, "learning_rate": 0.0007527874197107794, "loss": 2.5917, "step": 22034 }, { "epoch": 0.59, "learning_rate": 0.0007527030830398574, "loss": 2.3264, "step": 22035 }, { "epoch": 0.59, "learning_rate": 0.0007526187482424127, "loss": 2.841, "step": 22036 }, { "epoch": 0.59, "learning_rate": 0.0007525344153190844, "loss": 2.9076, "step": 22037 }, { "epoch": 0.59, "learning_rate": 0.0007524500842705109, "loss": 2.7513, "step": 22038 }, { "epoch": 0.59, "learning_rate": 0.0007523657550973313, "loss": 2.3064, "step": 22039 }, { "epoch": 0.59, "learning_rate": 0.0007522814278001849, "loss": 2.4234, "step": 22040 }, { "epoch": 0.59, "learning_rate": 0.0007521971023797094, "loss": 2.3901, "step": 22041 }, { "epoch": 0.59, "learning_rate": 0.0007521127788365449, "loss": 2.4604, "step": 22042 }, { "epoch": 0.59, "learning_rate": 0.0007520284571713295, "loss": 2.3437, "step": 22043 }, { "epoch": 0.59, "learning_rate": 0.000751944137384702, "loss": 2.3209, "step": 22044 }, { "epoch": 0.59, "learning_rate": 0.0007518598194773017, "loss": 2.2923, "step": 22045 }, { "epoch": 0.59, "learning_rate": 0.0007517755034497668, "loss": 2.8121, "step": 22046 }, { "epoch": 0.59, "learning_rate": 0.0007516911893027363, "loss": 2.5276, "step": 22047 }, { "epoch": 0.59, "learning_rate": 0.0007516068770368491, "loss": 2.4629, "step": 22048 }, { "epoch": 0.59, "learning_rate": 0.0007515225666527436, "loss": 2.4934, "step": 22049 }, { "epoch": 0.59, "learning_rate": 0.000751438258151059, "loss": 2.2036, "step": 22050 }, { "epoch": 0.59, "learning_rate": 0.0007513539515324334, "loss": 2.0795, "step": 22051 }, { "epoch": 0.59, "learning_rate": 0.0007512696467975059, "loss": 2.7766, "step": 22052 }, { "epoch": 0.59, "learning_rate": 0.0007511853439469155, "loss": 2.5201, "step": 22053 }, { "epoch": 0.59, "learning_rate": 0.0007511010429812997, "loss": 2.235, "step": 22054 }, { "epoch": 0.59, "learning_rate": 0.0007510167439012983, "loss": 2.578, "step": 22055 }, { "epoch": 0.59, "learning_rate": 0.0007509324467075498, "loss": 2.0662, "step": 22056 }, { "epoch": 0.59, "learning_rate": 0.0007508481514006921, "loss": 2.2979, "step": 22057 }, { "epoch": 0.59, "learning_rate": 0.0007507638579813647, "loss": 2.6863, "step": 22058 }, { "epoch": 0.59, "learning_rate": 0.0007506795664502054, "loss": 2.4729, "step": 22059 }, { "epoch": 0.59, "learning_rate": 0.0007505952768078531, "loss": 2.8401, "step": 22060 }, { "epoch": 0.59, "learning_rate": 0.0007505109890549467, "loss": 2.6879, "step": 22061 }, { "epoch": 0.59, "learning_rate": 0.0007504267031921241, "loss": 2.4568, "step": 22062 }, { "epoch": 0.59, "learning_rate": 0.0007503424192200243, "loss": 2.1394, "step": 22063 }, { "epoch": 0.59, "learning_rate": 0.0007502581371392858, "loss": 2.6904, "step": 22064 }, { "epoch": 0.59, "learning_rate": 0.000750173856950547, "loss": 2.5577, "step": 22065 }, { "epoch": 0.59, "learning_rate": 0.0007500895786544466, "loss": 2.7349, "step": 22066 }, { "epoch": 0.59, "learning_rate": 0.0007500053022516223, "loss": 2.5366, "step": 22067 }, { "epoch": 0.59, "learning_rate": 0.0007499210277427134, "loss": 2.5242, "step": 22068 }, { "epoch": 0.59, "learning_rate": 0.0007498367551283584, "loss": 2.4752, "step": 22069 }, { "epoch": 0.59, "learning_rate": 0.000749752484409195, "loss": 2.9095, "step": 22070 }, { "epoch": 0.59, "learning_rate": 0.0007496682155858619, "loss": 2.0679, "step": 22071 }, { "epoch": 0.59, "learning_rate": 0.0007495839486589982, "loss": 1.9674, "step": 22072 }, { "epoch": 0.59, "learning_rate": 0.0007494996836292415, "loss": 2.6186, "step": 22073 }, { "epoch": 0.59, "learning_rate": 0.0007494154204972303, "loss": 2.548, "step": 22074 }, { "epoch": 0.59, "learning_rate": 0.0007493311592636032, "loss": 2.6019, "step": 22075 }, { "epoch": 0.59, "learning_rate": 0.0007492468999289983, "loss": 2.8123, "step": 22076 }, { "epoch": 0.59, "learning_rate": 0.0007491626424940543, "loss": 2.4641, "step": 22077 }, { "epoch": 0.59, "learning_rate": 0.0007490783869594089, "loss": 2.1722, "step": 22078 }, { "epoch": 0.59, "learning_rate": 0.0007489941333257009, "loss": 2.5951, "step": 22079 }, { "epoch": 0.59, "learning_rate": 0.0007489098815935686, "loss": 2.6009, "step": 22080 }, { "epoch": 0.59, "learning_rate": 0.0007488256317636501, "loss": 2.4687, "step": 22081 }, { "epoch": 0.59, "learning_rate": 0.0007487413838365836, "loss": 2.3037, "step": 22082 }, { "epoch": 0.59, "learning_rate": 0.000748657137813008, "loss": 2.605, "step": 22083 }, { "epoch": 0.59, "learning_rate": 0.0007485728936935601, "loss": 2.5623, "step": 22084 }, { "epoch": 0.59, "learning_rate": 0.0007484886514788798, "loss": 2.5109, "step": 22085 }, { "epoch": 0.59, "learning_rate": 0.0007484044111696042, "loss": 2.9096, "step": 22086 }, { "epoch": 0.59, "learning_rate": 0.0007483201727663715, "loss": 2.3534, "step": 22087 }, { "epoch": 0.59, "learning_rate": 0.0007482359362698207, "loss": 2.6931, "step": 22088 }, { "epoch": 0.59, "learning_rate": 0.000748151701680589, "loss": 2.6661, "step": 22089 }, { "epoch": 0.59, "learning_rate": 0.0007480674689993151, "loss": 2.5733, "step": 22090 }, { "epoch": 0.59, "learning_rate": 0.0007479832382266371, "loss": 2.8174, "step": 22091 }, { "epoch": 0.59, "learning_rate": 0.000747899009363193, "loss": 2.6708, "step": 22092 }, { "epoch": 0.59, "learning_rate": 0.0007478147824096211, "loss": 2.7751, "step": 22093 }, { "epoch": 0.59, "learning_rate": 0.000747730557366559, "loss": 2.312, "step": 22094 }, { "epoch": 0.59, "learning_rate": 0.0007476463342346451, "loss": 2.4907, "step": 22095 }, { "epoch": 0.59, "learning_rate": 0.0007475621130145178, "loss": 2.4701, "step": 22096 }, { "epoch": 0.59, "learning_rate": 0.0007474778937068145, "loss": 2.6375, "step": 22097 }, { "epoch": 0.59, "learning_rate": 0.0007473936763121736, "loss": 2.79, "step": 22098 }, { "epoch": 0.59, "learning_rate": 0.0007473094608312335, "loss": 2.5517, "step": 22099 }, { "epoch": 0.59, "learning_rate": 0.0007472252472646309, "loss": 2.7728, "step": 22100 }, { "epoch": 0.59, "learning_rate": 0.0007471410356130055, "loss": 2.2234, "step": 22101 }, { "epoch": 0.59, "learning_rate": 0.0007470568258769938, "loss": 2.3957, "step": 22102 }, { "epoch": 0.59, "learning_rate": 0.0007469726180572345, "loss": 2.2095, "step": 22103 }, { "epoch": 0.59, "learning_rate": 0.0007468884121543656, "loss": 2.1846, "step": 22104 }, { "epoch": 0.59, "learning_rate": 0.0007468042081690246, "loss": 2.1076, "step": 22105 }, { "epoch": 0.59, "learning_rate": 0.0007467200061018496, "loss": 2.4461, "step": 22106 }, { "epoch": 0.59, "learning_rate": 0.0007466358059534788, "loss": 2.3695, "step": 22107 }, { "epoch": 0.59, "learning_rate": 0.0007465516077245495, "loss": 2.3169, "step": 22108 }, { "epoch": 0.59, "learning_rate": 0.0007464674114157002, "loss": 2.3473, "step": 22109 }, { "epoch": 0.59, "learning_rate": 0.0007463832170275684, "loss": 2.8525, "step": 22110 }, { "epoch": 0.59, "learning_rate": 0.000746299024560792, "loss": 2.3361, "step": 22111 }, { "epoch": 0.59, "learning_rate": 0.0007462148340160091, "loss": 2.6174, "step": 22112 }, { "epoch": 0.59, "learning_rate": 0.0007461306453938568, "loss": 2.5793, "step": 22113 }, { "epoch": 0.59, "learning_rate": 0.0007460464586949734, "loss": 2.2348, "step": 22114 }, { "epoch": 0.59, "learning_rate": 0.000745962273919997, "loss": 2.9403, "step": 22115 }, { "epoch": 0.59, "learning_rate": 0.0007458780910695647, "loss": 2.2835, "step": 22116 }, { "epoch": 0.59, "learning_rate": 0.0007457939101443143, "loss": 2.5694, "step": 22117 }, { "epoch": 0.59, "learning_rate": 0.0007457097311448844, "loss": 2.98, "step": 22118 }, { "epoch": 0.59, "learning_rate": 0.0007456255540719117, "loss": 2.4821, "step": 22119 }, { "epoch": 0.59, "learning_rate": 0.0007455413789260346, "loss": 2.5095, "step": 22120 }, { "epoch": 0.59, "learning_rate": 0.0007454572057078902, "loss": 2.4419, "step": 22121 }, { "epoch": 0.59, "learning_rate": 0.0007453730344181166, "loss": 2.2634, "step": 22122 }, { "epoch": 0.59, "learning_rate": 0.0007452888650573515, "loss": 2.6855, "step": 22123 }, { "epoch": 0.59, "learning_rate": 0.0007452046976262322, "loss": 2.4845, "step": 22124 }, { "epoch": 0.59, "learning_rate": 0.0007451205321253966, "loss": 2.3372, "step": 22125 }, { "epoch": 0.59, "learning_rate": 0.0007450363685554825, "loss": 2.4311, "step": 22126 }, { "epoch": 0.59, "learning_rate": 0.0007449522069171271, "loss": 2.6313, "step": 22127 }, { "epoch": 0.59, "learning_rate": 0.0007448680472109685, "loss": 2.6164, "step": 22128 }, { "epoch": 0.59, "learning_rate": 0.0007447838894376437, "loss": 2.4684, "step": 22129 }, { "epoch": 0.59, "learning_rate": 0.0007446997335977902, "loss": 2.4703, "step": 22130 }, { "epoch": 0.59, "learning_rate": 0.0007446155796920465, "loss": 1.9963, "step": 22131 }, { "epoch": 0.59, "learning_rate": 0.0007445314277210491, "loss": 2.7294, "step": 22132 }, { "epoch": 0.59, "learning_rate": 0.000744447277685436, "loss": 2.5001, "step": 22133 }, { "epoch": 0.59, "learning_rate": 0.0007443631295858448, "loss": 2.3144, "step": 22134 }, { "epoch": 0.59, "learning_rate": 0.0007442789834229127, "loss": 2.2702, "step": 22135 }, { "epoch": 0.59, "learning_rate": 0.0007441948391972773, "loss": 2.264, "step": 22136 }, { "epoch": 0.59, "learning_rate": 0.000744110696909576, "loss": 2.9381, "step": 22137 }, { "epoch": 0.59, "learning_rate": 0.0007440265565604462, "loss": 2.8434, "step": 22138 }, { "epoch": 0.59, "learning_rate": 0.0007439424181505259, "loss": 2.6231, "step": 22139 }, { "epoch": 0.59, "learning_rate": 0.0007438582816804517, "loss": 2.2992, "step": 22140 }, { "epoch": 0.6, "learning_rate": 0.0007437741471508614, "loss": 2.721, "step": 22141 }, { "epoch": 0.6, "learning_rate": 0.0007436900145623926, "loss": 2.7901, "step": 22142 }, { "epoch": 0.6, "learning_rate": 0.0007436058839156819, "loss": 2.4858, "step": 22143 }, { "epoch": 0.6, "learning_rate": 0.0007435217552113675, "loss": 2.3159, "step": 22144 }, { "epoch": 0.6, "learning_rate": 0.0007434376284500868, "loss": 2.3923, "step": 22145 }, { "epoch": 0.6, "learning_rate": 0.0007433535036324763, "loss": 2.3872, "step": 22146 }, { "epoch": 0.6, "learning_rate": 0.0007432693807591739, "loss": 2.2402, "step": 22147 }, { "epoch": 0.6, "learning_rate": 0.0007431852598308167, "loss": 2.886, "step": 22148 }, { "epoch": 0.6, "learning_rate": 0.000743101140848042, "loss": 2.3007, "step": 22149 }, { "epoch": 0.6, "learning_rate": 0.0007430170238114874, "loss": 2.5788, "step": 22150 }, { "epoch": 0.6, "learning_rate": 0.0007429329087217896, "loss": 2.4962, "step": 22151 }, { "epoch": 0.6, "learning_rate": 0.0007428487955795862, "loss": 2.4738, "step": 22152 }, { "epoch": 0.6, "learning_rate": 0.0007427646843855144, "loss": 2.6498, "step": 22153 }, { "epoch": 0.6, "learning_rate": 0.0007426805751402114, "loss": 2.0828, "step": 22154 }, { "epoch": 0.6, "learning_rate": 0.0007425964678443146, "loss": 2.3236, "step": 22155 }, { "epoch": 0.6, "learning_rate": 0.0007425123624984604, "loss": 2.3423, "step": 22156 }, { "epoch": 0.6, "learning_rate": 0.0007424282591032866, "loss": 2.5183, "step": 22157 }, { "epoch": 0.6, "learning_rate": 0.0007423441576594308, "loss": 3.1174, "step": 22158 }, { "epoch": 0.6, "learning_rate": 0.0007422600581675291, "loss": 2.8542, "step": 22159 }, { "epoch": 0.6, "learning_rate": 0.0007421759606282189, "loss": 2.3449, "step": 22160 }, { "epoch": 0.6, "learning_rate": 0.0007420918650421382, "loss": 2.5895, "step": 22161 }, { "epoch": 0.6, "learning_rate": 0.000742007771409923, "loss": 2.7322, "step": 22162 }, { "epoch": 0.6, "learning_rate": 0.000741923679732211, "loss": 2.4879, "step": 22163 }, { "epoch": 0.6, "learning_rate": 0.0007418395900096389, "loss": 3.1617, "step": 22164 }, { "epoch": 0.6, "learning_rate": 0.0007417555022428438, "loss": 2.6625, "step": 22165 }, { "epoch": 0.6, "learning_rate": 0.0007416714164324631, "loss": 2.9574, "step": 22166 }, { "epoch": 0.6, "learning_rate": 0.0007415873325791333, "loss": 2.4881, "step": 22167 }, { "epoch": 0.6, "learning_rate": 0.0007415032506834918, "loss": 2.5542, "step": 22168 }, { "epoch": 0.6, "learning_rate": 0.0007414191707461757, "loss": 2.3673, "step": 22169 }, { "epoch": 0.6, "learning_rate": 0.0007413350927678213, "loss": 2.7835, "step": 22170 }, { "epoch": 0.6, "learning_rate": 0.0007412510167490667, "loss": 2.5506, "step": 22171 }, { "epoch": 0.6, "learning_rate": 0.0007411669426905474, "loss": 2.1833, "step": 22172 }, { "epoch": 0.6, "learning_rate": 0.0007410828705929012, "loss": 2.1063, "step": 22173 }, { "epoch": 0.6, "learning_rate": 0.0007409988004567652, "loss": 2.5233, "step": 22174 }, { "epoch": 0.6, "learning_rate": 0.0007409147322827757, "loss": 2.4748, "step": 22175 }, { "epoch": 0.6, "learning_rate": 0.0007408306660715699, "loss": 2.6933, "step": 22176 }, { "epoch": 0.6, "learning_rate": 0.0007407466018237847, "loss": 2.4315, "step": 22177 }, { "epoch": 0.6, "learning_rate": 0.0007406625395400568, "loss": 2.4587, "step": 22178 }, { "epoch": 0.6, "learning_rate": 0.0007405784792210233, "loss": 2.0395, "step": 22179 }, { "epoch": 0.6, "learning_rate": 0.0007404944208673208, "loss": 2.3332, "step": 22180 }, { "epoch": 0.6, "learning_rate": 0.0007404103644795861, "loss": 2.0541, "step": 22181 }, { "epoch": 0.6, "learning_rate": 0.0007403263100584563, "loss": 2.3913, "step": 22182 }, { "epoch": 0.6, "learning_rate": 0.0007402422576045676, "loss": 2.2878, "step": 22183 }, { "epoch": 0.6, "learning_rate": 0.0007401582071185572, "loss": 2.447, "step": 22184 }, { "epoch": 0.6, "learning_rate": 0.0007400741586010621, "loss": 2.1862, "step": 22185 }, { "epoch": 0.6, "learning_rate": 0.0007399901120527183, "loss": 2.4943, "step": 22186 }, { "epoch": 0.6, "learning_rate": 0.0007399060674741629, "loss": 2.8594, "step": 22187 }, { "epoch": 0.6, "learning_rate": 0.0007398220248660332, "loss": 2.3269, "step": 22188 }, { "epoch": 0.6, "learning_rate": 0.0007397379842289649, "loss": 2.5149, "step": 22189 }, { "epoch": 0.6, "learning_rate": 0.0007396539455635953, "loss": 2.5487, "step": 22190 }, { "epoch": 0.6, "learning_rate": 0.0007395699088705606, "loss": 2.745, "step": 22191 }, { "epoch": 0.6, "learning_rate": 0.0007394858741504977, "loss": 2.7863, "step": 22192 }, { "epoch": 0.6, "learning_rate": 0.0007394018414040434, "loss": 2.2786, "step": 22193 }, { "epoch": 0.6, "learning_rate": 0.0007393178106318341, "loss": 2.3958, "step": 22194 }, { "epoch": 0.6, "learning_rate": 0.0007392337818345063, "loss": 2.5878, "step": 22195 }, { "epoch": 0.6, "learning_rate": 0.0007391497550126971, "loss": 2.3631, "step": 22196 }, { "epoch": 0.6, "learning_rate": 0.0007390657301670425, "loss": 2.2551, "step": 22197 }, { "epoch": 0.6, "learning_rate": 0.0007389817072981795, "loss": 2.4046, "step": 22198 }, { "epoch": 0.6, "learning_rate": 0.000738897686406744, "loss": 2.2025, "step": 22199 }, { "epoch": 0.6, "learning_rate": 0.0007388136674933732, "loss": 2.3125, "step": 22200 }, { "epoch": 0.6, "learning_rate": 0.0007387296505587035, "loss": 2.6444, "step": 22201 }, { "epoch": 0.6, "learning_rate": 0.0007386456356033711, "loss": 2.6681, "step": 22202 }, { "epoch": 0.6, "learning_rate": 0.0007385616226280123, "loss": 2.3466, "step": 22203 }, { "epoch": 0.6, "learning_rate": 0.0007384776116332646, "loss": 2.0297, "step": 22204 }, { "epoch": 0.6, "learning_rate": 0.0007383936026197633, "loss": 2.5844, "step": 22205 }, { "epoch": 0.6, "learning_rate": 0.0007383095955881456, "loss": 2.0577, "step": 22206 }, { "epoch": 0.6, "learning_rate": 0.0007382255905390474, "loss": 2.3568, "step": 22207 }, { "epoch": 0.6, "learning_rate": 0.0007381415874731052, "loss": 2.7158, "step": 22208 }, { "epoch": 0.6, "learning_rate": 0.0007380575863909557, "loss": 2.1647, "step": 22209 }, { "epoch": 0.6, "learning_rate": 0.000737973587293235, "loss": 2.7402, "step": 22210 }, { "epoch": 0.6, "learning_rate": 0.0007378895901805796, "loss": 2.5634, "step": 22211 }, { "epoch": 0.6, "learning_rate": 0.000737805595053626, "loss": 3.1033, "step": 22212 }, { "epoch": 0.6, "learning_rate": 0.00073772160191301, "loss": 2.7315, "step": 22213 }, { "epoch": 0.6, "learning_rate": 0.0007376376107593687, "loss": 2.7112, "step": 22214 }, { "epoch": 0.6, "learning_rate": 0.0007375536215933376, "loss": 2.7249, "step": 22215 }, { "epoch": 0.6, "learning_rate": 0.0007374696344155531, "loss": 2.3282, "step": 22216 }, { "epoch": 0.6, "learning_rate": 0.0007373856492266524, "loss": 2.6138, "step": 22217 }, { "epoch": 0.6, "learning_rate": 0.0007373016660272705, "loss": 2.3194, "step": 22218 }, { "epoch": 0.6, "learning_rate": 0.0007372176848180443, "loss": 2.1813, "step": 22219 }, { "epoch": 0.6, "learning_rate": 0.0007371337055996103, "loss": 2.5419, "step": 22220 }, { "epoch": 0.6, "learning_rate": 0.0007370497283726039, "loss": 2.5446, "step": 22221 }, { "epoch": 0.6, "learning_rate": 0.000736965753137662, "loss": 2.5658, "step": 22222 }, { "epoch": 0.6, "learning_rate": 0.0007368817798954204, "loss": 2.478, "step": 22223 }, { "epoch": 0.6, "learning_rate": 0.0007367978086465155, "loss": 2.4166, "step": 22224 }, { "epoch": 0.6, "learning_rate": 0.0007367138393915833, "loss": 2.575, "step": 22225 }, { "epoch": 0.6, "learning_rate": 0.0007366298721312598, "loss": 2.494, "step": 22226 }, { "epoch": 0.6, "learning_rate": 0.0007365459068661814, "loss": 2.1403, "step": 22227 }, { "epoch": 0.6, "learning_rate": 0.0007364619435969847, "loss": 2.0304, "step": 22228 }, { "epoch": 0.6, "learning_rate": 0.0007363779823243044, "loss": 2.4384, "step": 22229 }, { "epoch": 0.6, "learning_rate": 0.0007362940230487776, "loss": 2.8279, "step": 22230 }, { "epoch": 0.6, "learning_rate": 0.0007362100657710405, "loss": 2.464, "step": 22231 }, { "epoch": 0.6, "learning_rate": 0.0007361261104917284, "loss": 2.833, "step": 22232 }, { "epoch": 0.6, "learning_rate": 0.0007360421572114779, "loss": 2.0747, "step": 22233 }, { "epoch": 0.6, "learning_rate": 0.0007359582059309246, "loss": 2.692, "step": 22234 }, { "epoch": 0.6, "learning_rate": 0.0007358742566507049, "loss": 2.4637, "step": 22235 }, { "epoch": 0.6, "learning_rate": 0.0007357903093714546, "loss": 2.5192, "step": 22236 }, { "epoch": 0.6, "learning_rate": 0.0007357063640938095, "loss": 2.6619, "step": 22237 }, { "epoch": 0.6, "learning_rate": 0.0007356224208184058, "loss": 2.5858, "step": 22238 }, { "epoch": 0.6, "learning_rate": 0.0007355384795458796, "loss": 2.4603, "step": 22239 }, { "epoch": 0.6, "learning_rate": 0.0007354545402768664, "loss": 2.876, "step": 22240 }, { "epoch": 0.6, "learning_rate": 0.0007353706030120027, "loss": 2.2922, "step": 22241 }, { "epoch": 0.6, "learning_rate": 0.0007352866677519232, "loss": 2.8097, "step": 22242 }, { "epoch": 0.6, "learning_rate": 0.000735202734497265, "loss": 2.3178, "step": 22243 }, { "epoch": 0.6, "learning_rate": 0.000735118803248664, "loss": 2.4474, "step": 22244 }, { "epoch": 0.6, "learning_rate": 0.000735034874006755, "loss": 3.0288, "step": 22245 }, { "epoch": 0.6, "learning_rate": 0.0007349509467721742, "loss": 3.0135, "step": 22246 }, { "epoch": 0.6, "learning_rate": 0.0007348670215455584, "loss": 2.4262, "step": 22247 }, { "epoch": 0.6, "learning_rate": 0.0007347830983275423, "loss": 2.4209, "step": 22248 }, { "epoch": 0.6, "learning_rate": 0.0007346991771187622, "loss": 2.5978, "step": 22249 }, { "epoch": 0.6, "learning_rate": 0.0007346152579198533, "loss": 2.1775, "step": 22250 }, { "epoch": 0.6, "learning_rate": 0.0007345313407314518, "loss": 2.5281, "step": 22251 }, { "epoch": 0.6, "learning_rate": 0.0007344474255541937, "loss": 2.5342, "step": 22252 }, { "epoch": 0.6, "learning_rate": 0.0007343635123887143, "loss": 2.2008, "step": 22253 }, { "epoch": 0.6, "learning_rate": 0.0007342796012356493, "loss": 2.7373, "step": 22254 }, { "epoch": 0.6, "learning_rate": 0.0007341956920956347, "loss": 2.2634, "step": 22255 }, { "epoch": 0.6, "learning_rate": 0.000734111784969306, "loss": 2.2814, "step": 22256 }, { "epoch": 0.6, "learning_rate": 0.0007340278798572988, "loss": 2.3291, "step": 22257 }, { "epoch": 0.6, "learning_rate": 0.0007339439767602489, "loss": 2.3404, "step": 22258 }, { "epoch": 0.6, "learning_rate": 0.0007338600756787919, "loss": 2.5773, "step": 22259 }, { "epoch": 0.6, "learning_rate": 0.0007337761766135635, "loss": 2.8442, "step": 22260 }, { "epoch": 0.6, "learning_rate": 0.000733692279565199, "loss": 2.5041, "step": 22261 }, { "epoch": 0.6, "learning_rate": 0.000733608384534334, "loss": 2.206, "step": 22262 }, { "epoch": 0.6, "learning_rate": 0.0007335244915216048, "loss": 1.7473, "step": 22263 }, { "epoch": 0.6, "learning_rate": 0.000733440600527646, "loss": 2.8874, "step": 22264 }, { "epoch": 0.6, "learning_rate": 0.0007333567115530935, "loss": 2.6066, "step": 22265 }, { "epoch": 0.6, "learning_rate": 0.0007332728245985831, "loss": 2.8022, "step": 22266 }, { "epoch": 0.6, "learning_rate": 0.0007331889396647499, "loss": 2.255, "step": 22267 }, { "epoch": 0.6, "learning_rate": 0.0007331050567522299, "loss": 2.487, "step": 22268 }, { "epoch": 0.6, "learning_rate": 0.000733021175861658, "loss": 2.6525, "step": 22269 }, { "epoch": 0.6, "learning_rate": 0.0007329372969936698, "loss": 2.4734, "step": 22270 }, { "epoch": 0.6, "learning_rate": 0.0007328534201489012, "loss": 2.38, "step": 22271 }, { "epoch": 0.6, "learning_rate": 0.0007327695453279873, "loss": 2.3551, "step": 22272 }, { "epoch": 0.6, "learning_rate": 0.0007326856725315634, "loss": 2.5648, "step": 22273 }, { "epoch": 0.6, "learning_rate": 0.0007326018017602653, "loss": 2.376, "step": 22274 }, { "epoch": 0.6, "learning_rate": 0.0007325179330147278, "loss": 2.1687, "step": 22275 }, { "epoch": 0.6, "learning_rate": 0.0007324340662955871, "loss": 2.3939, "step": 22276 }, { "epoch": 0.6, "learning_rate": 0.0007323502016034776, "loss": 1.9858, "step": 22277 }, { "epoch": 0.6, "learning_rate": 0.0007322663389390352, "loss": 2.2244, "step": 22278 }, { "epoch": 0.6, "learning_rate": 0.0007321824783028954, "loss": 2.9325, "step": 22279 }, { "epoch": 0.6, "learning_rate": 0.0007320986196956931, "loss": 2.3581, "step": 22280 }, { "epoch": 0.6, "learning_rate": 0.0007320147631180635, "loss": 2.7105, "step": 22281 }, { "epoch": 0.6, "learning_rate": 0.0007319309085706428, "loss": 2.6675, "step": 22282 }, { "epoch": 0.6, "learning_rate": 0.000731847056054065, "loss": 2.8839, "step": 22283 }, { "epoch": 0.6, "learning_rate": 0.0007317632055689662, "loss": 2.2488, "step": 22284 }, { "epoch": 0.6, "learning_rate": 0.0007316793571159815, "loss": 2.0734, "step": 22285 }, { "epoch": 0.6, "learning_rate": 0.0007315955106957457, "loss": 2.4362, "step": 22286 }, { "epoch": 0.6, "learning_rate": 0.0007315116663088949, "loss": 2.6527, "step": 22287 }, { "epoch": 0.6, "learning_rate": 0.000731427823956063, "loss": 2.2809, "step": 22288 }, { "epoch": 0.6, "learning_rate": 0.0007313439836378862, "loss": 2.7691, "step": 22289 }, { "epoch": 0.6, "learning_rate": 0.0007312601453549996, "loss": 2.9363, "step": 22290 }, { "epoch": 0.6, "learning_rate": 0.0007311763091080379, "loss": 2.3635, "step": 22291 }, { "epoch": 0.6, "learning_rate": 0.000731092474897636, "loss": 2.5335, "step": 22292 }, { "epoch": 0.6, "learning_rate": 0.0007310086427244302, "loss": 2.6238, "step": 22293 }, { "epoch": 0.6, "learning_rate": 0.0007309248125890544, "loss": 2.5993, "step": 22294 }, { "epoch": 0.6, "learning_rate": 0.0007308409844921442, "loss": 2.6169, "step": 22295 }, { "epoch": 0.6, "learning_rate": 0.0007307571584343345, "loss": 2.3199, "step": 22296 }, { "epoch": 0.6, "learning_rate": 0.0007306733344162604, "loss": 2.0017, "step": 22297 }, { "epoch": 0.6, "learning_rate": 0.0007305895124385572, "loss": 2.8079, "step": 22298 }, { "epoch": 0.6, "learning_rate": 0.0007305056925018593, "loss": 2.8447, "step": 22299 }, { "epoch": 0.6, "learning_rate": 0.0007304218746068023, "loss": 2.7617, "step": 22300 }, { "epoch": 0.6, "learning_rate": 0.0007303380587540212, "loss": 2.4307, "step": 22301 }, { "epoch": 0.6, "learning_rate": 0.0007302542449441505, "loss": 2.3744, "step": 22302 }, { "epoch": 0.6, "learning_rate": 0.0007301704331778258, "loss": 2.6216, "step": 22303 }, { "epoch": 0.6, "learning_rate": 0.0007300866234556813, "loss": 2.2965, "step": 22304 }, { "epoch": 0.6, "learning_rate": 0.000730002815778352, "loss": 2.5712, "step": 22305 }, { "epoch": 0.6, "learning_rate": 0.0007299190101464737, "loss": 2.348, "step": 22306 }, { "epoch": 0.6, "learning_rate": 0.0007298352065606803, "loss": 2.2553, "step": 22307 }, { "epoch": 0.6, "learning_rate": 0.0007297514050216072, "loss": 2.5178, "step": 22308 }, { "epoch": 0.6, "learning_rate": 0.0007296676055298892, "loss": 2.2186, "step": 22309 }, { "epoch": 0.6, "learning_rate": 0.0007295838080861609, "loss": 2.5215, "step": 22310 }, { "epoch": 0.6, "learning_rate": 0.0007295000126910576, "loss": 2.5479, "step": 22311 }, { "epoch": 0.6, "learning_rate": 0.0007294162193452136, "loss": 3.2324, "step": 22312 }, { "epoch": 0.6, "learning_rate": 0.000729332428049264, "loss": 2.7747, "step": 22313 }, { "epoch": 0.6, "learning_rate": 0.0007292486388038436, "loss": 2.418, "step": 22314 }, { "epoch": 0.6, "learning_rate": 0.000729164851609587, "loss": 2.4331, "step": 22315 }, { "epoch": 0.6, "learning_rate": 0.000729081066467129, "loss": 2.6594, "step": 22316 }, { "epoch": 0.6, "learning_rate": 0.000728997283377105, "loss": 2.723, "step": 22317 }, { "epoch": 0.6, "learning_rate": 0.0007289135023401483, "loss": 2.5482, "step": 22318 }, { "epoch": 0.6, "learning_rate": 0.0007288297233568953, "loss": 2.2437, "step": 22319 }, { "epoch": 0.6, "learning_rate": 0.0007287459464279791, "loss": 2.1746, "step": 22320 }, { "epoch": 0.6, "learning_rate": 0.0007286621715540353, "loss": 2.5149, "step": 22321 }, { "epoch": 0.6, "learning_rate": 0.0007285783987356986, "loss": 2.7721, "step": 22322 }, { "epoch": 0.6, "learning_rate": 0.0007284946279736031, "loss": 2.2728, "step": 22323 }, { "epoch": 0.6, "learning_rate": 0.0007284108592683838, "loss": 2.6962, "step": 22324 }, { "epoch": 0.6, "learning_rate": 0.0007283270926206755, "loss": 2.4893, "step": 22325 }, { "epoch": 0.6, "learning_rate": 0.0007282433280311125, "loss": 2.4064, "step": 22326 }, { "epoch": 0.6, "learning_rate": 0.0007281595655003292, "loss": 2.634, "step": 22327 }, { "epoch": 0.6, "learning_rate": 0.0007280758050289608, "loss": 2.5762, "step": 22328 }, { "epoch": 0.6, "learning_rate": 0.0007279920466176413, "loss": 2.3772, "step": 22329 }, { "epoch": 0.6, "learning_rate": 0.0007279082902670057, "loss": 2.6482, "step": 22330 }, { "epoch": 0.6, "learning_rate": 0.0007278245359776879, "loss": 2.6547, "step": 22331 }, { "epoch": 0.6, "learning_rate": 0.0007277407837503227, "loss": 2.1692, "step": 22332 }, { "epoch": 0.6, "learning_rate": 0.0007276570335855452, "loss": 2.4675, "step": 22333 }, { "epoch": 0.6, "learning_rate": 0.0007275732854839889, "loss": 1.9814, "step": 22334 }, { "epoch": 0.6, "learning_rate": 0.0007274895394462884, "loss": 2.6825, "step": 22335 }, { "epoch": 0.6, "learning_rate": 0.0007274057954730791, "loss": 2.2971, "step": 22336 }, { "epoch": 0.6, "learning_rate": 0.0007273220535649942, "loss": 2.4785, "step": 22337 }, { "epoch": 0.6, "learning_rate": 0.0007272383137226691, "loss": 2.786, "step": 22338 }, { "epoch": 0.6, "learning_rate": 0.0007271545759467375, "loss": 2.2865, "step": 22339 }, { "epoch": 0.6, "learning_rate": 0.0007270708402378341, "loss": 2.7214, "step": 22340 }, { "epoch": 0.6, "learning_rate": 0.0007269871065965933, "loss": 2.8961, "step": 22341 }, { "epoch": 0.6, "learning_rate": 0.0007269033750236493, "loss": 2.9871, "step": 22342 }, { "epoch": 0.6, "learning_rate": 0.0007268196455196363, "loss": 2.6, "step": 22343 }, { "epoch": 0.6, "learning_rate": 0.0007267359180851891, "loss": 2.58, "step": 22344 }, { "epoch": 0.6, "learning_rate": 0.0007266521927209418, "loss": 2.1954, "step": 22345 }, { "epoch": 0.6, "learning_rate": 0.0007265684694275288, "loss": 2.6855, "step": 22346 }, { "epoch": 0.6, "learning_rate": 0.0007264847482055836, "loss": 2.7302, "step": 22347 }, { "epoch": 0.6, "learning_rate": 0.000726401029055741, "loss": 2.561, "step": 22348 }, { "epoch": 0.6, "learning_rate": 0.000726317311978636, "loss": 2.5319, "step": 22349 }, { "epoch": 0.6, "learning_rate": 0.0007262335969749017, "loss": 2.4431, "step": 22350 }, { "epoch": 0.6, "learning_rate": 0.0007261498840451726, "loss": 2.5635, "step": 22351 }, { "epoch": 0.6, "learning_rate": 0.0007260661731900833, "loss": 2.5091, "step": 22352 }, { "epoch": 0.6, "learning_rate": 0.0007259824644102675, "loss": 2.8519, "step": 22353 }, { "epoch": 0.6, "learning_rate": 0.0007258987577063597, "loss": 2.4324, "step": 22354 }, { "epoch": 0.6, "learning_rate": 0.0007258150530789938, "loss": 2.5342, "step": 22355 }, { "epoch": 0.6, "learning_rate": 0.0007257313505288039, "loss": 2.3521, "step": 22356 }, { "epoch": 0.6, "learning_rate": 0.0007256476500564247, "loss": 2.2417, "step": 22357 }, { "epoch": 0.6, "learning_rate": 0.0007255639516624893, "loss": 2.0301, "step": 22358 }, { "epoch": 0.6, "learning_rate": 0.0007254802553476325, "loss": 2.3592, "step": 22359 }, { "epoch": 0.6, "learning_rate": 0.0007253965611124887, "loss": 2.7373, "step": 22360 }, { "epoch": 0.6, "learning_rate": 0.0007253128689576908, "loss": 2.5971, "step": 22361 }, { "epoch": 0.6, "learning_rate": 0.000725229178883874, "loss": 2.8685, "step": 22362 }, { "epoch": 0.6, "learning_rate": 0.0007251454908916717, "loss": 2.5046, "step": 22363 }, { "epoch": 0.6, "learning_rate": 0.0007250618049817177, "loss": 2.1639, "step": 22364 }, { "epoch": 0.6, "learning_rate": 0.0007249781211546467, "loss": 2.1339, "step": 22365 }, { "epoch": 0.6, "learning_rate": 0.0007248944394110921, "loss": 2.372, "step": 22366 }, { "epoch": 0.6, "learning_rate": 0.0007248107597516879, "loss": 2.525, "step": 22367 }, { "epoch": 0.6, "learning_rate": 0.0007247270821770684, "loss": 2.6164, "step": 22368 }, { "epoch": 0.6, "learning_rate": 0.000724643406687867, "loss": 2.5374, "step": 22369 }, { "epoch": 0.6, "learning_rate": 0.0007245597332847183, "loss": 2.38, "step": 22370 }, { "epoch": 0.6, "learning_rate": 0.0007244760619682558, "loss": 2.5823, "step": 22371 }, { "epoch": 0.6, "learning_rate": 0.0007243923927391132, "loss": 2.4548, "step": 22372 }, { "epoch": 0.6, "learning_rate": 0.000724308725597925, "loss": 2.4422, "step": 22373 }, { "epoch": 0.6, "learning_rate": 0.0007242250605453239, "loss": 2.5299, "step": 22374 }, { "epoch": 0.6, "learning_rate": 0.0007241413975819447, "loss": 2.5537, "step": 22375 }, { "epoch": 0.6, "learning_rate": 0.0007240577367084213, "loss": 2.3546, "step": 22376 }, { "epoch": 0.6, "learning_rate": 0.0007239740779253868, "loss": 2.5265, "step": 22377 }, { "epoch": 0.6, "learning_rate": 0.0007238904212334751, "loss": 2.5595, "step": 22378 }, { "epoch": 0.6, "learning_rate": 0.0007238067666333209, "loss": 2.5078, "step": 22379 }, { "epoch": 0.6, "learning_rate": 0.0007237231141255568, "loss": 2.6165, "step": 22380 }, { "epoch": 0.6, "learning_rate": 0.0007236394637108172, "loss": 2.5265, "step": 22381 }, { "epoch": 0.6, "learning_rate": 0.0007235558153897355, "loss": 2.7824, "step": 22382 }, { "epoch": 0.6, "learning_rate": 0.0007234721691629453, "loss": 2.4586, "step": 22383 }, { "epoch": 0.6, "learning_rate": 0.0007233885250310808, "loss": 2.6257, "step": 22384 }, { "epoch": 0.6, "learning_rate": 0.0007233048829947753, "loss": 2.3852, "step": 22385 }, { "epoch": 0.6, "learning_rate": 0.0007232212430546626, "loss": 2.6301, "step": 22386 }, { "epoch": 0.6, "learning_rate": 0.0007231376052113761, "loss": 2.1072, "step": 22387 }, { "epoch": 0.6, "learning_rate": 0.0007230539694655498, "loss": 2.3808, "step": 22388 }, { "epoch": 0.6, "learning_rate": 0.0007229703358178172, "loss": 2.3918, "step": 22389 }, { "epoch": 0.6, "learning_rate": 0.0007228867042688116, "loss": 2.2916, "step": 22390 }, { "epoch": 0.6, "learning_rate": 0.0007228030748191665, "loss": 2.528, "step": 22391 }, { "epoch": 0.6, "learning_rate": 0.0007227194474695164, "loss": 2.6294, "step": 22392 }, { "epoch": 0.6, "learning_rate": 0.0007226358222204938, "loss": 2.1409, "step": 22393 }, { "epoch": 0.6, "learning_rate": 0.0007225521990727326, "loss": 2.9995, "step": 22394 }, { "epoch": 0.6, "learning_rate": 0.0007224685780268666, "loss": 2.1087, "step": 22395 }, { "epoch": 0.6, "learning_rate": 0.0007223849590835287, "loss": 2.8231, "step": 22396 }, { "epoch": 0.6, "learning_rate": 0.0007223013422433531, "loss": 2.2816, "step": 22397 }, { "epoch": 0.6, "learning_rate": 0.0007222177275069726, "loss": 2.4431, "step": 22398 }, { "epoch": 0.6, "learning_rate": 0.0007221341148750209, "loss": 2.505, "step": 22399 }, { "epoch": 0.6, "learning_rate": 0.0007220505043481317, "loss": 2.2272, "step": 22400 }, { "epoch": 0.6, "learning_rate": 0.0007219668959269379, "loss": 2.3154, "step": 22401 }, { "epoch": 0.6, "learning_rate": 0.0007218832896120732, "loss": 2.6531, "step": 22402 }, { "epoch": 0.6, "learning_rate": 0.0007217996854041715, "loss": 2.5936, "step": 22403 }, { "epoch": 0.6, "learning_rate": 0.000721716083303865, "loss": 2.394, "step": 22404 }, { "epoch": 0.6, "learning_rate": 0.0007216324833117879, "loss": 2.6342, "step": 22405 }, { "epoch": 0.6, "learning_rate": 0.0007215488854285737, "loss": 2.543, "step": 22406 }, { "epoch": 0.6, "learning_rate": 0.000721465289654855, "loss": 2.8418, "step": 22407 }, { "epoch": 0.6, "learning_rate": 0.0007213816959912657, "loss": 2.7402, "step": 22408 }, { "epoch": 0.6, "learning_rate": 0.0007212981044384386, "loss": 2.5346, "step": 22409 }, { "epoch": 0.6, "learning_rate": 0.0007212145149970071, "loss": 2.3119, "step": 22410 }, { "epoch": 0.6, "learning_rate": 0.000721130927667605, "loss": 2.4161, "step": 22411 }, { "epoch": 0.6, "learning_rate": 0.0007210473424508649, "loss": 2.6526, "step": 22412 }, { "epoch": 0.6, "learning_rate": 0.0007209637593474201, "loss": 2.4705, "step": 22413 }, { "epoch": 0.6, "learning_rate": 0.0007208801783579044, "loss": 2.5131, "step": 22414 }, { "epoch": 0.6, "learning_rate": 0.0007207965994829503, "loss": 2.5413, "step": 22415 }, { "epoch": 0.6, "learning_rate": 0.0007207130227231916, "loss": 2.1258, "step": 22416 }, { "epoch": 0.6, "learning_rate": 0.0007206294480792605, "loss": 2.2062, "step": 22417 }, { "epoch": 0.6, "learning_rate": 0.0007205458755517911, "loss": 2.3095, "step": 22418 }, { "epoch": 0.6, "learning_rate": 0.0007204623051414163, "loss": 2.6933, "step": 22419 }, { "epoch": 0.6, "learning_rate": 0.0007203787368487689, "loss": 2.6561, "step": 22420 }, { "epoch": 0.6, "learning_rate": 0.0007202951706744821, "loss": 2.4687, "step": 22421 }, { "epoch": 0.6, "learning_rate": 0.0007202116066191895, "loss": 2.4946, "step": 22422 }, { "epoch": 0.6, "learning_rate": 0.0007201280446835234, "loss": 2.2091, "step": 22423 }, { "epoch": 0.6, "learning_rate": 0.0007200444848681173, "loss": 2.8369, "step": 22424 }, { "epoch": 0.6, "learning_rate": 0.000719960927173604, "loss": 2.4366, "step": 22425 }, { "epoch": 0.6, "learning_rate": 0.0007198773716006167, "loss": 2.5891, "step": 22426 }, { "epoch": 0.6, "learning_rate": 0.0007197938181497885, "loss": 2.4503, "step": 22427 }, { "epoch": 0.6, "learning_rate": 0.0007197102668217521, "loss": 2.5518, "step": 22428 }, { "epoch": 0.6, "learning_rate": 0.0007196267176171405, "loss": 2.3292, "step": 22429 }, { "epoch": 0.6, "learning_rate": 0.000719543170536587, "loss": 2.8803, "step": 22430 }, { "epoch": 0.6, "learning_rate": 0.0007194596255807243, "loss": 2.8245, "step": 22431 }, { "epoch": 0.6, "learning_rate": 0.0007193760827501854, "loss": 2.7289, "step": 22432 }, { "epoch": 0.6, "learning_rate": 0.0007192925420456027, "loss": 3.0068, "step": 22433 }, { "epoch": 0.6, "learning_rate": 0.0007192090034676096, "loss": 2.3179, "step": 22434 }, { "epoch": 0.6, "learning_rate": 0.0007191254670168394, "loss": 2.6172, "step": 22435 }, { "epoch": 0.6, "learning_rate": 0.0007190419326939241, "loss": 2.7541, "step": 22436 }, { "epoch": 0.6, "learning_rate": 0.0007189584004994964, "loss": 2.6246, "step": 22437 }, { "epoch": 0.6, "learning_rate": 0.0007188748704341905, "loss": 2.5164, "step": 22438 }, { "epoch": 0.6, "learning_rate": 0.0007187913424986378, "loss": 2.5229, "step": 22439 }, { "epoch": 0.6, "learning_rate": 0.0007187078166934717, "loss": 2.6781, "step": 22440 }, { "epoch": 0.6, "learning_rate": 0.0007186242930193251, "loss": 2.197, "step": 22441 }, { "epoch": 0.6, "learning_rate": 0.0007185407714768303, "loss": 2.7088, "step": 22442 }, { "epoch": 0.6, "learning_rate": 0.0007184572520666205, "loss": 2.5321, "step": 22443 }, { "epoch": 0.6, "learning_rate": 0.000718373734789328, "loss": 2.5411, "step": 22444 }, { "epoch": 0.6, "learning_rate": 0.0007182902196455857, "loss": 2.7449, "step": 22445 }, { "epoch": 0.6, "learning_rate": 0.0007182067066360266, "loss": 2.3443, "step": 22446 }, { "epoch": 0.6, "learning_rate": 0.0007181231957612828, "loss": 2.7337, "step": 22447 }, { "epoch": 0.6, "learning_rate": 0.0007180396870219874, "loss": 2.5244, "step": 22448 }, { "epoch": 0.6, "learning_rate": 0.0007179561804187733, "loss": 2.6216, "step": 22449 }, { "epoch": 0.6, "learning_rate": 0.0007178726759522723, "loss": 2.2166, "step": 22450 }, { "epoch": 0.6, "learning_rate": 0.0007177891736231178, "loss": 2.7012, "step": 22451 }, { "epoch": 0.6, "learning_rate": 0.0007177056734319418, "loss": 2.5021, "step": 22452 }, { "epoch": 0.6, "learning_rate": 0.000717622175379377, "loss": 2.9978, "step": 22453 }, { "epoch": 0.6, "learning_rate": 0.0007175386794660565, "loss": 2.5122, "step": 22454 }, { "epoch": 0.6, "learning_rate": 0.0007174551856926121, "loss": 2.7188, "step": 22455 }, { "epoch": 0.6, "learning_rate": 0.0007173716940596769, "loss": 2.5095, "step": 22456 }, { "epoch": 0.6, "learning_rate": 0.0007172882045678832, "loss": 2.3332, "step": 22457 }, { "epoch": 0.6, "learning_rate": 0.0007172047172178635, "loss": 1.9844, "step": 22458 }, { "epoch": 0.6, "learning_rate": 0.0007171212320102505, "loss": 2.3688, "step": 22459 }, { "epoch": 0.6, "learning_rate": 0.0007170377489456762, "loss": 2.1857, "step": 22460 }, { "epoch": 0.6, "learning_rate": 0.0007169542680247734, "loss": 2.5339, "step": 22461 }, { "epoch": 0.6, "learning_rate": 0.0007168707892481747, "loss": 2.1822, "step": 22462 }, { "epoch": 0.6, "learning_rate": 0.0007167873126165119, "loss": 2.4536, "step": 22463 }, { "epoch": 0.6, "learning_rate": 0.0007167038381304178, "loss": 2.795, "step": 22464 }, { "epoch": 0.6, "learning_rate": 0.0007166203657905252, "loss": 2.5776, "step": 22465 }, { "epoch": 0.6, "learning_rate": 0.0007165368955974656, "loss": 2.412, "step": 22466 }, { "epoch": 0.6, "learning_rate": 0.0007164534275518722, "loss": 2.5378, "step": 22467 }, { "epoch": 0.6, "learning_rate": 0.0007163699616543766, "loss": 2.6122, "step": 22468 }, { "epoch": 0.6, "learning_rate": 0.0007162864979056114, "loss": 2.2217, "step": 22469 }, { "epoch": 0.6, "learning_rate": 0.0007162030363062093, "loss": 2.3353, "step": 22470 }, { "epoch": 0.6, "learning_rate": 0.0007161195768568021, "loss": 2.5456, "step": 22471 }, { "epoch": 0.6, "learning_rate": 0.0007160361195580221, "loss": 2.1098, "step": 22472 }, { "epoch": 0.6, "learning_rate": 0.0007159526644105019, "loss": 2.227, "step": 22473 }, { "epoch": 0.6, "learning_rate": 0.0007158692114148734, "loss": 2.7394, "step": 22474 }, { "epoch": 0.6, "learning_rate": 0.0007157857605717692, "loss": 2.2952, "step": 22475 }, { "epoch": 0.6, "learning_rate": 0.0007157023118818209, "loss": 2.2119, "step": 22476 }, { "epoch": 0.6, "learning_rate": 0.0007156188653456611, "loss": 2.7371, "step": 22477 }, { "epoch": 0.6, "learning_rate": 0.0007155354209639225, "loss": 2.7131, "step": 22478 }, { "epoch": 0.6, "learning_rate": 0.0007154519787372361, "loss": 2.3723, "step": 22479 }, { "epoch": 0.6, "learning_rate": 0.0007153685386662345, "loss": 2.7364, "step": 22480 }, { "epoch": 0.6, "learning_rate": 0.0007152851007515506, "loss": 2.5273, "step": 22481 }, { "epoch": 0.6, "learning_rate": 0.0007152016649938154, "loss": 2.1627, "step": 22482 }, { "epoch": 0.6, "learning_rate": 0.0007151182313936615, "loss": 2.3525, "step": 22483 }, { "epoch": 0.6, "learning_rate": 0.0007150347999517212, "loss": 2.7234, "step": 22484 }, { "epoch": 0.6, "learning_rate": 0.000714951370668626, "loss": 2.5808, "step": 22485 }, { "epoch": 0.6, "learning_rate": 0.0007148679435450085, "loss": 2.4996, "step": 22486 }, { "epoch": 0.6, "learning_rate": 0.0007147845185815004, "loss": 2.4696, "step": 22487 }, { "epoch": 0.6, "learning_rate": 0.0007147010957787337, "loss": 2.4056, "step": 22488 }, { "epoch": 0.6, "learning_rate": 0.0007146176751373406, "loss": 2.6157, "step": 22489 }, { "epoch": 0.6, "learning_rate": 0.0007145342566579529, "loss": 2.764, "step": 22490 }, { "epoch": 0.6, "learning_rate": 0.0007144508403412027, "loss": 2.764, "step": 22491 }, { "epoch": 0.6, "learning_rate": 0.0007143674261877222, "loss": 2.791, "step": 22492 }, { "epoch": 0.6, "learning_rate": 0.0007142840141981424, "loss": 2.2147, "step": 22493 }, { "epoch": 0.6, "learning_rate": 0.0007142006043730964, "loss": 2.8422, "step": 22494 }, { "epoch": 0.6, "learning_rate": 0.0007141171967132152, "loss": 2.8349, "step": 22495 }, { "epoch": 0.6, "learning_rate": 0.0007140337912191308, "loss": 2.5814, "step": 22496 }, { "epoch": 0.6, "learning_rate": 0.0007139503878914758, "loss": 2.3961, "step": 22497 }, { "epoch": 0.6, "learning_rate": 0.000713866986730881, "loss": 2.6664, "step": 22498 }, { "epoch": 0.6, "learning_rate": 0.0007137835877379789, "loss": 2.2413, "step": 22499 }, { "epoch": 0.6, "learning_rate": 0.0007137001909134014, "loss": 2.5313, "step": 22500 }, { "epoch": 0.6, "learning_rate": 0.0007136167962577798, "loss": 2.7506, "step": 22501 }, { "epoch": 0.6, "learning_rate": 0.0007135334037717464, "loss": 2.2485, "step": 22502 }, { "epoch": 0.6, "learning_rate": 0.0007134500134559326, "loss": 2.3368, "step": 22503 }, { "epoch": 0.6, "learning_rate": 0.0007133666253109701, "loss": 2.565, "step": 22504 }, { "epoch": 0.6, "learning_rate": 0.0007132832393374913, "loss": 2.2599, "step": 22505 }, { "epoch": 0.6, "learning_rate": 0.0007131998555361267, "loss": 2.498, "step": 22506 }, { "epoch": 0.6, "learning_rate": 0.0007131164739075091, "loss": 2.3786, "step": 22507 }, { "epoch": 0.6, "learning_rate": 0.0007130330944522701, "loss": 2.6823, "step": 22508 }, { "epoch": 0.6, "learning_rate": 0.0007129497171710406, "loss": 2.8377, "step": 22509 }, { "epoch": 0.6, "learning_rate": 0.0007128663420644531, "loss": 2.3, "step": 22510 }, { "epoch": 0.6, "learning_rate": 0.0007127829691331386, "loss": 2.6526, "step": 22511 }, { "epoch": 0.6, "learning_rate": 0.0007126995983777289, "loss": 2.5572, "step": 22512 }, { "epoch": 0.61, "learning_rate": 0.0007126162297988558, "loss": 2.4137, "step": 22513 }, { "epoch": 0.61, "learning_rate": 0.0007125328633971509, "loss": 2.7208, "step": 22514 }, { "epoch": 0.61, "learning_rate": 0.0007124494991732453, "loss": 2.4585, "step": 22515 }, { "epoch": 0.61, "learning_rate": 0.0007123661371277712, "loss": 2.8187, "step": 22516 }, { "epoch": 0.61, "learning_rate": 0.0007122827772613596, "loss": 2.6359, "step": 22517 }, { "epoch": 0.61, "learning_rate": 0.0007121994195746424, "loss": 2.6487, "step": 22518 }, { "epoch": 0.61, "learning_rate": 0.0007121160640682509, "loss": 1.8383, "step": 22519 }, { "epoch": 0.61, "learning_rate": 0.0007120327107428166, "loss": 2.3357, "step": 22520 }, { "epoch": 0.61, "learning_rate": 0.0007119493595989713, "loss": 2.7983, "step": 22521 }, { "epoch": 0.61, "learning_rate": 0.0007118660106373458, "loss": 2.4779, "step": 22522 }, { "epoch": 0.61, "learning_rate": 0.0007117826638585717, "loss": 2.5256, "step": 22523 }, { "epoch": 0.61, "learning_rate": 0.0007116993192632813, "loss": 2.5239, "step": 22524 }, { "epoch": 0.61, "learning_rate": 0.0007116159768521047, "loss": 2.3701, "step": 22525 }, { "epoch": 0.61, "learning_rate": 0.000711532636625674, "loss": 2.5175, "step": 22526 }, { "epoch": 0.61, "learning_rate": 0.0007114492985846207, "loss": 2.8233, "step": 22527 }, { "epoch": 0.61, "learning_rate": 0.0007113659627295757, "loss": 2.427, "step": 22528 }, { "epoch": 0.61, "learning_rate": 0.0007112826290611707, "loss": 2.4782, "step": 22529 }, { "epoch": 0.61, "learning_rate": 0.0007111992975800368, "loss": 2.135, "step": 22530 }, { "epoch": 0.61, "learning_rate": 0.0007111159682868053, "loss": 2.5083, "step": 22531 }, { "epoch": 0.61, "learning_rate": 0.0007110326411821078, "loss": 2.9356, "step": 22532 }, { "epoch": 0.61, "learning_rate": 0.0007109493162665752, "loss": 2.9311, "step": 22533 }, { "epoch": 0.61, "learning_rate": 0.0007108659935408389, "loss": 2.91, "step": 22534 }, { "epoch": 0.61, "learning_rate": 0.0007107826730055305, "loss": 2.2101, "step": 22535 }, { "epoch": 0.61, "learning_rate": 0.0007106993546612803, "loss": 2.517, "step": 22536 }, { "epoch": 0.61, "learning_rate": 0.0007106160385087206, "loss": 2.045, "step": 22537 }, { "epoch": 0.61, "learning_rate": 0.0007105327245484817, "loss": 2.436, "step": 22538 }, { "epoch": 0.61, "learning_rate": 0.0007104494127811951, "loss": 2.272, "step": 22539 }, { "epoch": 0.61, "learning_rate": 0.0007103661032074922, "loss": 2.9234, "step": 22540 }, { "epoch": 0.61, "learning_rate": 0.0007102827958280038, "loss": 2.6295, "step": 22541 }, { "epoch": 0.61, "learning_rate": 0.0007101994906433611, "loss": 2.505, "step": 22542 }, { "epoch": 0.61, "learning_rate": 0.0007101161876541952, "loss": 2.5813, "step": 22543 }, { "epoch": 0.61, "learning_rate": 0.0007100328868611375, "loss": 2.6812, "step": 22544 }, { "epoch": 0.61, "learning_rate": 0.0007099495882648186, "loss": 2.7087, "step": 22545 }, { "epoch": 0.61, "learning_rate": 0.0007098662918658698, "loss": 2.3259, "step": 22546 }, { "epoch": 0.61, "learning_rate": 0.000709782997664922, "loss": 2.7769, "step": 22547 }, { "epoch": 0.61, "learning_rate": 0.0007096997056626066, "loss": 2.5737, "step": 22548 }, { "epoch": 0.61, "learning_rate": 0.000709616415859554, "loss": 2.3977, "step": 22549 }, { "epoch": 0.61, "learning_rate": 0.0007095331282563956, "loss": 2.3071, "step": 22550 }, { "epoch": 0.61, "learning_rate": 0.0007094498428537627, "loss": 2.3227, "step": 22551 }, { "epoch": 0.61, "learning_rate": 0.0007093665596522854, "loss": 2.4078, "step": 22552 }, { "epoch": 0.61, "learning_rate": 0.0007092832786525949, "loss": 2.7295, "step": 22553 }, { "epoch": 0.61, "learning_rate": 0.0007091999998553229, "loss": 2.2351, "step": 22554 }, { "epoch": 0.61, "learning_rate": 0.0007091167232610993, "loss": 2.181, "step": 22555 }, { "epoch": 0.61, "learning_rate": 0.0007090334488705556, "loss": 2.3785, "step": 22556 }, { "epoch": 0.61, "learning_rate": 0.0007089501766843224, "loss": 2.0609, "step": 22557 }, { "epoch": 0.61, "learning_rate": 0.0007088669067030304, "loss": 2.2433, "step": 22558 }, { "epoch": 0.61, "learning_rate": 0.0007087836389273111, "loss": 2.1667, "step": 22559 }, { "epoch": 0.61, "learning_rate": 0.0007087003733577946, "loss": 1.9792, "step": 22560 }, { "epoch": 0.61, "learning_rate": 0.000708617109995112, "loss": 2.0287, "step": 22561 }, { "epoch": 0.61, "learning_rate": 0.0007085338488398942, "loss": 2.6507, "step": 22562 }, { "epoch": 0.61, "learning_rate": 0.0007084505898927717, "loss": 2.1761, "step": 22563 }, { "epoch": 0.61, "learning_rate": 0.0007083673331543758, "loss": 2.4857, "step": 22564 }, { "epoch": 0.61, "learning_rate": 0.0007082840786253364, "loss": 2.4645, "step": 22565 }, { "epoch": 0.61, "learning_rate": 0.0007082008263062845, "loss": 2.9284, "step": 22566 }, { "epoch": 0.61, "learning_rate": 0.0007081175761978517, "loss": 2.7699, "step": 22567 }, { "epoch": 0.61, "learning_rate": 0.0007080343283006674, "loss": 2.374, "step": 22568 }, { "epoch": 0.61, "learning_rate": 0.0007079510826153629, "loss": 3.0216, "step": 22569 }, { "epoch": 0.61, "learning_rate": 0.0007078678391425691, "loss": 2.6737, "step": 22570 }, { "epoch": 0.61, "learning_rate": 0.0007077845978829158, "loss": 2.8159, "step": 22571 }, { "epoch": 0.61, "learning_rate": 0.0007077013588370346, "loss": 3.0144, "step": 22572 }, { "epoch": 0.61, "learning_rate": 0.0007076181220055553, "loss": 2.2425, "step": 22573 }, { "epoch": 0.61, "learning_rate": 0.000707534887389109, "loss": 2.9458, "step": 22574 }, { "epoch": 0.61, "learning_rate": 0.0007074516549883261, "loss": 2.5346, "step": 22575 }, { "epoch": 0.61, "learning_rate": 0.0007073684248038371, "loss": 2.528, "step": 22576 }, { "epoch": 0.61, "learning_rate": 0.0007072851968362725, "loss": 2.8194, "step": 22577 }, { "epoch": 0.61, "learning_rate": 0.0007072019710862635, "loss": 2.6324, "step": 22578 }, { "epoch": 0.61, "learning_rate": 0.0007071187475544393, "loss": 2.8815, "step": 22579 }, { "epoch": 0.61, "learning_rate": 0.0007070355262414318, "loss": 2.2587, "step": 22580 }, { "epoch": 0.61, "learning_rate": 0.0007069523071478702, "loss": 2.4346, "step": 22581 }, { "epoch": 0.61, "learning_rate": 0.0007068690902743856, "loss": 2.4007, "step": 22582 }, { "epoch": 0.61, "learning_rate": 0.0007067858756216086, "loss": 2.9371, "step": 22583 }, { "epoch": 0.61, "learning_rate": 0.0007067026631901691, "loss": 2.5474, "step": 22584 }, { "epoch": 0.61, "learning_rate": 0.000706619452980698, "loss": 2.311, "step": 22585 }, { "epoch": 0.61, "learning_rate": 0.0007065362449938255, "loss": 2.4468, "step": 22586 }, { "epoch": 0.61, "learning_rate": 0.0007064530392301818, "loss": 2.3255, "step": 22587 }, { "epoch": 0.61, "learning_rate": 0.0007063698356903973, "loss": 2.6258, "step": 22588 }, { "epoch": 0.61, "learning_rate": 0.0007062866343751027, "loss": 2.696, "step": 22589 }, { "epoch": 0.61, "learning_rate": 0.0007062034352849278, "loss": 2.2029, "step": 22590 }, { "epoch": 0.61, "learning_rate": 0.0007061202384205035, "loss": 2.5411, "step": 22591 }, { "epoch": 0.61, "learning_rate": 0.0007060370437824593, "loss": 2.3489, "step": 22592 }, { "epoch": 0.61, "learning_rate": 0.0007059538513714261, "loss": 2.8122, "step": 22593 }, { "epoch": 0.61, "learning_rate": 0.0007058706611880343, "loss": 2.4538, "step": 22594 }, { "epoch": 0.61, "learning_rate": 0.0007057874732329131, "loss": 2.5348, "step": 22595 }, { "epoch": 0.61, "learning_rate": 0.0007057042875066937, "loss": 2.4263, "step": 22596 }, { "epoch": 0.61, "learning_rate": 0.0007056211040100063, "loss": 2.1593, "step": 22597 }, { "epoch": 0.61, "learning_rate": 0.0007055379227434804, "loss": 1.9203, "step": 22598 }, { "epoch": 0.61, "learning_rate": 0.0007054547437077469, "loss": 2.7664, "step": 22599 }, { "epoch": 0.61, "learning_rate": 0.0007053715669034353, "loss": 2.536, "step": 22600 }, { "epoch": 0.61, "learning_rate": 0.0007052883923311759, "loss": 2.2994, "step": 22601 }, { "epoch": 0.61, "learning_rate": 0.0007052052199915994, "loss": 2.8759, "step": 22602 }, { "epoch": 0.61, "learning_rate": 0.0007051220498853351, "loss": 2.644, "step": 22603 }, { "epoch": 0.61, "learning_rate": 0.0007050388820130135, "loss": 2.5912, "step": 22604 }, { "epoch": 0.61, "learning_rate": 0.0007049557163752647, "loss": 2.7771, "step": 22605 }, { "epoch": 0.61, "learning_rate": 0.0007048725529727186, "loss": 3.1378, "step": 22606 }, { "epoch": 0.61, "learning_rate": 0.0007047893918060055, "loss": 2.6418, "step": 22607 }, { "epoch": 0.61, "learning_rate": 0.0007047062328757547, "loss": 2.712, "step": 22608 }, { "epoch": 0.61, "learning_rate": 0.0007046230761825969, "loss": 2.8484, "step": 22609 }, { "epoch": 0.61, "learning_rate": 0.0007045399217271622, "loss": 2.294, "step": 22610 }, { "epoch": 0.61, "learning_rate": 0.0007044567695100799, "loss": 2.6408, "step": 22611 }, { "epoch": 0.61, "learning_rate": 0.00070437361953198, "loss": 2.4281, "step": 22612 }, { "epoch": 0.61, "learning_rate": 0.0007042904717934933, "loss": 2.8139, "step": 22613 }, { "epoch": 0.61, "learning_rate": 0.0007042073262952487, "loss": 2.7556, "step": 22614 }, { "epoch": 0.61, "learning_rate": 0.0007041241830378768, "loss": 2.4302, "step": 22615 }, { "epoch": 0.61, "learning_rate": 0.0007040410420220069, "loss": 1.9204, "step": 22616 }, { "epoch": 0.61, "learning_rate": 0.0007039579032482692, "loss": 3.2908, "step": 22617 }, { "epoch": 0.61, "learning_rate": 0.0007038747667172938, "loss": 2.2325, "step": 22618 }, { "epoch": 0.61, "learning_rate": 0.00070379163242971, "loss": 2.3137, "step": 22619 }, { "epoch": 0.61, "learning_rate": 0.0007037085003861476, "loss": 2.077, "step": 22620 }, { "epoch": 0.61, "learning_rate": 0.000703625370587237, "loss": 2.7341, "step": 22621 }, { "epoch": 0.61, "learning_rate": 0.0007035422430336075, "loss": 2.8244, "step": 22622 }, { "epoch": 0.61, "learning_rate": 0.0007034591177258893, "loss": 2.8135, "step": 22623 }, { "epoch": 0.61, "learning_rate": 0.0007033759946647114, "loss": 2.3896, "step": 22624 }, { "epoch": 0.61, "learning_rate": 0.0007032928738507036, "loss": 2.597, "step": 22625 }, { "epoch": 0.61, "learning_rate": 0.0007032097552844967, "loss": 2.7502, "step": 22626 }, { "epoch": 0.61, "learning_rate": 0.0007031266389667193, "loss": 2.1126, "step": 22627 }, { "epoch": 0.61, "learning_rate": 0.0007030435248980011, "loss": 2.3876, "step": 22628 }, { "epoch": 0.61, "learning_rate": 0.0007029604130789725, "loss": 2.1694, "step": 22629 }, { "epoch": 0.61, "learning_rate": 0.0007028773035102625, "loss": 2.3403, "step": 22630 }, { "epoch": 0.61, "learning_rate": 0.0007027941961925008, "loss": 2.6028, "step": 22631 }, { "epoch": 0.61, "learning_rate": 0.0007027110911263175, "loss": 2.5473, "step": 22632 }, { "epoch": 0.61, "learning_rate": 0.0007026279883123415, "loss": 2.5921, "step": 22633 }, { "epoch": 0.61, "learning_rate": 0.0007025448877512031, "loss": 2.446, "step": 22634 }, { "epoch": 0.61, "learning_rate": 0.000702461789443531, "loss": 2.301, "step": 22635 }, { "epoch": 0.61, "learning_rate": 0.0007023786933899552, "loss": 2.2078, "step": 22636 }, { "epoch": 0.61, "learning_rate": 0.0007022955995911057, "loss": 2.26, "step": 22637 }, { "epoch": 0.61, "learning_rate": 0.0007022125080476109, "loss": 2.3579, "step": 22638 }, { "epoch": 0.61, "learning_rate": 0.0007021294187601012, "loss": 2.3037, "step": 22639 }, { "epoch": 0.61, "learning_rate": 0.0007020463317292061, "loss": 2.2067, "step": 22640 }, { "epoch": 0.61, "learning_rate": 0.0007019632469555542, "loss": 2.219, "step": 22641 }, { "epoch": 0.61, "learning_rate": 0.0007018801644397758, "loss": 2.3235, "step": 22642 }, { "epoch": 0.61, "learning_rate": 0.0007017970841824996, "loss": 2.4609, "step": 22643 }, { "epoch": 0.61, "learning_rate": 0.0007017140061843556, "loss": 2.6376, "step": 22644 }, { "epoch": 0.61, "learning_rate": 0.000701630930445973, "loss": 2.4749, "step": 22645 }, { "epoch": 0.61, "learning_rate": 0.000701547856967981, "loss": 2.5483, "step": 22646 }, { "epoch": 0.61, "learning_rate": 0.0007014647857510091, "loss": 2.4505, "step": 22647 }, { "epoch": 0.61, "learning_rate": 0.0007013817167956869, "loss": 2.9528, "step": 22648 }, { "epoch": 0.61, "learning_rate": 0.000701298650102643, "loss": 2.491, "step": 22649 }, { "epoch": 0.61, "learning_rate": 0.0007012155856725076, "loss": 2.0525, "step": 22650 }, { "epoch": 0.61, "learning_rate": 0.0007011325235059089, "loss": 2.4994, "step": 22651 }, { "epoch": 0.61, "learning_rate": 0.000701049463603477, "loss": 3.1947, "step": 22652 }, { "epoch": 0.61, "learning_rate": 0.0007009664059658414, "loss": 2.7337, "step": 22653 }, { "epoch": 0.61, "learning_rate": 0.0007008833505936303, "loss": 2.5865, "step": 22654 }, { "epoch": 0.61, "learning_rate": 0.0007008002974874735, "loss": 2.861, "step": 22655 }, { "epoch": 0.61, "learning_rate": 0.0007007172466480005, "loss": 2.4251, "step": 22656 }, { "epoch": 0.61, "learning_rate": 0.0007006341980758397, "loss": 2.8605, "step": 22657 }, { "epoch": 0.61, "learning_rate": 0.000700551151771621, "loss": 2.4239, "step": 22658 }, { "epoch": 0.61, "learning_rate": 0.0007004681077359731, "loss": 2.5249, "step": 22659 }, { "epoch": 0.61, "learning_rate": 0.0007003850659695252, "loss": 2.2989, "step": 22660 }, { "epoch": 0.61, "learning_rate": 0.0007003020264729067, "loss": 2.6647, "step": 22661 }, { "epoch": 0.61, "learning_rate": 0.0007002189892467462, "loss": 3.0344, "step": 22662 }, { "epoch": 0.61, "learning_rate": 0.0007001359542916731, "loss": 2.9532, "step": 22663 }, { "epoch": 0.61, "learning_rate": 0.0007000529216083166, "loss": 2.4582, "step": 22664 }, { "epoch": 0.61, "learning_rate": 0.0006999698911973053, "loss": 2.3452, "step": 22665 }, { "epoch": 0.61, "learning_rate": 0.0006998868630592685, "loss": 2.1186, "step": 22666 }, { "epoch": 0.61, "learning_rate": 0.0006998038371948356, "loss": 2.5776, "step": 22667 }, { "epoch": 0.61, "learning_rate": 0.0006997208136046344, "loss": 2.6583, "step": 22668 }, { "epoch": 0.61, "learning_rate": 0.0006996377922892955, "loss": 2.3412, "step": 22669 }, { "epoch": 0.61, "learning_rate": 0.0006995547732494464, "loss": 2.6891, "step": 22670 }, { "epoch": 0.61, "learning_rate": 0.0006994717564857167, "loss": 1.9984, "step": 22671 }, { "epoch": 0.61, "learning_rate": 0.0006993887419987354, "loss": 2.6857, "step": 22672 }, { "epoch": 0.61, "learning_rate": 0.000699305729789131, "loss": 2.6691, "step": 22673 }, { "epoch": 0.61, "learning_rate": 0.0006992227198575327, "loss": 2.3464, "step": 22674 }, { "epoch": 0.61, "learning_rate": 0.0006991397122045695, "loss": 3.1097, "step": 22675 }, { "epoch": 0.61, "learning_rate": 0.0006990567068308698, "loss": 2.7126, "step": 22676 }, { "epoch": 0.61, "learning_rate": 0.000698973703737063, "loss": 2.6074, "step": 22677 }, { "epoch": 0.61, "learning_rate": 0.0006988907029237772, "loss": 2.4192, "step": 22678 }, { "epoch": 0.61, "learning_rate": 0.0006988077043916418, "loss": 2.342, "step": 22679 }, { "epoch": 0.61, "learning_rate": 0.0006987247081412857, "loss": 2.6548, "step": 22680 }, { "epoch": 0.61, "learning_rate": 0.0006986417141733367, "loss": 2.5229, "step": 22681 }, { "epoch": 0.61, "learning_rate": 0.0006985587224884244, "loss": 2.4572, "step": 22682 }, { "epoch": 0.61, "learning_rate": 0.0006984757330871778, "loss": 2.7272, "step": 22683 }, { "epoch": 0.61, "learning_rate": 0.0006983927459702249, "loss": 2.6306, "step": 22684 }, { "epoch": 0.61, "learning_rate": 0.0006983097611381945, "loss": 2.0913, "step": 22685 }, { "epoch": 0.61, "learning_rate": 0.0006982267785917153, "loss": 2.4112, "step": 22686 }, { "epoch": 0.61, "learning_rate": 0.0006981437983314163, "loss": 2.6198, "step": 22687 }, { "epoch": 0.61, "learning_rate": 0.0006980608203579259, "loss": 2.5633, "step": 22688 }, { "epoch": 0.61, "learning_rate": 0.0006979778446718725, "loss": 2.8761, "step": 22689 }, { "epoch": 0.61, "learning_rate": 0.0006978948712738851, "loss": 2.7744, "step": 22690 }, { "epoch": 0.61, "learning_rate": 0.0006978119001645924, "loss": 2.4041, "step": 22691 }, { "epoch": 0.61, "learning_rate": 0.0006977289313446223, "loss": 2.086, "step": 22692 }, { "epoch": 0.61, "learning_rate": 0.0006976459648146043, "loss": 2.512, "step": 22693 }, { "epoch": 0.61, "learning_rate": 0.0006975630005751659, "loss": 2.4759, "step": 22694 }, { "epoch": 0.61, "learning_rate": 0.0006974800386269362, "loss": 2.7039, "step": 22695 }, { "epoch": 0.61, "learning_rate": 0.0006973970789705441, "loss": 2.7297, "step": 22696 }, { "epoch": 0.61, "learning_rate": 0.0006973141216066172, "loss": 2.6151, "step": 22697 }, { "epoch": 0.61, "learning_rate": 0.0006972311665357843, "loss": 2.1772, "step": 22698 }, { "epoch": 0.61, "learning_rate": 0.0006971482137586744, "loss": 3.1232, "step": 22699 }, { "epoch": 0.61, "learning_rate": 0.0006970652632759151, "loss": 2.638, "step": 22700 }, { "epoch": 0.61, "learning_rate": 0.0006969823150881352, "loss": 2.5421, "step": 22701 }, { "epoch": 0.61, "learning_rate": 0.0006968993691959635, "loss": 2.2772, "step": 22702 }, { "epoch": 0.61, "learning_rate": 0.0006968164256000276, "loss": 2.5404, "step": 22703 }, { "epoch": 0.61, "learning_rate": 0.0006967334843009565, "loss": 2.3762, "step": 22704 }, { "epoch": 0.61, "learning_rate": 0.0006966505452993781, "loss": 2.4018, "step": 22705 }, { "epoch": 0.61, "learning_rate": 0.000696567608595921, "loss": 2.3711, "step": 22706 }, { "epoch": 0.61, "learning_rate": 0.0006964846741912134, "loss": 2.5606, "step": 22707 }, { "epoch": 0.61, "learning_rate": 0.0006964017420858837, "loss": 2.3157, "step": 22708 }, { "epoch": 0.61, "learning_rate": 0.0006963188122805601, "loss": 1.9396, "step": 22709 }, { "epoch": 0.61, "learning_rate": 0.0006962358847758712, "loss": 2.8251, "step": 22710 }, { "epoch": 0.61, "learning_rate": 0.0006961529595724444, "loss": 2.2439, "step": 22711 }, { "epoch": 0.61, "learning_rate": 0.0006960700366709091, "loss": 2.0514, "step": 22712 }, { "epoch": 0.61, "learning_rate": 0.0006959871160718923, "loss": 2.6842, "step": 22713 }, { "epoch": 0.61, "learning_rate": 0.000695904197776023, "loss": 2.685, "step": 22714 }, { "epoch": 0.61, "learning_rate": 0.0006958212817839291, "loss": 2.7364, "step": 22715 }, { "epoch": 0.61, "learning_rate": 0.0006957383680962386, "loss": 1.9486, "step": 22716 }, { "epoch": 0.61, "learning_rate": 0.00069565545671358, "loss": 2.3827, "step": 22717 }, { "epoch": 0.61, "learning_rate": 0.0006955725476365813, "loss": 2.692, "step": 22718 }, { "epoch": 0.61, "learning_rate": 0.0006954896408658704, "loss": 2.3539, "step": 22719 }, { "epoch": 0.61, "learning_rate": 0.0006954067364020758, "loss": 2.4938, "step": 22720 }, { "epoch": 0.61, "learning_rate": 0.0006953238342458251, "loss": 2.3992, "step": 22721 }, { "epoch": 0.61, "learning_rate": 0.0006952409343977464, "loss": 2.2076, "step": 22722 }, { "epoch": 0.61, "learning_rate": 0.0006951580368584685, "loss": 2.509, "step": 22723 }, { "epoch": 0.61, "learning_rate": 0.0006950751416286181, "loss": 2.4145, "step": 22724 }, { "epoch": 0.61, "learning_rate": 0.000694992248708824, "loss": 2.5516, "step": 22725 }, { "epoch": 0.61, "learning_rate": 0.0006949093580997147, "loss": 2.1007, "step": 22726 }, { "epoch": 0.61, "learning_rate": 0.0006948264698019172, "loss": 2.2475, "step": 22727 }, { "epoch": 0.61, "learning_rate": 0.0006947435838160598, "loss": 2.161, "step": 22728 }, { "epoch": 0.61, "learning_rate": 0.0006946607001427703, "loss": 2.4073, "step": 22729 }, { "epoch": 0.61, "learning_rate": 0.0006945778187826767, "loss": 2.1664, "step": 22730 }, { "epoch": 0.61, "learning_rate": 0.0006944949397364072, "loss": 2.2601, "step": 22731 }, { "epoch": 0.61, "learning_rate": 0.0006944120630045891, "loss": 2.736, "step": 22732 }, { "epoch": 0.61, "learning_rate": 0.0006943291885878508, "loss": 2.5907, "step": 22733 }, { "epoch": 0.61, "learning_rate": 0.00069424631648682, "loss": 2.3071, "step": 22734 }, { "epoch": 0.61, "learning_rate": 0.0006941634467021243, "loss": 2.617, "step": 22735 }, { "epoch": 0.61, "learning_rate": 0.000694080579234392, "loss": 2.8232, "step": 22736 }, { "epoch": 0.61, "learning_rate": 0.00069399771408425, "loss": 2.344, "step": 22737 }, { "epoch": 0.61, "learning_rate": 0.0006939148512523267, "loss": 2.653, "step": 22738 }, { "epoch": 0.61, "learning_rate": 0.0006938319907392502, "loss": 2.7751, "step": 22739 }, { "epoch": 0.61, "learning_rate": 0.0006937491325456474, "loss": 2.8089, "step": 22740 }, { "epoch": 0.61, "learning_rate": 0.0006936662766721462, "loss": 2.6427, "step": 22741 }, { "epoch": 0.61, "learning_rate": 0.0006935834231193752, "loss": 2.3274, "step": 22742 }, { "epoch": 0.61, "learning_rate": 0.000693500571887961, "loss": 2.4519, "step": 22743 }, { "epoch": 0.61, "learning_rate": 0.0006934177229785316, "loss": 2.7956, "step": 22744 }, { "epoch": 0.61, "learning_rate": 0.000693334876391715, "loss": 3.0039, "step": 22745 }, { "epoch": 0.61, "learning_rate": 0.0006932520321281383, "loss": 2.8404, "step": 22746 }, { "epoch": 0.61, "learning_rate": 0.0006931691901884296, "loss": 2.5596, "step": 22747 }, { "epoch": 0.61, "learning_rate": 0.000693086350573216, "loss": 2.5071, "step": 22748 }, { "epoch": 0.61, "learning_rate": 0.0006930035132831254, "loss": 2.3233, "step": 22749 }, { "epoch": 0.61, "learning_rate": 0.0006929206783187853, "loss": 2.6192, "step": 22750 }, { "epoch": 0.61, "learning_rate": 0.0006928378456808233, "loss": 2.766, "step": 22751 }, { "epoch": 0.61, "learning_rate": 0.0006927550153698667, "loss": 2.7034, "step": 22752 }, { "epoch": 0.61, "learning_rate": 0.0006926721873865436, "loss": 2.7833, "step": 22753 }, { "epoch": 0.61, "learning_rate": 0.0006925893617314806, "loss": 1.9502, "step": 22754 }, { "epoch": 0.61, "learning_rate": 0.0006925065384053062, "loss": 2.265, "step": 22755 }, { "epoch": 0.61, "learning_rate": 0.0006924237174086468, "loss": 2.4147, "step": 22756 }, { "epoch": 0.61, "learning_rate": 0.0006923408987421301, "loss": 2.6172, "step": 22757 }, { "epoch": 0.61, "learning_rate": 0.0006922580824063844, "loss": 2.9103, "step": 22758 }, { "epoch": 0.61, "learning_rate": 0.0006921752684020361, "loss": 2.4464, "step": 22759 }, { "epoch": 0.61, "learning_rate": 0.0006920924567297129, "loss": 2.1287, "step": 22760 }, { "epoch": 0.61, "learning_rate": 0.0006920096473900423, "loss": 2.6213, "step": 22761 }, { "epoch": 0.61, "learning_rate": 0.0006919268403836514, "loss": 2.1547, "step": 22762 }, { "epoch": 0.61, "learning_rate": 0.0006918440357111679, "loss": 2.4011, "step": 22763 }, { "epoch": 0.61, "learning_rate": 0.0006917612333732188, "loss": 2.4433, "step": 22764 }, { "epoch": 0.61, "learning_rate": 0.0006916784333704314, "loss": 2.5232, "step": 22765 }, { "epoch": 0.61, "learning_rate": 0.0006915956357034332, "loss": 2.0825, "step": 22766 }, { "epoch": 0.61, "learning_rate": 0.0006915128403728512, "loss": 2.5566, "step": 22767 }, { "epoch": 0.61, "learning_rate": 0.0006914300473793128, "loss": 2.4109, "step": 22768 }, { "epoch": 0.61, "learning_rate": 0.0006913472567234456, "loss": 2.3215, "step": 22769 }, { "epoch": 0.61, "learning_rate": 0.0006912644684058756, "loss": 2.2163, "step": 22770 }, { "epoch": 0.61, "learning_rate": 0.0006911816824272317, "loss": 2.3876, "step": 22771 }, { "epoch": 0.61, "learning_rate": 0.0006910988987881395, "loss": 1.8121, "step": 22772 }, { "epoch": 0.61, "learning_rate": 0.0006910161174892269, "loss": 2.3538, "step": 22773 }, { "epoch": 0.61, "learning_rate": 0.0006909333385311211, "loss": 2.1611, "step": 22774 }, { "epoch": 0.61, "learning_rate": 0.0006908505619144489, "loss": 2.3084, "step": 22775 }, { "epoch": 0.61, "learning_rate": 0.0006907677876398377, "loss": 2.6661, "step": 22776 }, { "epoch": 0.61, "learning_rate": 0.0006906850157079145, "loss": 2.6348, "step": 22777 }, { "epoch": 0.61, "learning_rate": 0.0006906022461193063, "loss": 2.0411, "step": 22778 }, { "epoch": 0.61, "learning_rate": 0.00069051947887464, "loss": 2.379, "step": 22779 }, { "epoch": 0.61, "learning_rate": 0.0006904367139745431, "loss": 2.6632, "step": 22780 }, { "epoch": 0.61, "learning_rate": 0.0006903539514196421, "loss": 2.4216, "step": 22781 }, { "epoch": 0.61, "learning_rate": 0.0006902711912105646, "loss": 2.6479, "step": 22782 }, { "epoch": 0.61, "learning_rate": 0.0006901884333479364, "loss": 2.4405, "step": 22783 }, { "epoch": 0.61, "learning_rate": 0.0006901056778323857, "loss": 2.382, "step": 22784 }, { "epoch": 0.61, "learning_rate": 0.0006900229246645393, "loss": 2.5423, "step": 22785 }, { "epoch": 0.61, "learning_rate": 0.0006899401738450232, "loss": 2.3293, "step": 22786 }, { "epoch": 0.61, "learning_rate": 0.0006898574253744649, "loss": 1.9613, "step": 22787 }, { "epoch": 0.61, "learning_rate": 0.000689774679253492, "loss": 2.2535, "step": 22788 }, { "epoch": 0.61, "learning_rate": 0.0006896919354827301, "loss": 2.3416, "step": 22789 }, { "epoch": 0.61, "learning_rate": 0.0006896091940628068, "loss": 2.5924, "step": 22790 }, { "epoch": 0.61, "learning_rate": 0.0006895264549943487, "loss": 2.6708, "step": 22791 }, { "epoch": 0.61, "learning_rate": 0.0006894437182779826, "loss": 2.3925, "step": 22792 }, { "epoch": 0.61, "learning_rate": 0.0006893609839143355, "loss": 2.415, "step": 22793 }, { "epoch": 0.61, "learning_rate": 0.000689278251904034, "loss": 1.9698, "step": 22794 }, { "epoch": 0.61, "learning_rate": 0.0006891955222477049, "loss": 2.5342, "step": 22795 }, { "epoch": 0.61, "learning_rate": 0.000689112794945975, "loss": 1.7161, "step": 22796 }, { "epoch": 0.61, "learning_rate": 0.0006890300699994708, "loss": 2.2403, "step": 22797 }, { "epoch": 0.61, "learning_rate": 0.0006889473474088197, "loss": 2.0291, "step": 22798 }, { "epoch": 0.61, "learning_rate": 0.0006888646271746475, "loss": 2.3692, "step": 22799 }, { "epoch": 0.61, "learning_rate": 0.0006887819092975809, "loss": 2.2094, "step": 22800 }, { "epoch": 0.61, "learning_rate": 0.0006886991937782477, "loss": 2.3827, "step": 22801 }, { "epoch": 0.61, "learning_rate": 0.0006886164806172733, "loss": 2.49, "step": 22802 }, { "epoch": 0.61, "learning_rate": 0.0006885337698152847, "loss": 2.6678, "step": 22803 }, { "epoch": 0.61, "learning_rate": 0.0006884510613729087, "loss": 2.6829, "step": 22804 }, { "epoch": 0.61, "learning_rate": 0.0006883683552907718, "loss": 2.6472, "step": 22805 }, { "epoch": 0.61, "learning_rate": 0.0006882856515695005, "loss": 2.3864, "step": 22806 }, { "epoch": 0.61, "learning_rate": 0.0006882029502097213, "loss": 2.2786, "step": 22807 }, { "epoch": 0.61, "learning_rate": 0.0006881202512120608, "loss": 2.5118, "step": 22808 }, { "epoch": 0.61, "learning_rate": 0.0006880375545771457, "loss": 2.4294, "step": 22809 }, { "epoch": 0.61, "learning_rate": 0.0006879548603056021, "loss": 2.3169, "step": 22810 }, { "epoch": 0.61, "learning_rate": 0.0006878721683980566, "loss": 2.378, "step": 22811 }, { "epoch": 0.61, "learning_rate": 0.0006877894788551363, "loss": 2.1926, "step": 22812 }, { "epoch": 0.61, "learning_rate": 0.0006877067916774664, "loss": 2.5793, "step": 22813 }, { "epoch": 0.61, "learning_rate": 0.0006876241068656744, "loss": 2.1996, "step": 22814 }, { "epoch": 0.61, "learning_rate": 0.0006875414244203865, "loss": 2.223, "step": 22815 }, { "epoch": 0.61, "learning_rate": 0.0006874587443422285, "loss": 2.3941, "step": 22816 }, { "epoch": 0.61, "learning_rate": 0.0006873760666318275, "loss": 2.3653, "step": 22817 }, { "epoch": 0.61, "learning_rate": 0.0006872933912898093, "loss": 2.5265, "step": 22818 }, { "epoch": 0.61, "learning_rate": 0.0006872107183168004, "loss": 2.5235, "step": 22819 }, { "epoch": 0.61, "learning_rate": 0.0006871280477134275, "loss": 2.421, "step": 22820 }, { "epoch": 0.61, "learning_rate": 0.0006870453794803162, "loss": 2.5396, "step": 22821 }, { "epoch": 0.61, "learning_rate": 0.0006869627136180933, "loss": 2.586, "step": 22822 }, { "epoch": 0.61, "learning_rate": 0.0006868800501273851, "loss": 2.4744, "step": 22823 }, { "epoch": 0.61, "learning_rate": 0.0006867973890088173, "loss": 2.7694, "step": 22824 }, { "epoch": 0.61, "learning_rate": 0.000686714730263017, "loss": 2.4488, "step": 22825 }, { "epoch": 0.61, "learning_rate": 0.0006866320738906093, "loss": 2.7853, "step": 22826 }, { "epoch": 0.61, "learning_rate": 0.0006865494198922212, "loss": 2.4789, "step": 22827 }, { "epoch": 0.61, "learning_rate": 0.000686466768268479, "loss": 2.4267, "step": 22828 }, { "epoch": 0.61, "learning_rate": 0.0006863841190200082, "loss": 2.636, "step": 22829 }, { "epoch": 0.61, "learning_rate": 0.000686301472147435, "loss": 2.6451, "step": 22830 }, { "epoch": 0.61, "learning_rate": 0.0006862188276513863, "loss": 2.8124, "step": 22831 }, { "epoch": 0.61, "learning_rate": 0.0006861361855324873, "loss": 2.7835, "step": 22832 }, { "epoch": 0.61, "learning_rate": 0.0006860535457913648, "loss": 2.2969, "step": 22833 }, { "epoch": 0.61, "learning_rate": 0.0006859709084286441, "loss": 2.7477, "step": 22834 }, { "epoch": 0.61, "learning_rate": 0.0006858882734449516, "loss": 2.7127, "step": 22835 }, { "epoch": 0.61, "learning_rate": 0.0006858056408409139, "loss": 2.5914, "step": 22836 }, { "epoch": 0.61, "learning_rate": 0.000685723010617156, "loss": 2.2883, "step": 22837 }, { "epoch": 0.61, "learning_rate": 0.0006856403827743045, "loss": 2.3936, "step": 22838 }, { "epoch": 0.61, "learning_rate": 0.0006855577573129854, "loss": 2.7352, "step": 22839 }, { "epoch": 0.61, "learning_rate": 0.0006854751342338243, "loss": 2.7581, "step": 22840 }, { "epoch": 0.61, "learning_rate": 0.0006853925135374479, "loss": 2.3076, "step": 22841 }, { "epoch": 0.61, "learning_rate": 0.0006853098952244812, "loss": 2.3392, "step": 22842 }, { "epoch": 0.61, "learning_rate": 0.0006852272792955501, "loss": 2.6199, "step": 22843 }, { "epoch": 0.61, "learning_rate": 0.0006851446657512814, "loss": 2.3882, "step": 22844 }, { "epoch": 0.61, "learning_rate": 0.0006850620545923, "loss": 2.4313, "step": 22845 }, { "epoch": 0.61, "learning_rate": 0.0006849794458192324, "loss": 2.607, "step": 22846 }, { "epoch": 0.61, "learning_rate": 0.0006848968394327044, "loss": 2.5741, "step": 22847 }, { "epoch": 0.61, "learning_rate": 0.0006848142354333413, "loss": 2.3753, "step": 22848 }, { "epoch": 0.61, "learning_rate": 0.0006847316338217692, "loss": 2.6231, "step": 22849 }, { "epoch": 0.61, "learning_rate": 0.0006846490345986141, "loss": 1.999, "step": 22850 }, { "epoch": 0.61, "learning_rate": 0.0006845664377645014, "loss": 2.4125, "step": 22851 }, { "epoch": 0.61, "learning_rate": 0.000684483843320057, "loss": 2.4613, "step": 22852 }, { "epoch": 0.61, "learning_rate": 0.0006844012512659064, "loss": 2.5625, "step": 22853 }, { "epoch": 0.61, "learning_rate": 0.0006843186616026755, "loss": 2.0009, "step": 22854 }, { "epoch": 0.61, "learning_rate": 0.0006842360743309905, "loss": 2.4506, "step": 22855 }, { "epoch": 0.61, "learning_rate": 0.000684153489451476, "loss": 3.1237, "step": 22856 }, { "epoch": 0.61, "learning_rate": 0.0006840709069647582, "loss": 2.5411, "step": 22857 }, { "epoch": 0.61, "learning_rate": 0.0006839883268714632, "loss": 2.1336, "step": 22858 }, { "epoch": 0.61, "learning_rate": 0.0006839057491722159, "loss": 2.602, "step": 22859 }, { "epoch": 0.61, "learning_rate": 0.0006838231738676421, "loss": 2.1613, "step": 22860 }, { "epoch": 0.61, "learning_rate": 0.0006837406009583674, "loss": 2.3961, "step": 22861 }, { "epoch": 0.61, "learning_rate": 0.0006836580304450172, "loss": 2.4865, "step": 22862 }, { "epoch": 0.61, "learning_rate": 0.0006835754623282176, "loss": 2.6546, "step": 22863 }, { "epoch": 0.61, "learning_rate": 0.0006834928966085934, "loss": 2.6154, "step": 22864 }, { "epoch": 0.61, "learning_rate": 0.0006834103332867704, "loss": 2.3464, "step": 22865 }, { "epoch": 0.61, "learning_rate": 0.0006833277723633744, "loss": 2.6349, "step": 22866 }, { "epoch": 0.61, "learning_rate": 0.0006832452138390302, "loss": 2.6546, "step": 22867 }, { "epoch": 0.61, "learning_rate": 0.0006831626577143643, "loss": 2.2323, "step": 22868 }, { "epoch": 0.61, "learning_rate": 0.0006830801039900006, "loss": 2.9, "step": 22869 }, { "epoch": 0.61, "learning_rate": 0.0006829975526665657, "loss": 2.6122, "step": 22870 }, { "epoch": 0.61, "learning_rate": 0.0006829150037446852, "loss": 2.5452, "step": 22871 }, { "epoch": 0.61, "learning_rate": 0.0006828324572249833, "loss": 2.3176, "step": 22872 }, { "epoch": 0.61, "learning_rate": 0.0006827499131080859, "loss": 2.305, "step": 22873 }, { "epoch": 0.61, "learning_rate": 0.000682667371394619, "loss": 2.5089, "step": 22874 }, { "epoch": 0.61, "learning_rate": 0.000682584832085207, "loss": 2.5613, "step": 22875 }, { "epoch": 0.61, "learning_rate": 0.0006825022951804757, "loss": 2.4761, "step": 22876 }, { "epoch": 0.61, "learning_rate": 0.0006824197606810502, "loss": 2.4056, "step": 22877 }, { "epoch": 0.61, "learning_rate": 0.0006823372285875558, "loss": 2.141, "step": 22878 }, { "epoch": 0.61, "learning_rate": 0.0006822546989006178, "loss": 2.6298, "step": 22879 }, { "epoch": 0.61, "learning_rate": 0.0006821721716208613, "loss": 2.457, "step": 22880 }, { "epoch": 0.61, "learning_rate": 0.0006820896467489116, "loss": 2.1558, "step": 22881 }, { "epoch": 0.61, "learning_rate": 0.000682007124285394, "loss": 2.772, "step": 22882 }, { "epoch": 0.61, "learning_rate": 0.0006819246042309335, "loss": 2.8541, "step": 22883 }, { "epoch": 0.61, "learning_rate": 0.0006818420865861558, "loss": 2.5221, "step": 22884 }, { "epoch": 0.62, "learning_rate": 0.0006817595713516851, "loss": 2.6627, "step": 22885 }, { "epoch": 0.62, "learning_rate": 0.0006816770585281466, "loss": 2.9728, "step": 22886 }, { "epoch": 0.62, "learning_rate": 0.0006815945481161666, "loss": 2.3026, "step": 22887 }, { "epoch": 0.62, "learning_rate": 0.000681512040116369, "loss": 2.4696, "step": 22888 }, { "epoch": 0.62, "learning_rate": 0.0006814295345293791, "loss": 2.3484, "step": 22889 }, { "epoch": 0.62, "learning_rate": 0.0006813470313558224, "loss": 2.7848, "step": 22890 }, { "epoch": 0.62, "learning_rate": 0.0006812645305963234, "loss": 2.4528, "step": 22891 }, { "epoch": 0.62, "learning_rate": 0.0006811820322515072, "loss": 2.1492, "step": 22892 }, { "epoch": 0.62, "learning_rate": 0.0006810995363219994, "loss": 2.2814, "step": 22893 }, { "epoch": 0.62, "learning_rate": 0.0006810170428084241, "loss": 2.5987, "step": 22894 }, { "epoch": 0.62, "learning_rate": 0.0006809345517114068, "loss": 2.4749, "step": 22895 }, { "epoch": 0.62, "learning_rate": 0.0006808520630315722, "loss": 2.6243, "step": 22896 }, { "epoch": 0.62, "learning_rate": 0.0006807695767695453, "loss": 2.8807, "step": 22897 }, { "epoch": 0.62, "learning_rate": 0.0006806870929259515, "loss": 2.5403, "step": 22898 }, { "epoch": 0.62, "learning_rate": 0.0006806046115014144, "loss": 2.3413, "step": 22899 }, { "epoch": 0.62, "learning_rate": 0.0006805221324965601, "loss": 2.3146, "step": 22900 }, { "epoch": 0.62, "learning_rate": 0.0006804396559120132, "loss": 2.5859, "step": 22901 }, { "epoch": 0.62, "learning_rate": 0.000680357181748398, "loss": 2.4504, "step": 22902 }, { "epoch": 0.62, "learning_rate": 0.0006802747100063399, "loss": 2.6359, "step": 22903 }, { "epoch": 0.62, "learning_rate": 0.0006801922406864631, "loss": 2.6532, "step": 22904 }, { "epoch": 0.62, "learning_rate": 0.0006801097737893928, "loss": 2.5426, "step": 22905 }, { "epoch": 0.62, "learning_rate": 0.0006800273093157538, "loss": 2.2956, "step": 22906 }, { "epoch": 0.62, "learning_rate": 0.0006799448472661707, "loss": 2.2258, "step": 22907 }, { "epoch": 0.62, "learning_rate": 0.0006798623876412681, "loss": 2.6699, "step": 22908 }, { "epoch": 0.62, "learning_rate": 0.000679779930441671, "loss": 2.2707, "step": 22909 }, { "epoch": 0.62, "learning_rate": 0.0006796974756680036, "loss": 2.8049, "step": 22910 }, { "epoch": 0.62, "learning_rate": 0.0006796150233208913, "loss": 2.4548, "step": 22911 }, { "epoch": 0.62, "learning_rate": 0.0006795325734009578, "loss": 2.9209, "step": 22912 }, { "epoch": 0.62, "learning_rate": 0.0006794501259088283, "loss": 2.829, "step": 22913 }, { "epoch": 0.62, "learning_rate": 0.0006793676808451279, "loss": 2.5475, "step": 22914 }, { "epoch": 0.62, "learning_rate": 0.0006792852382104802, "loss": 2.4091, "step": 22915 }, { "epoch": 0.62, "learning_rate": 0.00067920279800551, "loss": 2.4527, "step": 22916 }, { "epoch": 0.62, "learning_rate": 0.0006791203602308424, "loss": 2.2936, "step": 22917 }, { "epoch": 0.62, "learning_rate": 0.0006790379248871014, "loss": 2.6961, "step": 22918 }, { "epoch": 0.62, "learning_rate": 0.000678955491974912, "loss": 2.3013, "step": 22919 }, { "epoch": 0.62, "learning_rate": 0.000678873061494898, "loss": 2.3893, "step": 22920 }, { "epoch": 0.62, "learning_rate": 0.0006787906334476844, "loss": 2.5919, "step": 22921 }, { "epoch": 0.62, "learning_rate": 0.0006787082078338957, "loss": 2.7569, "step": 22922 }, { "epoch": 0.62, "learning_rate": 0.000678625784654156, "loss": 2.9048, "step": 22923 }, { "epoch": 0.62, "learning_rate": 0.0006785433639090898, "loss": 2.5017, "step": 22924 }, { "epoch": 0.62, "learning_rate": 0.0006784609455993218, "loss": 2.4946, "step": 22925 }, { "epoch": 0.62, "learning_rate": 0.000678378529725476, "loss": 2.0904, "step": 22926 }, { "epoch": 0.62, "learning_rate": 0.0006782961162881771, "loss": 2.4433, "step": 22927 }, { "epoch": 0.62, "learning_rate": 0.0006782137052880494, "loss": 2.5106, "step": 22928 }, { "epoch": 0.62, "learning_rate": 0.0006781312967257169, "loss": 2.1251, "step": 22929 }, { "epoch": 0.62, "learning_rate": 0.0006780488906018046, "loss": 2.5767, "step": 22930 }, { "epoch": 0.62, "learning_rate": 0.0006779664869169359, "loss": 2.5343, "step": 22931 }, { "epoch": 0.62, "learning_rate": 0.0006778840856717355, "loss": 2.6005, "step": 22932 }, { "epoch": 0.62, "learning_rate": 0.0006778016868668281, "loss": 2.2853, "step": 22933 }, { "epoch": 0.62, "learning_rate": 0.0006777192905028371, "loss": 2.4841, "step": 22934 }, { "epoch": 0.62, "learning_rate": 0.0006776368965803872, "loss": 2.4844, "step": 22935 }, { "epoch": 0.62, "learning_rate": 0.0006775545051001028, "loss": 2.4505, "step": 22936 }, { "epoch": 0.62, "learning_rate": 0.0006774721160626076, "loss": 2.4522, "step": 22937 }, { "epoch": 0.62, "learning_rate": 0.0006773897294685261, "loss": 2.0702, "step": 22938 }, { "epoch": 0.62, "learning_rate": 0.0006773073453184822, "loss": 2.5371, "step": 22939 }, { "epoch": 0.62, "learning_rate": 0.0006772249636131, "loss": 2.4586, "step": 22940 }, { "epoch": 0.62, "learning_rate": 0.0006771425843530043, "loss": 2.2841, "step": 22941 }, { "epoch": 0.62, "learning_rate": 0.0006770602075388181, "loss": 2.6977, "step": 22942 }, { "epoch": 0.62, "learning_rate": 0.0006769778331711662, "loss": 3.2884, "step": 22943 }, { "epoch": 0.62, "learning_rate": 0.000676895461250673, "loss": 2.641, "step": 22944 }, { "epoch": 0.62, "learning_rate": 0.0006768130917779613, "loss": 2.6143, "step": 22945 }, { "epoch": 0.62, "learning_rate": 0.0006767307247536565, "loss": 2.591, "step": 22946 }, { "epoch": 0.62, "learning_rate": 0.0006766483601783813, "loss": 2.639, "step": 22947 }, { "epoch": 0.62, "learning_rate": 0.0006765659980527605, "loss": 2.346, "step": 22948 }, { "epoch": 0.62, "learning_rate": 0.0006764836383774182, "loss": 2.5188, "step": 22949 }, { "epoch": 0.62, "learning_rate": 0.0006764012811529776, "loss": 2.9679, "step": 22950 }, { "epoch": 0.62, "learning_rate": 0.0006763189263800631, "loss": 2.938, "step": 22951 }, { "epoch": 0.62, "learning_rate": 0.0006762365740592989, "loss": 2.3771, "step": 22952 }, { "epoch": 0.62, "learning_rate": 0.0006761542241913081, "loss": 2.5975, "step": 22953 }, { "epoch": 0.62, "learning_rate": 0.0006760718767767153, "loss": 2.293, "step": 22954 }, { "epoch": 0.62, "learning_rate": 0.0006759895318161437, "loss": 2.9106, "step": 22955 }, { "epoch": 0.62, "learning_rate": 0.0006759071893102178, "loss": 2.4379, "step": 22956 }, { "epoch": 0.62, "learning_rate": 0.0006758248492595613, "loss": 2.0008, "step": 22957 }, { "epoch": 0.62, "learning_rate": 0.0006757425116647971, "loss": 2.4964, "step": 22958 }, { "epoch": 0.62, "learning_rate": 0.00067566017652655, "loss": 2.3356, "step": 22959 }, { "epoch": 0.62, "learning_rate": 0.0006755778438454438, "loss": 2.3538, "step": 22960 }, { "epoch": 0.62, "learning_rate": 0.0006754955136221015, "loss": 2.8022, "step": 22961 }, { "epoch": 0.62, "learning_rate": 0.0006754131858571469, "loss": 2.3588, "step": 22962 }, { "epoch": 0.62, "learning_rate": 0.0006753308605512045, "loss": 2.7754, "step": 22963 }, { "epoch": 0.62, "learning_rate": 0.0006752485377048971, "loss": 2.6594, "step": 22964 }, { "epoch": 0.62, "learning_rate": 0.0006751662173188489, "loss": 2.8457, "step": 22965 }, { "epoch": 0.62, "learning_rate": 0.0006750838993936832, "loss": 2.4012, "step": 22966 }, { "epoch": 0.62, "learning_rate": 0.0006750015839300239, "loss": 2.6159, "step": 22967 }, { "epoch": 0.62, "learning_rate": 0.0006749192709284945, "loss": 2.5308, "step": 22968 }, { "epoch": 0.62, "learning_rate": 0.0006748369603897185, "loss": 2.1727, "step": 22969 }, { "epoch": 0.62, "learning_rate": 0.0006747546523143195, "loss": 2.5485, "step": 22970 }, { "epoch": 0.62, "learning_rate": 0.0006746723467029214, "loss": 2.7044, "step": 22971 }, { "epoch": 0.62, "learning_rate": 0.0006745900435561472, "loss": 2.5117, "step": 22972 }, { "epoch": 0.62, "learning_rate": 0.0006745077428746211, "loss": 2.2956, "step": 22973 }, { "epoch": 0.62, "learning_rate": 0.0006744254446589656, "loss": 2.2345, "step": 22974 }, { "epoch": 0.62, "learning_rate": 0.0006743431489098046, "loss": 2.6354, "step": 22975 }, { "epoch": 0.62, "learning_rate": 0.0006742608556277623, "loss": 2.551, "step": 22976 }, { "epoch": 0.62, "learning_rate": 0.0006741785648134611, "loss": 2.1605, "step": 22977 }, { "epoch": 0.62, "learning_rate": 0.0006740962764675248, "loss": 2.7441, "step": 22978 }, { "epoch": 0.62, "learning_rate": 0.0006740139905905771, "loss": 2.5338, "step": 22979 }, { "epoch": 0.62, "learning_rate": 0.0006739317071832409, "loss": 2.1921, "step": 22980 }, { "epoch": 0.62, "learning_rate": 0.0006738494262461401, "loss": 2.1152, "step": 22981 }, { "epoch": 0.62, "learning_rate": 0.0006737671477798973, "loss": 2.1693, "step": 22982 }, { "epoch": 0.62, "learning_rate": 0.0006736848717851365, "loss": 2.3697, "step": 22983 }, { "epoch": 0.62, "learning_rate": 0.0006736025982624808, "loss": 2.3057, "step": 22984 }, { "epoch": 0.62, "learning_rate": 0.0006735203272125534, "loss": 2.5964, "step": 22985 }, { "epoch": 0.62, "learning_rate": 0.0006734380586359775, "loss": 2.6622, "step": 22986 }, { "epoch": 0.62, "learning_rate": 0.0006733557925333771, "loss": 2.215, "step": 22987 }, { "epoch": 0.62, "learning_rate": 0.000673273528905374, "loss": 2.3454, "step": 22988 }, { "epoch": 0.62, "learning_rate": 0.0006731912677525928, "loss": 2.5966, "step": 22989 }, { "epoch": 0.62, "learning_rate": 0.000673109009075656, "loss": 2.1342, "step": 22990 }, { "epoch": 0.62, "learning_rate": 0.0006730267528751865, "loss": 2.1505, "step": 22991 }, { "epoch": 0.62, "learning_rate": 0.0006729444991518084, "loss": 2.7867, "step": 22992 }, { "epoch": 0.62, "learning_rate": 0.0006728622479061441, "loss": 1.9197, "step": 22993 }, { "epoch": 0.62, "learning_rate": 0.0006727799991388168, "loss": 2.7019, "step": 22994 }, { "epoch": 0.62, "learning_rate": 0.0006726977528504498, "loss": 2.3546, "step": 22995 }, { "epoch": 0.62, "learning_rate": 0.0006726155090416661, "loss": 2.5045, "step": 22996 }, { "epoch": 0.62, "learning_rate": 0.0006725332677130888, "loss": 2.5626, "step": 22997 }, { "epoch": 0.62, "learning_rate": 0.000672451028865341, "loss": 2.1517, "step": 22998 }, { "epoch": 0.62, "learning_rate": 0.0006723687924990456, "loss": 2.5477, "step": 22999 }, { "epoch": 0.62, "learning_rate": 0.0006722865586148259, "loss": 2.768, "step": 23000 }, { "epoch": 0.62, "learning_rate": 0.000672204327213304, "loss": 2.8555, "step": 23001 }, { "epoch": 0.62, "learning_rate": 0.0006721220982951039, "loss": 2.7015, "step": 23002 }, { "epoch": 0.62, "learning_rate": 0.0006720398718608485, "loss": 3.3176, "step": 23003 }, { "epoch": 0.62, "learning_rate": 0.0006719576479111599, "loss": 2.8218, "step": 23004 }, { "epoch": 0.62, "learning_rate": 0.0006718754264466613, "loss": 2.6485, "step": 23005 }, { "epoch": 0.62, "learning_rate": 0.0006717932074679766, "loss": 2.3473, "step": 23006 }, { "epoch": 0.62, "learning_rate": 0.0006717109909757273, "loss": 2.6122, "step": 23007 }, { "epoch": 0.62, "learning_rate": 0.0006716287769705371, "loss": 3.1999, "step": 23008 }, { "epoch": 0.62, "learning_rate": 0.0006715465654530283, "loss": 2.2558, "step": 23009 }, { "epoch": 0.62, "learning_rate": 0.0006714643564238241, "loss": 2.3467, "step": 23010 }, { "epoch": 0.62, "learning_rate": 0.0006713821498835475, "loss": 2.5709, "step": 23011 }, { "epoch": 0.62, "learning_rate": 0.0006712999458328206, "loss": 2.2377, "step": 23012 }, { "epoch": 0.62, "learning_rate": 0.0006712177442722665, "loss": 2.4379, "step": 23013 }, { "epoch": 0.62, "learning_rate": 0.0006711355452025083, "loss": 2.2799, "step": 23014 }, { "epoch": 0.62, "learning_rate": 0.0006710533486241683, "loss": 2.8682, "step": 23015 }, { "epoch": 0.62, "learning_rate": 0.0006709711545378696, "loss": 2.3392, "step": 23016 }, { "epoch": 0.62, "learning_rate": 0.0006708889629442342, "loss": 2.6259, "step": 23017 }, { "epoch": 0.62, "learning_rate": 0.000670806773843885, "loss": 2.4637, "step": 23018 }, { "epoch": 0.62, "learning_rate": 0.0006707245872374454, "loss": 2.8495, "step": 23019 }, { "epoch": 0.62, "learning_rate": 0.0006706424031255371, "loss": 1.8189, "step": 23020 }, { "epoch": 0.62, "learning_rate": 0.0006705602215087832, "loss": 2.6947, "step": 23021 }, { "epoch": 0.62, "learning_rate": 0.0006704780423878062, "loss": 2.3105, "step": 23022 }, { "epoch": 0.62, "learning_rate": 0.0006703958657632285, "loss": 2.3285, "step": 23023 }, { "epoch": 0.62, "learning_rate": 0.000670313691635673, "loss": 2.4245, "step": 23024 }, { "epoch": 0.62, "learning_rate": 0.0006702315200057617, "loss": 2.7779, "step": 23025 }, { "epoch": 0.62, "learning_rate": 0.0006701493508741175, "loss": 2.538, "step": 23026 }, { "epoch": 0.62, "learning_rate": 0.0006700671842413632, "loss": 2.6751, "step": 23027 }, { "epoch": 0.62, "learning_rate": 0.0006699850201081206, "loss": 2.5337, "step": 23028 }, { "epoch": 0.62, "learning_rate": 0.0006699028584750124, "loss": 2.4304, "step": 23029 }, { "epoch": 0.62, "learning_rate": 0.0006698206993426617, "loss": 2.7082, "step": 23030 }, { "epoch": 0.62, "learning_rate": 0.0006697385427116896, "loss": 2.8792, "step": 23031 }, { "epoch": 0.62, "learning_rate": 0.0006696563885827201, "loss": 2.4057, "step": 23032 }, { "epoch": 0.62, "learning_rate": 0.0006695742369563739, "loss": 2.1279, "step": 23033 }, { "epoch": 0.62, "learning_rate": 0.0006694920878332747, "loss": 1.9312, "step": 23034 }, { "epoch": 0.62, "learning_rate": 0.0006694099412140442, "loss": 2.6999, "step": 23035 }, { "epoch": 0.62, "learning_rate": 0.0006693277970993048, "loss": 2.6701, "step": 23036 }, { "epoch": 0.62, "learning_rate": 0.000669245655489679, "loss": 2.8027, "step": 23037 }, { "epoch": 0.62, "learning_rate": 0.000669163516385789, "loss": 2.702, "step": 23038 }, { "epoch": 0.62, "learning_rate": 0.000669081379788257, "loss": 2.1942, "step": 23039 }, { "epoch": 0.62, "learning_rate": 0.0006689992456977052, "loss": 2.5493, "step": 23040 }, { "epoch": 0.62, "learning_rate": 0.0006689171141147562, "loss": 2.3557, "step": 23041 }, { "epoch": 0.62, "learning_rate": 0.0006688349850400317, "loss": 2.5833, "step": 23042 }, { "epoch": 0.62, "learning_rate": 0.0006687528584741547, "loss": 2.4993, "step": 23043 }, { "epoch": 0.62, "learning_rate": 0.000668670734417746, "loss": 2.9007, "step": 23044 }, { "epoch": 0.62, "learning_rate": 0.0006685886128714289, "loss": 2.6565, "step": 23045 }, { "epoch": 0.62, "learning_rate": 0.0006685064938358257, "loss": 2.5537, "step": 23046 }, { "epoch": 0.62, "learning_rate": 0.0006684243773115575, "loss": 2.2978, "step": 23047 }, { "epoch": 0.62, "learning_rate": 0.0006683422632992466, "loss": 2.5372, "step": 23048 }, { "epoch": 0.62, "learning_rate": 0.0006682601517995163, "loss": 2.7077, "step": 23049 }, { "epoch": 0.62, "learning_rate": 0.0006681780428129873, "loss": 2.3215, "step": 23050 }, { "epoch": 0.62, "learning_rate": 0.0006680959363402822, "loss": 2.3004, "step": 23051 }, { "epoch": 0.62, "learning_rate": 0.0006680138323820229, "loss": 2.3827, "step": 23052 }, { "epoch": 0.62, "learning_rate": 0.0006679317309388314, "loss": 2.3343, "step": 23053 }, { "epoch": 0.62, "learning_rate": 0.0006678496320113299, "loss": 2.2267, "step": 23054 }, { "epoch": 0.62, "learning_rate": 0.0006677675356001401, "loss": 2.3131, "step": 23055 }, { "epoch": 0.62, "learning_rate": 0.000667685441705884, "loss": 2.8593, "step": 23056 }, { "epoch": 0.62, "learning_rate": 0.0006676033503291836, "loss": 2.5659, "step": 23057 }, { "epoch": 0.62, "learning_rate": 0.0006675212614706608, "loss": 2.889, "step": 23058 }, { "epoch": 0.62, "learning_rate": 0.0006674391751309379, "loss": 2.469, "step": 23059 }, { "epoch": 0.62, "learning_rate": 0.000667357091310636, "loss": 2.7102, "step": 23060 }, { "epoch": 0.62, "learning_rate": 0.0006672750100103768, "loss": 2.4989, "step": 23061 }, { "epoch": 0.62, "learning_rate": 0.0006671929312307835, "loss": 2.4264, "step": 23062 }, { "epoch": 0.62, "learning_rate": 0.0006671108549724766, "loss": 2.3305, "step": 23063 }, { "epoch": 0.62, "learning_rate": 0.0006670287812360784, "loss": 2.7984, "step": 23064 }, { "epoch": 0.62, "learning_rate": 0.0006669467100222106, "loss": 2.9893, "step": 23065 }, { "epoch": 0.62, "learning_rate": 0.000666864641331495, "loss": 2.338, "step": 23066 }, { "epoch": 0.62, "learning_rate": 0.0006667825751645536, "loss": 2.2847, "step": 23067 }, { "epoch": 0.62, "learning_rate": 0.0006667005115220074, "loss": 2.1108, "step": 23068 }, { "epoch": 0.62, "learning_rate": 0.0006666184504044786, "loss": 2.2123, "step": 23069 }, { "epoch": 0.62, "learning_rate": 0.0006665363918125891, "loss": 2.6617, "step": 23070 }, { "epoch": 0.62, "learning_rate": 0.00066645433574696, "loss": 2.8215, "step": 23071 }, { "epoch": 0.62, "learning_rate": 0.0006663722822082132, "loss": 2.4346, "step": 23072 }, { "epoch": 0.62, "learning_rate": 0.0006662902311969709, "loss": 2.3005, "step": 23073 }, { "epoch": 0.62, "learning_rate": 0.0006662081827138533, "loss": 2.5629, "step": 23074 }, { "epoch": 0.62, "learning_rate": 0.0006661261367594833, "loss": 2.5552, "step": 23075 }, { "epoch": 0.62, "learning_rate": 0.0006660440933344823, "loss": 2.6903, "step": 23076 }, { "epoch": 0.62, "learning_rate": 0.000665962052439471, "loss": 2.5256, "step": 23077 }, { "epoch": 0.62, "learning_rate": 0.0006658800140750718, "loss": 2.7798, "step": 23078 }, { "epoch": 0.62, "learning_rate": 0.0006657979782419056, "loss": 2.5075, "step": 23079 }, { "epoch": 0.62, "learning_rate": 0.0006657159449405943, "loss": 2.6511, "step": 23080 }, { "epoch": 0.62, "learning_rate": 0.0006656339141717593, "loss": 2.3132, "step": 23081 }, { "epoch": 0.62, "learning_rate": 0.0006655518859360219, "loss": 2.3154, "step": 23082 }, { "epoch": 0.62, "learning_rate": 0.0006654698602340036, "loss": 2.4124, "step": 23083 }, { "epoch": 0.62, "learning_rate": 0.000665387837066326, "loss": 2.7651, "step": 23084 }, { "epoch": 0.62, "learning_rate": 0.0006653058164336101, "loss": 2.8524, "step": 23085 }, { "epoch": 0.62, "learning_rate": 0.0006652237983364779, "loss": 2.4352, "step": 23086 }, { "epoch": 0.62, "learning_rate": 0.0006651417827755497, "loss": 2.2813, "step": 23087 }, { "epoch": 0.62, "learning_rate": 0.0006650597697514478, "loss": 2.6136, "step": 23088 }, { "epoch": 0.62, "learning_rate": 0.0006649777592647937, "loss": 2.6701, "step": 23089 }, { "epoch": 0.62, "learning_rate": 0.0006648957513162075, "loss": 2.2003, "step": 23090 }, { "epoch": 0.62, "learning_rate": 0.0006648137459063113, "loss": 2.4821, "step": 23091 }, { "epoch": 0.62, "learning_rate": 0.0006647317430357266, "loss": 2.3302, "step": 23092 }, { "epoch": 0.62, "learning_rate": 0.000664649742705074, "loss": 2.7622, "step": 23093 }, { "epoch": 0.62, "learning_rate": 0.0006645677449149751, "loss": 2.511, "step": 23094 }, { "epoch": 0.62, "learning_rate": 0.0006644857496660508, "loss": 2.4161, "step": 23095 }, { "epoch": 0.62, "learning_rate": 0.0006644037569589226, "loss": 2.5092, "step": 23096 }, { "epoch": 0.62, "learning_rate": 0.0006643217667942116, "loss": 2.4049, "step": 23097 }, { "epoch": 0.62, "learning_rate": 0.0006642397791725387, "loss": 2.1538, "step": 23098 }, { "epoch": 0.62, "learning_rate": 0.0006641577940945251, "loss": 2.6103, "step": 23099 }, { "epoch": 0.62, "learning_rate": 0.0006640758115607924, "loss": 2.3282, "step": 23100 }, { "epoch": 0.62, "learning_rate": 0.0006639938315719611, "loss": 2.6507, "step": 23101 }, { "epoch": 0.62, "learning_rate": 0.0006639118541286529, "loss": 2.6544, "step": 23102 }, { "epoch": 0.62, "learning_rate": 0.0006638298792314876, "loss": 2.4995, "step": 23103 }, { "epoch": 0.62, "learning_rate": 0.0006637479068810873, "loss": 2.6816, "step": 23104 }, { "epoch": 0.62, "learning_rate": 0.0006636659370780733, "loss": 2.3428, "step": 23105 }, { "epoch": 0.62, "learning_rate": 0.0006635839698230654, "loss": 2.3403, "step": 23106 }, { "epoch": 0.62, "learning_rate": 0.0006635020051166851, "loss": 2.7731, "step": 23107 }, { "epoch": 0.62, "learning_rate": 0.0006634200429595541, "loss": 2.173, "step": 23108 }, { "epoch": 0.62, "learning_rate": 0.0006633380833522922, "loss": 2.8322, "step": 23109 }, { "epoch": 0.62, "learning_rate": 0.0006632561262955208, "loss": 2.4432, "step": 23110 }, { "epoch": 0.62, "learning_rate": 0.0006631741717898611, "loss": 2.4467, "step": 23111 }, { "epoch": 0.62, "learning_rate": 0.0006630922198359333, "loss": 2.3427, "step": 23112 }, { "epoch": 0.62, "learning_rate": 0.0006630102704343589, "loss": 2.9226, "step": 23113 }, { "epoch": 0.62, "learning_rate": 0.0006629283235857581, "loss": 2.6049, "step": 23114 }, { "epoch": 0.62, "learning_rate": 0.0006628463792907523, "loss": 2.4165, "step": 23115 }, { "epoch": 0.62, "learning_rate": 0.0006627644375499622, "loss": 2.2631, "step": 23116 }, { "epoch": 0.62, "learning_rate": 0.0006626824983640081, "loss": 2.7309, "step": 23117 }, { "epoch": 0.62, "learning_rate": 0.0006626005617335111, "loss": 2.7086, "step": 23118 }, { "epoch": 0.62, "learning_rate": 0.0006625186276590924, "loss": 2.7085, "step": 23119 }, { "epoch": 0.62, "learning_rate": 0.0006624366961413716, "loss": 2.3159, "step": 23120 }, { "epoch": 0.62, "learning_rate": 0.0006623547671809706, "loss": 2.7015, "step": 23121 }, { "epoch": 0.62, "learning_rate": 0.0006622728407785092, "loss": 2.5472, "step": 23122 }, { "epoch": 0.62, "learning_rate": 0.0006621909169346083, "loss": 2.5142, "step": 23123 }, { "epoch": 0.62, "learning_rate": 0.0006621089956498889, "loss": 2.1044, "step": 23124 }, { "epoch": 0.62, "learning_rate": 0.0006620270769249711, "loss": 2.7683, "step": 23125 }, { "epoch": 0.62, "learning_rate": 0.0006619451607604758, "loss": 2.3999, "step": 23126 }, { "epoch": 0.62, "learning_rate": 0.0006618632471570236, "loss": 2.2422, "step": 23127 }, { "epoch": 0.62, "learning_rate": 0.000661781336115235, "loss": 2.4099, "step": 23128 }, { "epoch": 0.62, "learning_rate": 0.0006616994276357304, "loss": 2.4503, "step": 23129 }, { "epoch": 0.62, "learning_rate": 0.0006616175217191304, "loss": 2.4477, "step": 23130 }, { "epoch": 0.62, "learning_rate": 0.0006615356183660557, "loss": 2.4367, "step": 23131 }, { "epoch": 0.62, "learning_rate": 0.000661453717577127, "loss": 2.7189, "step": 23132 }, { "epoch": 0.62, "learning_rate": 0.0006613718193529636, "loss": 2.5232, "step": 23133 }, { "epoch": 0.62, "learning_rate": 0.0006612899236941871, "loss": 2.2186, "step": 23134 }, { "epoch": 0.62, "learning_rate": 0.0006612080306014181, "loss": 2.1778, "step": 23135 }, { "epoch": 0.62, "learning_rate": 0.000661126140075276, "loss": 2.6649, "step": 23136 }, { "epoch": 0.62, "learning_rate": 0.0006610442521163818, "loss": 2.7281, "step": 23137 }, { "epoch": 0.62, "learning_rate": 0.0006609623667253556, "loss": 2.1417, "step": 23138 }, { "epoch": 0.62, "learning_rate": 0.000660880483902818, "loss": 2.8511, "step": 23139 }, { "epoch": 0.62, "learning_rate": 0.0006607986036493891, "loss": 2.3451, "step": 23140 }, { "epoch": 0.62, "learning_rate": 0.0006607167259656895, "loss": 2.1074, "step": 23141 }, { "epoch": 0.62, "learning_rate": 0.0006606348508523392, "loss": 2.7873, "step": 23142 }, { "epoch": 0.62, "learning_rate": 0.0006605529783099588, "loss": 2.521, "step": 23143 }, { "epoch": 0.62, "learning_rate": 0.0006604711083391681, "loss": 2.2855, "step": 23144 }, { "epoch": 0.62, "learning_rate": 0.0006603892409405881, "loss": 2.6228, "step": 23145 }, { "epoch": 0.62, "learning_rate": 0.0006603073761148377, "loss": 3.1026, "step": 23146 }, { "epoch": 0.62, "learning_rate": 0.0006602255138625382, "loss": 2.4694, "step": 23147 }, { "epoch": 0.62, "learning_rate": 0.0006601436541843098, "loss": 2.0784, "step": 23148 }, { "epoch": 0.62, "learning_rate": 0.0006600617970807719, "loss": 2.5871, "step": 23149 }, { "epoch": 0.62, "learning_rate": 0.000659979942552545, "loss": 2.5531, "step": 23150 }, { "epoch": 0.62, "learning_rate": 0.0006598980906002499, "loss": 2.4248, "step": 23151 }, { "epoch": 0.62, "learning_rate": 0.0006598162412245055, "loss": 2.284, "step": 23152 }, { "epoch": 0.62, "learning_rate": 0.0006597343944259324, "loss": 2.2597, "step": 23153 }, { "epoch": 0.62, "learning_rate": 0.0006596525502051509, "loss": 2.5637, "step": 23154 }, { "epoch": 0.62, "learning_rate": 0.0006595707085627808, "loss": 2.093, "step": 23155 }, { "epoch": 0.62, "learning_rate": 0.0006594888694994423, "loss": 1.956, "step": 23156 }, { "epoch": 0.62, "learning_rate": 0.0006594070330157549, "loss": 2.2071, "step": 23157 }, { "epoch": 0.62, "learning_rate": 0.000659325199112339, "loss": 2.5212, "step": 23158 }, { "epoch": 0.62, "learning_rate": 0.0006592433677898148, "loss": 2.0731, "step": 23159 }, { "epoch": 0.62, "learning_rate": 0.0006591615390488016, "loss": 2.5697, "step": 23160 }, { "epoch": 0.62, "learning_rate": 0.0006590797128899198, "loss": 2.7738, "step": 23161 }, { "epoch": 0.62, "learning_rate": 0.0006589978893137893, "loss": 2.0945, "step": 23162 }, { "epoch": 0.62, "learning_rate": 0.0006589160683210293, "loss": 2.3991, "step": 23163 }, { "epoch": 0.62, "learning_rate": 0.0006588342499122608, "loss": 2.2775, "step": 23164 }, { "epoch": 0.62, "learning_rate": 0.0006587524340881028, "loss": 2.5014, "step": 23165 }, { "epoch": 0.62, "learning_rate": 0.0006586706208491752, "loss": 3.3204, "step": 23166 }, { "epoch": 0.62, "learning_rate": 0.0006585888101960981, "loss": 2.7972, "step": 23167 }, { "epoch": 0.62, "learning_rate": 0.000658507002129491, "loss": 2.1953, "step": 23168 }, { "epoch": 0.62, "learning_rate": 0.0006584251966499738, "loss": 2.7599, "step": 23169 }, { "epoch": 0.62, "learning_rate": 0.0006583433937581664, "loss": 2.4467, "step": 23170 }, { "epoch": 0.62, "learning_rate": 0.0006582615934546883, "loss": 2.3427, "step": 23171 }, { "epoch": 0.62, "learning_rate": 0.0006581797957401594, "loss": 2.531, "step": 23172 }, { "epoch": 0.62, "learning_rate": 0.0006580980006151989, "loss": 2.561, "step": 23173 }, { "epoch": 0.62, "learning_rate": 0.0006580162080804271, "loss": 2.8022, "step": 23174 }, { "epoch": 0.62, "learning_rate": 0.0006579344181364636, "loss": 2.3584, "step": 23175 }, { "epoch": 0.62, "learning_rate": 0.0006578526307839272, "loss": 2.8694, "step": 23176 }, { "epoch": 0.62, "learning_rate": 0.0006577708460234383, "loss": 2.4339, "step": 23177 }, { "epoch": 0.62, "learning_rate": 0.0006576890638556168, "loss": 2.8916, "step": 23178 }, { "epoch": 0.62, "learning_rate": 0.0006576072842810811, "loss": 2.5509, "step": 23179 }, { "epoch": 0.62, "learning_rate": 0.0006575255073004518, "loss": 2.6849, "step": 23180 }, { "epoch": 0.62, "learning_rate": 0.0006574437329143478, "loss": 2.4419, "step": 23181 }, { "epoch": 0.62, "learning_rate": 0.0006573619611233887, "loss": 2.8963, "step": 23182 }, { "epoch": 0.62, "learning_rate": 0.0006572801919281946, "loss": 2.4287, "step": 23183 }, { "epoch": 0.62, "learning_rate": 0.0006571984253293841, "loss": 2.6965, "step": 23184 }, { "epoch": 0.62, "learning_rate": 0.0006571166613275769, "loss": 2.5157, "step": 23185 }, { "epoch": 0.62, "learning_rate": 0.0006570348999233931, "loss": 2.223, "step": 23186 }, { "epoch": 0.62, "learning_rate": 0.0006569531411174512, "loss": 2.0895, "step": 23187 }, { "epoch": 0.62, "learning_rate": 0.000656871384910371, "loss": 2.5921, "step": 23188 }, { "epoch": 0.62, "learning_rate": 0.0006567896313027722, "loss": 2.5641, "step": 23189 }, { "epoch": 0.62, "learning_rate": 0.0006567078802952733, "loss": 2.5192, "step": 23190 }, { "epoch": 0.62, "learning_rate": 0.0006566261318884947, "loss": 2.663, "step": 23191 }, { "epoch": 0.62, "learning_rate": 0.0006565443860830546, "loss": 2.3358, "step": 23192 }, { "epoch": 0.62, "learning_rate": 0.0006564626428795728, "loss": 2.1828, "step": 23193 }, { "epoch": 0.62, "learning_rate": 0.0006563809022786691, "loss": 2.212, "step": 23194 }, { "epoch": 0.62, "learning_rate": 0.0006562991642809619, "loss": 2.3001, "step": 23195 }, { "epoch": 0.62, "learning_rate": 0.0006562174288870708, "loss": 2.6721, "step": 23196 }, { "epoch": 0.62, "learning_rate": 0.0006561356960976151, "loss": 2.7167, "step": 23197 }, { "epoch": 0.62, "learning_rate": 0.0006560539659132138, "loss": 2.8056, "step": 23198 }, { "epoch": 0.62, "learning_rate": 0.0006559722383344863, "loss": 2.2638, "step": 23199 }, { "epoch": 0.62, "learning_rate": 0.0006558905133620514, "loss": 2.4658, "step": 23200 }, { "epoch": 0.62, "learning_rate": 0.0006558087909965285, "loss": 2.5274, "step": 23201 }, { "epoch": 0.62, "learning_rate": 0.0006557270712385368, "loss": 2.3533, "step": 23202 }, { "epoch": 0.62, "learning_rate": 0.000655645354088695, "loss": 2.5478, "step": 23203 }, { "epoch": 0.62, "learning_rate": 0.0006555636395476225, "loss": 2.5341, "step": 23204 }, { "epoch": 0.62, "learning_rate": 0.0006554819276159388, "loss": 2.4164, "step": 23205 }, { "epoch": 0.62, "learning_rate": 0.0006554002182942618, "loss": 2.3296, "step": 23206 }, { "epoch": 0.62, "learning_rate": 0.0006553185115832117, "loss": 2.4581, "step": 23207 }, { "epoch": 0.62, "learning_rate": 0.0006552368074834064, "loss": 2.5193, "step": 23208 }, { "epoch": 0.62, "learning_rate": 0.0006551551059954655, "loss": 2.8593, "step": 23209 }, { "epoch": 0.62, "learning_rate": 0.0006550734071200082, "loss": 2.958, "step": 23210 }, { "epoch": 0.62, "learning_rate": 0.0006549917108576526, "loss": 2.4076, "step": 23211 }, { "epoch": 0.62, "learning_rate": 0.0006549100172090184, "loss": 2.6383, "step": 23212 }, { "epoch": 0.62, "learning_rate": 0.0006548283261747244, "loss": 2.7946, "step": 23213 }, { "epoch": 0.62, "learning_rate": 0.0006547466377553889, "loss": 2.3358, "step": 23214 }, { "epoch": 0.62, "learning_rate": 0.0006546649519516315, "loss": 2.3179, "step": 23215 }, { "epoch": 0.62, "learning_rate": 0.0006545832687640704, "loss": 2.5909, "step": 23216 }, { "epoch": 0.62, "learning_rate": 0.0006545015881933247, "loss": 2.728, "step": 23217 }, { "epoch": 0.62, "learning_rate": 0.0006544199102400137, "loss": 2.525, "step": 23218 }, { "epoch": 0.62, "learning_rate": 0.0006543382349047549, "loss": 2.4936, "step": 23219 }, { "epoch": 0.62, "learning_rate": 0.0006542565621881682, "loss": 2.5398, "step": 23220 }, { "epoch": 0.62, "learning_rate": 0.0006541748920908723, "loss": 1.7063, "step": 23221 }, { "epoch": 0.62, "learning_rate": 0.0006540932246134852, "loss": 2.815, "step": 23222 }, { "epoch": 0.62, "learning_rate": 0.0006540115597566257, "loss": 2.71, "step": 23223 }, { "epoch": 0.62, "learning_rate": 0.0006539298975209136, "loss": 2.2679, "step": 23224 }, { "epoch": 0.62, "learning_rate": 0.0006538482379069661, "loss": 2.3243, "step": 23225 }, { "epoch": 0.62, "learning_rate": 0.0006537665809154028, "loss": 2.6456, "step": 23226 }, { "epoch": 0.62, "learning_rate": 0.0006536849265468416, "loss": 2.607, "step": 23227 }, { "epoch": 0.62, "learning_rate": 0.0006536032748019016, "loss": 2.4864, "step": 23228 }, { "epoch": 0.62, "learning_rate": 0.0006535216256812015, "loss": 2.6162, "step": 23229 }, { "epoch": 0.62, "learning_rate": 0.0006534399791853593, "loss": 2.8718, "step": 23230 }, { "epoch": 0.62, "learning_rate": 0.0006533583353149941, "loss": 2.5736, "step": 23231 }, { "epoch": 0.62, "learning_rate": 0.0006532766940707242, "loss": 2.3164, "step": 23232 }, { "epoch": 0.62, "learning_rate": 0.0006531950554531679, "loss": 2.7475, "step": 23233 }, { "epoch": 0.62, "learning_rate": 0.0006531134194629442, "loss": 2.6324, "step": 23234 }, { "epoch": 0.62, "learning_rate": 0.000653031786100671, "loss": 2.5193, "step": 23235 }, { "epoch": 0.62, "learning_rate": 0.0006529501553669666, "loss": 2.3018, "step": 23236 }, { "epoch": 0.62, "learning_rate": 0.0006528685272624504, "loss": 1.9009, "step": 23237 }, { "epoch": 0.62, "learning_rate": 0.0006527869017877397, "loss": 2.3745, "step": 23238 }, { "epoch": 0.62, "learning_rate": 0.0006527052789434536, "loss": 1.9268, "step": 23239 }, { "epoch": 0.62, "learning_rate": 0.0006526236587302101, "loss": 2.5624, "step": 23240 }, { "epoch": 0.62, "learning_rate": 0.0006525420411486276, "loss": 2.5356, "step": 23241 }, { "epoch": 0.62, "learning_rate": 0.0006524604261993247, "loss": 2.5767, "step": 23242 }, { "epoch": 0.62, "learning_rate": 0.0006523788138829193, "loss": 2.6111, "step": 23243 }, { "epoch": 0.62, "learning_rate": 0.00065229720420003, "loss": 2.4466, "step": 23244 }, { "epoch": 0.62, "learning_rate": 0.0006522155971512748, "loss": 2.2261, "step": 23245 }, { "epoch": 0.62, "learning_rate": 0.000652133992737272, "loss": 2.5351, "step": 23246 }, { "epoch": 0.62, "learning_rate": 0.0006520523909586398, "loss": 2.4805, "step": 23247 }, { "epoch": 0.62, "learning_rate": 0.000651970791815997, "loss": 2.7988, "step": 23248 }, { "epoch": 0.62, "learning_rate": 0.0006518891953099606, "loss": 2.5394, "step": 23249 }, { "epoch": 0.62, "learning_rate": 0.00065180760144115, "loss": 2.1835, "step": 23250 }, { "epoch": 0.62, "learning_rate": 0.0006517260102101826, "loss": 2.8821, "step": 23251 }, { "epoch": 0.62, "learning_rate": 0.0006516444216176764, "loss": 2.4128, "step": 23252 }, { "epoch": 0.62, "learning_rate": 0.00065156283566425, "loss": 2.5957, "step": 23253 }, { "epoch": 0.62, "learning_rate": 0.0006514812523505211, "loss": 2.5977, "step": 23254 }, { "epoch": 0.62, "learning_rate": 0.000651399671677108, "loss": 2.6065, "step": 23255 }, { "epoch": 0.62, "learning_rate": 0.0006513180936446288, "loss": 2.8426, "step": 23256 }, { "epoch": 0.63, "learning_rate": 0.0006512365182537012, "loss": 2.3892, "step": 23257 }, { "epoch": 0.63, "learning_rate": 0.0006511549455049433, "loss": 2.5622, "step": 23258 }, { "epoch": 0.63, "learning_rate": 0.0006510733753989735, "loss": 2.5423, "step": 23259 }, { "epoch": 0.63, "learning_rate": 0.0006509918079364091, "loss": 2.4885, "step": 23260 }, { "epoch": 0.63, "learning_rate": 0.0006509102431178686, "loss": 2.4412, "step": 23261 }, { "epoch": 0.63, "learning_rate": 0.0006508286809439696, "loss": 2.5065, "step": 23262 }, { "epoch": 0.63, "learning_rate": 0.00065074712141533, "loss": 2.7185, "step": 23263 }, { "epoch": 0.63, "learning_rate": 0.0006506655645325681, "loss": 2.4195, "step": 23264 }, { "epoch": 0.63, "learning_rate": 0.000650584010296301, "loss": 1.9603, "step": 23265 }, { "epoch": 0.63, "learning_rate": 0.0006505024587071471, "loss": 2.3778, "step": 23266 }, { "epoch": 0.63, "learning_rate": 0.0006504209097657243, "loss": 2.72, "step": 23267 }, { "epoch": 0.63, "learning_rate": 0.00065033936347265, "loss": 2.8265, "step": 23268 }, { "epoch": 0.63, "learning_rate": 0.0006502578198285424, "loss": 2.4301, "step": 23269 }, { "epoch": 0.63, "learning_rate": 0.0006501762788340186, "loss": 2.4671, "step": 23270 }, { "epoch": 0.63, "learning_rate": 0.000650094740489697, "loss": 2.7534, "step": 23271 }, { "epoch": 0.63, "learning_rate": 0.0006500132047961952, "loss": 2.2238, "step": 23272 }, { "epoch": 0.63, "learning_rate": 0.0006499316717541306, "loss": 2.075, "step": 23273 }, { "epoch": 0.63, "learning_rate": 0.0006498501413641211, "loss": 2.7354, "step": 23274 }, { "epoch": 0.63, "learning_rate": 0.0006497686136267844, "loss": 2.8552, "step": 23275 }, { "epoch": 0.63, "learning_rate": 0.000649687088542738, "loss": 2.5585, "step": 23276 }, { "epoch": 0.63, "learning_rate": 0.0006496055661125999, "loss": 2.7383, "step": 23277 }, { "epoch": 0.63, "learning_rate": 0.0006495240463369869, "loss": 2.4015, "step": 23278 }, { "epoch": 0.63, "learning_rate": 0.0006494425292165171, "loss": 2.1005, "step": 23279 }, { "epoch": 0.63, "learning_rate": 0.0006493610147518085, "loss": 2.2039, "step": 23280 }, { "epoch": 0.63, "learning_rate": 0.0006492795029434779, "loss": 2.5447, "step": 23281 }, { "epoch": 0.63, "learning_rate": 0.0006491979937921428, "loss": 2.7204, "step": 23282 }, { "epoch": 0.63, "learning_rate": 0.0006491164872984214, "loss": 2.4129, "step": 23283 }, { "epoch": 0.63, "learning_rate": 0.0006490349834629305, "loss": 2.6167, "step": 23284 }, { "epoch": 0.63, "learning_rate": 0.0006489534822862881, "loss": 2.6449, "step": 23285 }, { "epoch": 0.63, "learning_rate": 0.0006488719837691111, "loss": 2.5674, "step": 23286 }, { "epoch": 0.63, "learning_rate": 0.0006487904879120172, "loss": 2.0974, "step": 23287 }, { "epoch": 0.63, "learning_rate": 0.0006487089947156239, "loss": 2.3461, "step": 23288 }, { "epoch": 0.63, "learning_rate": 0.0006486275041805483, "loss": 2.6383, "step": 23289 }, { "epoch": 0.63, "learning_rate": 0.000648546016307408, "loss": 2.8636, "step": 23290 }, { "epoch": 0.63, "learning_rate": 0.0006484645310968202, "loss": 2.658, "step": 23291 }, { "epoch": 0.63, "learning_rate": 0.0006483830485494022, "loss": 2.1688, "step": 23292 }, { "epoch": 0.63, "learning_rate": 0.0006483015686657718, "loss": 2.3818, "step": 23293 }, { "epoch": 0.63, "learning_rate": 0.0006482200914465453, "loss": 2.2597, "step": 23294 }, { "epoch": 0.63, "learning_rate": 0.0006481386168923404, "loss": 2.4171, "step": 23295 }, { "epoch": 0.63, "learning_rate": 0.0006480571450037751, "loss": 2.4593, "step": 23296 }, { "epoch": 0.63, "learning_rate": 0.0006479756757814655, "loss": 3.0279, "step": 23297 }, { "epoch": 0.63, "learning_rate": 0.0006478942092260292, "loss": 2.5164, "step": 23298 }, { "epoch": 0.63, "learning_rate": 0.0006478127453380837, "loss": 2.5835, "step": 23299 }, { "epoch": 0.63, "learning_rate": 0.0006477312841182456, "loss": 1.9784, "step": 23300 }, { "epoch": 0.63, "learning_rate": 0.0006476498255671323, "loss": 2.2514, "step": 23301 }, { "epoch": 0.63, "learning_rate": 0.0006475683696853612, "loss": 2.7369, "step": 23302 }, { "epoch": 0.63, "learning_rate": 0.0006474869164735488, "loss": 2.6914, "step": 23303 }, { "epoch": 0.63, "learning_rate": 0.0006474054659323128, "loss": 2.4823, "step": 23304 }, { "epoch": 0.63, "learning_rate": 0.0006473240180622697, "loss": 2.2462, "step": 23305 }, { "epoch": 0.63, "learning_rate": 0.0006472425728640367, "loss": 2.1683, "step": 23306 }, { "epoch": 0.63, "learning_rate": 0.0006471611303382316, "loss": 2.7882, "step": 23307 }, { "epoch": 0.63, "learning_rate": 0.0006470796904854699, "loss": 2.753, "step": 23308 }, { "epoch": 0.63, "learning_rate": 0.0006469982533063696, "loss": 2.7389, "step": 23309 }, { "epoch": 0.63, "learning_rate": 0.0006469168188015477, "loss": 2.4001, "step": 23310 }, { "epoch": 0.63, "learning_rate": 0.0006468353869716206, "loss": 2.7789, "step": 23311 }, { "epoch": 0.63, "learning_rate": 0.0006467539578172056, "loss": 2.6547, "step": 23312 }, { "epoch": 0.63, "learning_rate": 0.0006466725313389192, "loss": 2.6221, "step": 23313 }, { "epoch": 0.63, "learning_rate": 0.0006465911075373787, "loss": 2.6024, "step": 23314 }, { "epoch": 0.63, "learning_rate": 0.000646509686413201, "loss": 2.2189, "step": 23315 }, { "epoch": 0.63, "learning_rate": 0.0006464282679670024, "loss": 2.4766, "step": 23316 }, { "epoch": 0.63, "learning_rate": 0.0006463468521994, "loss": 2.6088, "step": 23317 }, { "epoch": 0.63, "learning_rate": 0.0006462654391110108, "loss": 2.2212, "step": 23318 }, { "epoch": 0.63, "learning_rate": 0.0006461840287024513, "loss": 1.9606, "step": 23319 }, { "epoch": 0.63, "learning_rate": 0.0006461026209743389, "loss": 2.343, "step": 23320 }, { "epoch": 0.63, "learning_rate": 0.0006460212159272888, "loss": 2.9239, "step": 23321 }, { "epoch": 0.63, "learning_rate": 0.000645939813561919, "loss": 2.0823, "step": 23322 }, { "epoch": 0.63, "learning_rate": 0.0006458584138788464, "loss": 2.6972, "step": 23323 }, { "epoch": 0.63, "learning_rate": 0.0006457770168786868, "loss": 2.4871, "step": 23324 }, { "epoch": 0.63, "learning_rate": 0.0006456956225620568, "loss": 2.3863, "step": 23325 }, { "epoch": 0.63, "learning_rate": 0.000645614230929574, "loss": 2.6305, "step": 23326 }, { "epoch": 0.63, "learning_rate": 0.0006455328419818541, "loss": 2.5836, "step": 23327 }, { "epoch": 0.63, "learning_rate": 0.0006454514557195142, "loss": 2.378, "step": 23328 }, { "epoch": 0.63, "learning_rate": 0.0006453700721431706, "loss": 2.33, "step": 23329 }, { "epoch": 0.63, "learning_rate": 0.0006452886912534398, "loss": 2.9139, "step": 23330 }, { "epoch": 0.63, "learning_rate": 0.0006452073130509388, "loss": 2.5306, "step": 23331 }, { "epoch": 0.63, "learning_rate": 0.0006451259375362835, "loss": 2.4834, "step": 23332 }, { "epoch": 0.63, "learning_rate": 0.0006450445647100904, "loss": 2.7463, "step": 23333 }, { "epoch": 0.63, "learning_rate": 0.0006449631945729768, "loss": 2.7834, "step": 23334 }, { "epoch": 0.63, "learning_rate": 0.0006448818271255581, "loss": 2.4842, "step": 23335 }, { "epoch": 0.63, "learning_rate": 0.0006448004623684513, "loss": 1.9778, "step": 23336 }, { "epoch": 0.63, "learning_rate": 0.0006447191003022732, "loss": 2.9494, "step": 23337 }, { "epoch": 0.63, "learning_rate": 0.0006446377409276389, "loss": 2.3346, "step": 23338 }, { "epoch": 0.63, "learning_rate": 0.0006445563842451663, "loss": 2.0044, "step": 23339 }, { "epoch": 0.63, "learning_rate": 0.0006444750302554704, "loss": 2.5678, "step": 23340 }, { "epoch": 0.63, "learning_rate": 0.0006443936789591682, "loss": 2.7728, "step": 23341 }, { "epoch": 0.63, "learning_rate": 0.000644312330356876, "loss": 2.4487, "step": 23342 }, { "epoch": 0.63, "learning_rate": 0.0006442309844492101, "loss": 2.3302, "step": 23343 }, { "epoch": 0.63, "learning_rate": 0.0006441496412367864, "loss": 2.2891, "step": 23344 }, { "epoch": 0.63, "learning_rate": 0.0006440683007202216, "loss": 2.7716, "step": 23345 }, { "epoch": 0.63, "learning_rate": 0.0006439869629001316, "loss": 2.8864, "step": 23346 }, { "epoch": 0.63, "learning_rate": 0.0006439056277771329, "loss": 2.8614, "step": 23347 }, { "epoch": 0.63, "learning_rate": 0.0006438242953518413, "loss": 2.6735, "step": 23348 }, { "epoch": 0.63, "learning_rate": 0.0006437429656248732, "loss": 2.571, "step": 23349 }, { "epoch": 0.63, "learning_rate": 0.000643661638596845, "loss": 2.5583, "step": 23350 }, { "epoch": 0.63, "learning_rate": 0.000643580314268372, "loss": 2.3775, "step": 23351 }, { "epoch": 0.63, "learning_rate": 0.000643498992640071, "loss": 2.459, "step": 23352 }, { "epoch": 0.63, "learning_rate": 0.0006434176737125584, "loss": 2.2385, "step": 23353 }, { "epoch": 0.63, "learning_rate": 0.0006433363574864491, "loss": 2.836, "step": 23354 }, { "epoch": 0.63, "learning_rate": 0.0006432550439623601, "loss": 2.266, "step": 23355 }, { "epoch": 0.63, "learning_rate": 0.000643173733140907, "loss": 2.2923, "step": 23356 }, { "epoch": 0.63, "learning_rate": 0.0006430924250227058, "loss": 2.7428, "step": 23357 }, { "epoch": 0.63, "learning_rate": 0.0006430111196083728, "loss": 2.5614, "step": 23358 }, { "epoch": 0.63, "learning_rate": 0.0006429298168985236, "loss": 2.354, "step": 23359 }, { "epoch": 0.63, "learning_rate": 0.0006428485168937742, "loss": 2.4502, "step": 23360 }, { "epoch": 0.63, "learning_rate": 0.0006427672195947409, "loss": 2.3909, "step": 23361 }, { "epoch": 0.63, "learning_rate": 0.0006426859250020389, "loss": 2.5574, "step": 23362 }, { "epoch": 0.63, "learning_rate": 0.000642604633116285, "loss": 2.7408, "step": 23363 }, { "epoch": 0.63, "learning_rate": 0.0006425233439380937, "loss": 2.6255, "step": 23364 }, { "epoch": 0.63, "learning_rate": 0.0006424420574680821, "loss": 2.1417, "step": 23365 }, { "epoch": 0.63, "learning_rate": 0.0006423607737068657, "loss": 2.2119, "step": 23366 }, { "epoch": 0.63, "learning_rate": 0.0006422794926550599, "loss": 2.3951, "step": 23367 }, { "epoch": 0.63, "learning_rate": 0.0006421982143132805, "loss": 2.597, "step": 23368 }, { "epoch": 0.63, "learning_rate": 0.000642116938682144, "loss": 2.599, "step": 23369 }, { "epoch": 0.63, "learning_rate": 0.0006420356657622652, "loss": 2.4555, "step": 23370 }, { "epoch": 0.63, "learning_rate": 0.0006419543955542603, "loss": 2.0949, "step": 23371 }, { "epoch": 0.63, "learning_rate": 0.000641873128058745, "loss": 2.6354, "step": 23372 }, { "epoch": 0.63, "learning_rate": 0.0006417918632763347, "loss": 2.6447, "step": 23373 }, { "epoch": 0.63, "learning_rate": 0.0006417106012076453, "loss": 2.4353, "step": 23374 }, { "epoch": 0.63, "learning_rate": 0.0006416293418532921, "loss": 2.2391, "step": 23375 }, { "epoch": 0.63, "learning_rate": 0.0006415480852138911, "loss": 2.4515, "step": 23376 }, { "epoch": 0.63, "learning_rate": 0.0006414668312900578, "loss": 2.4032, "step": 23377 }, { "epoch": 0.63, "learning_rate": 0.0006413855800824075, "loss": 2.3455, "step": 23378 }, { "epoch": 0.63, "learning_rate": 0.0006413043315915561, "loss": 2.3925, "step": 23379 }, { "epoch": 0.63, "learning_rate": 0.0006412230858181191, "loss": 2.238, "step": 23380 }, { "epoch": 0.63, "learning_rate": 0.0006411418427627114, "loss": 2.3749, "step": 23381 }, { "epoch": 0.63, "learning_rate": 0.0006410606024259496, "loss": 2.506, "step": 23382 }, { "epoch": 0.63, "learning_rate": 0.000640979364808448, "loss": 2.216, "step": 23383 }, { "epoch": 0.63, "learning_rate": 0.0006408981299108225, "loss": 2.4304, "step": 23384 }, { "epoch": 0.63, "learning_rate": 0.0006408168977336888, "loss": 2.2195, "step": 23385 }, { "epoch": 0.63, "learning_rate": 0.000640735668277662, "loss": 2.345, "step": 23386 }, { "epoch": 0.63, "learning_rate": 0.0006406544415433574, "loss": 2.4515, "step": 23387 }, { "epoch": 0.63, "learning_rate": 0.0006405732175313908, "loss": 2.2326, "step": 23388 }, { "epoch": 0.63, "learning_rate": 0.000640491996242377, "loss": 2.4257, "step": 23389 }, { "epoch": 0.63, "learning_rate": 0.0006404107776769316, "loss": 2.7679, "step": 23390 }, { "epoch": 0.63, "learning_rate": 0.0006403295618356699, "loss": 2.5534, "step": 23391 }, { "epoch": 0.63, "learning_rate": 0.000640248348719207, "loss": 2.5503, "step": 23392 }, { "epoch": 0.63, "learning_rate": 0.0006401671383281589, "loss": 2.3152, "step": 23393 }, { "epoch": 0.63, "learning_rate": 0.0006400859306631394, "loss": 2.4902, "step": 23394 }, { "epoch": 0.63, "learning_rate": 0.0006400047257247648, "loss": 3.1793, "step": 23395 }, { "epoch": 0.63, "learning_rate": 0.0006399235235136504, "loss": 2.5966, "step": 23396 }, { "epoch": 0.63, "learning_rate": 0.0006398423240304107, "loss": 2.5081, "step": 23397 }, { "epoch": 0.63, "learning_rate": 0.0006397611272756613, "loss": 2.5023, "step": 23398 }, { "epoch": 0.63, "learning_rate": 0.0006396799332500172, "loss": 2.3303, "step": 23399 }, { "epoch": 0.63, "learning_rate": 0.0006395987419540932, "loss": 2.5861, "step": 23400 }, { "epoch": 0.63, "learning_rate": 0.0006395175533885051, "loss": 1.9866, "step": 23401 }, { "epoch": 0.63, "learning_rate": 0.0006394363675538673, "loss": 2.3915, "step": 23402 }, { "epoch": 0.63, "learning_rate": 0.000639355184450795, "loss": 2.4172, "step": 23403 }, { "epoch": 0.63, "learning_rate": 0.0006392740040799036, "loss": 2.3705, "step": 23404 }, { "epoch": 0.63, "learning_rate": 0.0006391928264418079, "loss": 2.6711, "step": 23405 }, { "epoch": 0.63, "learning_rate": 0.0006391116515371226, "loss": 2.5474, "step": 23406 }, { "epoch": 0.63, "learning_rate": 0.0006390304793664631, "loss": 2.3703, "step": 23407 }, { "epoch": 0.63, "learning_rate": 0.000638949309930444, "loss": 2.3947, "step": 23408 }, { "epoch": 0.63, "learning_rate": 0.0006388681432296808, "loss": 2.1978, "step": 23409 }, { "epoch": 0.63, "learning_rate": 0.0006387869792647876, "loss": 2.838, "step": 23410 }, { "epoch": 0.63, "learning_rate": 0.0006387058180363793, "loss": 2.0297, "step": 23411 }, { "epoch": 0.63, "learning_rate": 0.000638624659545072, "loss": 2.3352, "step": 23412 }, { "epoch": 0.63, "learning_rate": 0.0006385435037914791, "loss": 2.7923, "step": 23413 }, { "epoch": 0.63, "learning_rate": 0.000638462350776216, "loss": 2.9086, "step": 23414 }, { "epoch": 0.63, "learning_rate": 0.0006383812004998978, "loss": 2.6066, "step": 23415 }, { "epoch": 0.63, "learning_rate": 0.0006383000529631386, "loss": 2.7168, "step": 23416 }, { "epoch": 0.63, "learning_rate": 0.000638218908166554, "loss": 2.9363, "step": 23417 }, { "epoch": 0.63, "learning_rate": 0.0006381377661107579, "loss": 2.4215, "step": 23418 }, { "epoch": 0.63, "learning_rate": 0.0006380566267963654, "loss": 2.5307, "step": 23419 }, { "epoch": 0.63, "learning_rate": 0.0006379754902239913, "loss": 2.2889, "step": 23420 }, { "epoch": 0.63, "learning_rate": 0.0006378943563942501, "loss": 2.9468, "step": 23421 }, { "epoch": 0.63, "learning_rate": 0.0006378132253077564, "loss": 2.3553, "step": 23422 }, { "epoch": 0.63, "learning_rate": 0.0006377320969651255, "loss": 2.3229, "step": 23423 }, { "epoch": 0.63, "learning_rate": 0.0006376509713669707, "loss": 2.4759, "step": 23424 }, { "epoch": 0.63, "learning_rate": 0.0006375698485139081, "loss": 2.5339, "step": 23425 }, { "epoch": 0.63, "learning_rate": 0.000637488728406551, "loss": 2.5561, "step": 23426 }, { "epoch": 0.63, "learning_rate": 0.0006374076110455143, "loss": 2.5544, "step": 23427 }, { "epoch": 0.63, "learning_rate": 0.0006373264964314134, "loss": 2.403, "step": 23428 }, { "epoch": 0.63, "learning_rate": 0.0006372453845648617, "loss": 2.6134, "step": 23429 }, { "epoch": 0.63, "learning_rate": 0.0006371642754464742, "loss": 2.4679, "step": 23430 }, { "epoch": 0.63, "learning_rate": 0.0006370831690768652, "loss": 2.2855, "step": 23431 }, { "epoch": 0.63, "learning_rate": 0.0006370020654566493, "loss": 2.6036, "step": 23432 }, { "epoch": 0.63, "learning_rate": 0.0006369209645864409, "loss": 2.1125, "step": 23433 }, { "epoch": 0.63, "learning_rate": 0.0006368398664668543, "loss": 2.5067, "step": 23434 }, { "epoch": 0.63, "learning_rate": 0.0006367587710985038, "loss": 2.9659, "step": 23435 }, { "epoch": 0.63, "learning_rate": 0.0006366776784820042, "loss": 2.0757, "step": 23436 }, { "epoch": 0.63, "learning_rate": 0.0006365965886179693, "loss": 2.846, "step": 23437 }, { "epoch": 0.63, "learning_rate": 0.0006365155015070137, "loss": 2.5148, "step": 23438 }, { "epoch": 0.63, "learning_rate": 0.000636434417149752, "loss": 2.6831, "step": 23439 }, { "epoch": 0.63, "learning_rate": 0.0006363533355467977, "loss": 2.271, "step": 23440 }, { "epoch": 0.63, "learning_rate": 0.000636272256698766, "loss": 2.1992, "step": 23441 }, { "epoch": 0.63, "learning_rate": 0.0006361911806062703, "loss": 2.6386, "step": 23442 }, { "epoch": 0.63, "learning_rate": 0.0006361101072699252, "loss": 3.0703, "step": 23443 }, { "epoch": 0.63, "learning_rate": 0.0006360290366903451, "loss": 2.8756, "step": 23444 }, { "epoch": 0.63, "learning_rate": 0.0006359479688681437, "loss": 2.6016, "step": 23445 }, { "epoch": 0.63, "learning_rate": 0.0006358669038039354, "loss": 2.6579, "step": 23446 }, { "epoch": 0.63, "learning_rate": 0.0006357858414983344, "loss": 2.314, "step": 23447 }, { "epoch": 0.63, "learning_rate": 0.0006357047819519547, "loss": 2.1831, "step": 23448 }, { "epoch": 0.63, "learning_rate": 0.0006356237251654104, "loss": 2.6945, "step": 23449 }, { "epoch": 0.63, "learning_rate": 0.000635542671139316, "loss": 2.281, "step": 23450 }, { "epoch": 0.63, "learning_rate": 0.0006354616198742846, "loss": 2.3074, "step": 23451 }, { "epoch": 0.63, "learning_rate": 0.0006353805713709315, "loss": 2.4812, "step": 23452 }, { "epoch": 0.63, "learning_rate": 0.0006352995256298693, "loss": 2.4696, "step": 23453 }, { "epoch": 0.63, "learning_rate": 0.0006352184826517129, "loss": 2.1448, "step": 23454 }, { "epoch": 0.63, "learning_rate": 0.0006351374424370764, "loss": 2.2608, "step": 23455 }, { "epoch": 0.63, "learning_rate": 0.000635056404986573, "loss": 2.6628, "step": 23456 }, { "epoch": 0.63, "learning_rate": 0.000634975370300817, "loss": 2.7068, "step": 23457 }, { "epoch": 0.63, "learning_rate": 0.0006348943383804227, "loss": 2.2186, "step": 23458 }, { "epoch": 0.63, "learning_rate": 0.0006348133092260033, "loss": 2.4762, "step": 23459 }, { "epoch": 0.63, "learning_rate": 0.0006347322828381733, "loss": 2.159, "step": 23460 }, { "epoch": 0.63, "learning_rate": 0.0006346512592175459, "loss": 2.2242, "step": 23461 }, { "epoch": 0.63, "learning_rate": 0.0006345702383647354, "loss": 3.0696, "step": 23462 }, { "epoch": 0.63, "learning_rate": 0.0006344892202803554, "loss": 2.5556, "step": 23463 }, { "epoch": 0.63, "learning_rate": 0.0006344082049650197, "loss": 2.6605, "step": 23464 }, { "epoch": 0.63, "learning_rate": 0.0006343271924193419, "loss": 2.509, "step": 23465 }, { "epoch": 0.63, "learning_rate": 0.0006342461826439363, "loss": 2.8039, "step": 23466 }, { "epoch": 0.63, "learning_rate": 0.000634165175639416, "loss": 2.5834, "step": 23467 }, { "epoch": 0.63, "learning_rate": 0.0006340841714063952, "loss": 2.5994, "step": 23468 }, { "epoch": 0.63, "learning_rate": 0.000634003169945487, "loss": 2.8737, "step": 23469 }, { "epoch": 0.63, "learning_rate": 0.0006339221712573051, "loss": 2.9963, "step": 23470 }, { "epoch": 0.63, "learning_rate": 0.000633841175342464, "loss": 2.411, "step": 23471 }, { "epoch": 0.63, "learning_rate": 0.0006337601822015763, "loss": 2.5475, "step": 23472 }, { "epoch": 0.63, "learning_rate": 0.0006336791918352561, "loss": 2.5716, "step": 23473 }, { "epoch": 0.63, "learning_rate": 0.0006335982042441168, "loss": 2.7067, "step": 23474 }, { "epoch": 0.63, "learning_rate": 0.0006335172194287719, "loss": 3.101, "step": 23475 }, { "epoch": 0.63, "learning_rate": 0.0006334362373898354, "loss": 2.5146, "step": 23476 }, { "epoch": 0.63, "learning_rate": 0.00063335525812792, "loss": 2.3443, "step": 23477 }, { "epoch": 0.63, "learning_rate": 0.0006332742816436398, "loss": 2.406, "step": 23478 }, { "epoch": 0.63, "learning_rate": 0.0006331933079376082, "loss": 2.5707, "step": 23479 }, { "epoch": 0.63, "learning_rate": 0.0006331123370104382, "loss": 2.0773, "step": 23480 }, { "epoch": 0.63, "learning_rate": 0.0006330313688627437, "loss": 2.6646, "step": 23481 }, { "epoch": 0.63, "learning_rate": 0.0006329504034951383, "loss": 2.4106, "step": 23482 }, { "epoch": 0.63, "learning_rate": 0.0006328694409082344, "loss": 2.6724, "step": 23483 }, { "epoch": 0.63, "learning_rate": 0.0006327884811026462, "loss": 2.3458, "step": 23484 }, { "epoch": 0.63, "learning_rate": 0.0006327075240789873, "loss": 2.6062, "step": 23485 }, { "epoch": 0.63, "learning_rate": 0.0006326265698378699, "loss": 2.3849, "step": 23486 }, { "epoch": 0.63, "learning_rate": 0.0006325456183799084, "loss": 2.9733, "step": 23487 }, { "epoch": 0.63, "learning_rate": 0.0006324646697057152, "loss": 2.5458, "step": 23488 }, { "epoch": 0.63, "learning_rate": 0.000632383723815904, "loss": 2.7759, "step": 23489 }, { "epoch": 0.63, "learning_rate": 0.0006323027807110882, "loss": 2.5626, "step": 23490 }, { "epoch": 0.63, "learning_rate": 0.0006322218403918804, "loss": 2.3743, "step": 23491 }, { "epoch": 0.63, "learning_rate": 0.0006321409028588944, "loss": 2.3371, "step": 23492 }, { "epoch": 0.63, "learning_rate": 0.0006320599681127434, "loss": 2.1991, "step": 23493 }, { "epoch": 0.63, "learning_rate": 0.0006319790361540401, "loss": 2.589, "step": 23494 }, { "epoch": 0.63, "learning_rate": 0.0006318981069833983, "loss": 2.6392, "step": 23495 }, { "epoch": 0.63, "learning_rate": 0.0006318171806014297, "loss": 2.0221, "step": 23496 }, { "epoch": 0.63, "learning_rate": 0.0006317362570087487, "loss": 2.4558, "step": 23497 }, { "epoch": 0.63, "learning_rate": 0.0006316553362059685, "loss": 2.6399, "step": 23498 }, { "epoch": 0.63, "learning_rate": 0.000631574418193701, "loss": 2.0988, "step": 23499 }, { "epoch": 0.63, "learning_rate": 0.0006314935029725597, "loss": 2.4041, "step": 23500 }, { "epoch": 0.63, "learning_rate": 0.0006314125905431585, "loss": 2.1159, "step": 23501 }, { "epoch": 0.63, "learning_rate": 0.000631331680906109, "loss": 2.4876, "step": 23502 }, { "epoch": 0.63, "learning_rate": 0.0006312507740620251, "loss": 2.4791, "step": 23503 }, { "epoch": 0.63, "learning_rate": 0.0006311698700115191, "loss": 2.498, "step": 23504 }, { "epoch": 0.63, "learning_rate": 0.0006310889687552043, "loss": 2.5251, "step": 23505 }, { "epoch": 0.63, "learning_rate": 0.0006310080702936938, "loss": 3.1344, "step": 23506 }, { "epoch": 0.63, "learning_rate": 0.0006309271746276, "loss": 3.1714, "step": 23507 }, { "epoch": 0.63, "learning_rate": 0.0006308462817575358, "loss": 2.3519, "step": 23508 }, { "epoch": 0.63, "learning_rate": 0.0006307653916841143, "loss": 2.5114, "step": 23509 }, { "epoch": 0.63, "learning_rate": 0.0006306845044079481, "loss": 2.3736, "step": 23510 }, { "epoch": 0.63, "learning_rate": 0.0006306036199296506, "loss": 2.4942, "step": 23511 }, { "epoch": 0.63, "learning_rate": 0.0006305227382498334, "loss": 2.8343, "step": 23512 }, { "epoch": 0.63, "learning_rate": 0.0006304418593691098, "loss": 2.4585, "step": 23513 }, { "epoch": 0.63, "learning_rate": 0.0006303609832880933, "loss": 2.8476, "step": 23514 }, { "epoch": 0.63, "learning_rate": 0.0006302801100073952, "loss": 2.7711, "step": 23515 }, { "epoch": 0.63, "learning_rate": 0.0006301992395276292, "loss": 2.4631, "step": 23516 }, { "epoch": 0.63, "learning_rate": 0.0006301183718494076, "loss": 2.5393, "step": 23517 }, { "epoch": 0.63, "learning_rate": 0.000630037506973343, "loss": 2.4057, "step": 23518 }, { "epoch": 0.63, "learning_rate": 0.0006299566449000483, "loss": 2.2735, "step": 23519 }, { "epoch": 0.63, "learning_rate": 0.0006298757856301358, "loss": 2.6635, "step": 23520 }, { "epoch": 0.63, "learning_rate": 0.0006297949291642181, "loss": 2.4546, "step": 23521 }, { "epoch": 0.63, "learning_rate": 0.000629714075502908, "loss": 2.5031, "step": 23522 }, { "epoch": 0.63, "learning_rate": 0.0006296332246468177, "loss": 2.8281, "step": 23523 }, { "epoch": 0.63, "learning_rate": 0.0006295523765965598, "loss": 2.2924, "step": 23524 }, { "epoch": 0.63, "learning_rate": 0.0006294715313527473, "loss": 2.4876, "step": 23525 }, { "epoch": 0.63, "learning_rate": 0.0006293906889159917, "loss": 1.9429, "step": 23526 }, { "epoch": 0.63, "learning_rate": 0.0006293098492869062, "loss": 2.2125, "step": 23527 }, { "epoch": 0.63, "learning_rate": 0.0006292290124661033, "loss": 2.3719, "step": 23528 }, { "epoch": 0.63, "learning_rate": 0.0006291481784541948, "loss": 2.4937, "step": 23529 }, { "epoch": 0.63, "learning_rate": 0.0006290673472517936, "loss": 2.6044, "step": 23530 }, { "epoch": 0.63, "learning_rate": 0.0006289865188595117, "loss": 2.589, "step": 23531 }, { "epoch": 0.63, "learning_rate": 0.0006289056932779613, "loss": 2.6493, "step": 23532 }, { "epoch": 0.63, "learning_rate": 0.0006288248705077554, "loss": 2.4772, "step": 23533 }, { "epoch": 0.63, "learning_rate": 0.0006287440505495059, "loss": 2.4547, "step": 23534 }, { "epoch": 0.63, "learning_rate": 0.0006286632334038249, "loss": 2.8782, "step": 23535 }, { "epoch": 0.63, "learning_rate": 0.0006285824190713252, "loss": 2.947, "step": 23536 }, { "epoch": 0.63, "learning_rate": 0.0006285016075526184, "loss": 3.025, "step": 23537 }, { "epoch": 0.63, "learning_rate": 0.0006284207988483174, "loss": 2.9743, "step": 23538 }, { "epoch": 0.63, "learning_rate": 0.0006283399929590335, "loss": 2.2177, "step": 23539 }, { "epoch": 0.63, "learning_rate": 0.0006282591898853794, "loss": 2.7482, "step": 23540 }, { "epoch": 0.63, "learning_rate": 0.0006281783896279677, "loss": 2.6254, "step": 23541 }, { "epoch": 0.63, "learning_rate": 0.0006280975921874096, "loss": 2.584, "step": 23542 }, { "epoch": 0.63, "learning_rate": 0.0006280167975643176, "loss": 2.4276, "step": 23543 }, { "epoch": 0.63, "learning_rate": 0.0006279360057593042, "loss": 1.92, "step": 23544 }, { "epoch": 0.63, "learning_rate": 0.0006278552167729808, "loss": 1.8561, "step": 23545 }, { "epoch": 0.63, "learning_rate": 0.0006277744306059601, "loss": 2.4231, "step": 23546 }, { "epoch": 0.63, "learning_rate": 0.0006276936472588533, "loss": 2.5627, "step": 23547 }, { "epoch": 0.63, "learning_rate": 0.0006276128667322731, "loss": 2.8257, "step": 23548 }, { "epoch": 0.63, "learning_rate": 0.0006275320890268312, "loss": 2.8113, "step": 23549 }, { "epoch": 0.63, "learning_rate": 0.0006274513141431397, "loss": 2.3937, "step": 23550 }, { "epoch": 0.63, "learning_rate": 0.0006273705420818102, "loss": 2.6816, "step": 23551 }, { "epoch": 0.63, "learning_rate": 0.0006272897728434552, "loss": 2.0491, "step": 23552 }, { "epoch": 0.63, "learning_rate": 0.0006272090064286859, "loss": 2.4182, "step": 23553 }, { "epoch": 0.63, "learning_rate": 0.0006271282428381151, "loss": 2.519, "step": 23554 }, { "epoch": 0.63, "learning_rate": 0.0006270474820723535, "loss": 2.8061, "step": 23555 }, { "epoch": 0.63, "learning_rate": 0.0006269667241320134, "loss": 2.6917, "step": 23556 }, { "epoch": 0.63, "learning_rate": 0.0006268859690177073, "loss": 2.5441, "step": 23557 }, { "epoch": 0.63, "learning_rate": 0.0006268052167300459, "loss": 2.3916, "step": 23558 }, { "epoch": 0.63, "learning_rate": 0.0006267244672696417, "loss": 2.4458, "step": 23559 }, { "epoch": 0.63, "learning_rate": 0.0006266437206371062, "loss": 2.2129, "step": 23560 }, { "epoch": 0.63, "learning_rate": 0.000626562976833051, "loss": 2.3697, "step": 23561 }, { "epoch": 0.63, "learning_rate": 0.0006264822358580878, "loss": 2.5462, "step": 23562 }, { "epoch": 0.63, "learning_rate": 0.0006264014977128287, "loss": 2.4571, "step": 23563 }, { "epoch": 0.63, "learning_rate": 0.0006263207623978848, "loss": 2.7468, "step": 23564 }, { "epoch": 0.63, "learning_rate": 0.0006262400299138682, "loss": 2.5271, "step": 23565 }, { "epoch": 0.63, "learning_rate": 0.0006261593002613901, "loss": 2.7633, "step": 23566 }, { "epoch": 0.63, "learning_rate": 0.0006260785734410625, "loss": 2.1226, "step": 23567 }, { "epoch": 0.63, "learning_rate": 0.000625997849453497, "loss": 2.6025, "step": 23568 }, { "epoch": 0.63, "learning_rate": 0.0006259171282993044, "loss": 2.4681, "step": 23569 }, { "epoch": 0.63, "learning_rate": 0.0006258364099790967, "loss": 2.4207, "step": 23570 }, { "epoch": 0.63, "learning_rate": 0.0006257556944934861, "loss": 1.8217, "step": 23571 }, { "epoch": 0.63, "learning_rate": 0.0006256749818430832, "loss": 2.9386, "step": 23572 }, { "epoch": 0.63, "learning_rate": 0.0006255942720284997, "loss": 2.4194, "step": 23573 }, { "epoch": 0.63, "learning_rate": 0.0006255135650503469, "loss": 2.614, "step": 23574 }, { "epoch": 0.63, "learning_rate": 0.0006254328609092364, "loss": 2.4068, "step": 23575 }, { "epoch": 0.63, "learning_rate": 0.0006253521596057796, "loss": 2.7765, "step": 23576 }, { "epoch": 0.63, "learning_rate": 0.0006252714611405879, "loss": 2.7228, "step": 23577 }, { "epoch": 0.63, "learning_rate": 0.0006251907655142726, "loss": 2.5072, "step": 23578 }, { "epoch": 0.63, "learning_rate": 0.0006251100727274452, "loss": 2.5264, "step": 23579 }, { "epoch": 0.63, "learning_rate": 0.0006250293827807166, "loss": 2.4856, "step": 23580 }, { "epoch": 0.63, "learning_rate": 0.0006249486956746988, "loss": 2.7634, "step": 23581 }, { "epoch": 0.63, "learning_rate": 0.0006248680114100021, "loss": 2.8138, "step": 23582 }, { "epoch": 0.63, "learning_rate": 0.0006247873299872383, "loss": 2.4297, "step": 23583 }, { "epoch": 0.63, "learning_rate": 0.0006247066514070191, "loss": 2.3934, "step": 23584 }, { "epoch": 0.63, "learning_rate": 0.0006246259756699548, "loss": 2.6984, "step": 23585 }, { "epoch": 0.63, "learning_rate": 0.0006245453027766569, "loss": 2.4994, "step": 23586 }, { "epoch": 0.63, "learning_rate": 0.0006244646327277372, "loss": 2.4846, "step": 23587 }, { "epoch": 0.63, "learning_rate": 0.0006243839655238058, "loss": 2.4961, "step": 23588 }, { "epoch": 0.63, "learning_rate": 0.0006243033011654746, "loss": 2.4493, "step": 23589 }, { "epoch": 0.63, "learning_rate": 0.0006242226396533544, "loss": 2.3661, "step": 23590 }, { "epoch": 0.63, "learning_rate": 0.000624141980988056, "loss": 2.5293, "step": 23591 }, { "epoch": 0.63, "learning_rate": 0.0006240613251701912, "loss": 2.3882, "step": 23592 }, { "epoch": 0.63, "learning_rate": 0.0006239806722003702, "loss": 2.5703, "step": 23593 }, { "epoch": 0.63, "learning_rate": 0.0006239000220792045, "loss": 2.7802, "step": 23594 }, { "epoch": 0.63, "learning_rate": 0.0006238193748073052, "loss": 2.6692, "step": 23595 }, { "epoch": 0.63, "learning_rate": 0.0006237387303852828, "loss": 2.3982, "step": 23596 }, { "epoch": 0.63, "learning_rate": 0.0006236580888137485, "loss": 1.9848, "step": 23597 }, { "epoch": 0.63, "learning_rate": 0.0006235774500933136, "loss": 2.0114, "step": 23598 }, { "epoch": 0.63, "learning_rate": 0.0006234968142245882, "loss": 2.8441, "step": 23599 }, { "epoch": 0.63, "learning_rate": 0.0006234161812081842, "loss": 2.4594, "step": 23600 }, { "epoch": 0.63, "learning_rate": 0.0006233355510447114, "loss": 2.5308, "step": 23601 }, { "epoch": 0.63, "learning_rate": 0.0006232549237347809, "loss": 2.3556, "step": 23602 }, { "epoch": 0.63, "learning_rate": 0.0006231742992790044, "loss": 2.3674, "step": 23603 }, { "epoch": 0.63, "learning_rate": 0.0006230936776779917, "loss": 2.5096, "step": 23604 }, { "epoch": 0.63, "learning_rate": 0.0006230130589323538, "loss": 2.5831, "step": 23605 }, { "epoch": 0.63, "learning_rate": 0.0006229324430427019, "loss": 2.4831, "step": 23606 }, { "epoch": 0.63, "learning_rate": 0.0006228518300096461, "loss": 2.7171, "step": 23607 }, { "epoch": 0.63, "learning_rate": 0.0006227712198337976, "loss": 2.584, "step": 23608 }, { "epoch": 0.63, "learning_rate": 0.0006226906125157668, "loss": 2.2032, "step": 23609 }, { "epoch": 0.63, "learning_rate": 0.0006226100080561644, "loss": 2.5117, "step": 23610 }, { "epoch": 0.63, "learning_rate": 0.0006225294064556011, "loss": 2.3111, "step": 23611 }, { "epoch": 0.63, "learning_rate": 0.0006224488077146875, "loss": 2.8165, "step": 23612 }, { "epoch": 0.63, "learning_rate": 0.0006223682118340344, "loss": 2.5328, "step": 23613 }, { "epoch": 0.63, "learning_rate": 0.0006222876188142523, "loss": 2.5387, "step": 23614 }, { "epoch": 0.63, "learning_rate": 0.0006222070286559514, "loss": 2.4601, "step": 23615 }, { "epoch": 0.63, "learning_rate": 0.0006221264413597429, "loss": 2.4685, "step": 23616 }, { "epoch": 0.63, "learning_rate": 0.0006220458569262365, "loss": 2.2884, "step": 23617 }, { "epoch": 0.63, "learning_rate": 0.0006219652753560432, "loss": 2.5947, "step": 23618 }, { "epoch": 0.63, "learning_rate": 0.0006218846966497735, "loss": 2.7054, "step": 23619 }, { "epoch": 0.63, "learning_rate": 0.0006218041208080376, "loss": 2.6402, "step": 23620 }, { "epoch": 0.63, "learning_rate": 0.0006217235478314461, "loss": 2.1187, "step": 23621 }, { "epoch": 0.63, "learning_rate": 0.0006216429777206096, "loss": 2.7129, "step": 23622 }, { "epoch": 0.63, "learning_rate": 0.000621562410476138, "loss": 2.3187, "step": 23623 }, { "epoch": 0.63, "learning_rate": 0.0006214818460986421, "loss": 2.2319, "step": 23624 }, { "epoch": 0.63, "learning_rate": 0.0006214012845887318, "loss": 2.5541, "step": 23625 }, { "epoch": 0.63, "learning_rate": 0.0006213207259470179, "loss": 2.5039, "step": 23626 }, { "epoch": 0.63, "learning_rate": 0.0006212401701741106, "loss": 2.1422, "step": 23627 }, { "epoch": 0.63, "learning_rate": 0.0006211596172706196, "loss": 2.5024, "step": 23628 }, { "epoch": 0.64, "learning_rate": 0.0006210790672371558, "loss": 2.483, "step": 23629 }, { "epoch": 0.64, "learning_rate": 0.0006209985200743297, "loss": 2.4574, "step": 23630 }, { "epoch": 0.64, "learning_rate": 0.0006209179757827505, "loss": 2.0291, "step": 23631 }, { "epoch": 0.64, "learning_rate": 0.000620837434363029, "loss": 2.5278, "step": 23632 }, { "epoch": 0.64, "learning_rate": 0.0006207568958157757, "loss": 2.4044, "step": 23633 }, { "epoch": 0.64, "learning_rate": 0.0006206763601416, "loss": 2.6133, "step": 23634 }, { "epoch": 0.64, "learning_rate": 0.0006205958273411125, "loss": 2.4018, "step": 23635 }, { "epoch": 0.64, "learning_rate": 0.0006205152974149232, "loss": 2.0833, "step": 23636 }, { "epoch": 0.64, "learning_rate": 0.0006204347703636419, "loss": 2.373, "step": 23637 }, { "epoch": 0.64, "learning_rate": 0.0006203542461878793, "loss": 2.7116, "step": 23638 }, { "epoch": 0.64, "learning_rate": 0.0006202737248882449, "loss": 2.4141, "step": 23639 }, { "epoch": 0.64, "learning_rate": 0.0006201932064653487, "loss": 3.0148, "step": 23640 }, { "epoch": 0.64, "learning_rate": 0.0006201126909198011, "loss": 2.4269, "step": 23641 }, { "epoch": 0.64, "learning_rate": 0.0006200321782522118, "loss": 2.4607, "step": 23642 }, { "epoch": 0.64, "learning_rate": 0.0006199516684631909, "loss": 2.6178, "step": 23643 }, { "epoch": 0.64, "learning_rate": 0.0006198711615533481, "loss": 2.6486, "step": 23644 }, { "epoch": 0.64, "learning_rate": 0.000619790657523293, "loss": 2.2808, "step": 23645 }, { "epoch": 0.64, "learning_rate": 0.0006197101563736367, "loss": 3.0081, "step": 23646 }, { "epoch": 0.64, "learning_rate": 0.0006196296581049877, "loss": 2.9652, "step": 23647 }, { "epoch": 0.64, "learning_rate": 0.0006195491627179566, "loss": 2.0113, "step": 23648 }, { "epoch": 0.64, "learning_rate": 0.000619468670213153, "loss": 2.6209, "step": 23649 }, { "epoch": 0.64, "learning_rate": 0.0006193881805911867, "loss": 2.2795, "step": 23650 }, { "epoch": 0.64, "learning_rate": 0.0006193076938526676, "loss": 2.701, "step": 23651 }, { "epoch": 0.64, "learning_rate": 0.000619227209998205, "loss": 2.698, "step": 23652 }, { "epoch": 0.64, "learning_rate": 0.0006191467290284091, "loss": 2.3437, "step": 23653 }, { "epoch": 0.64, "learning_rate": 0.0006190662509438898, "loss": 2.1217, "step": 23654 }, { "epoch": 0.64, "learning_rate": 0.0006189857757452563, "loss": 2.5374, "step": 23655 }, { "epoch": 0.64, "learning_rate": 0.0006189053034331184, "loss": 2.5746, "step": 23656 }, { "epoch": 0.64, "learning_rate": 0.0006188248340080861, "loss": 2.021, "step": 23657 }, { "epoch": 0.64, "learning_rate": 0.0006187443674707681, "loss": 2.5066, "step": 23658 }, { "epoch": 0.64, "learning_rate": 0.0006186639038217753, "loss": 2.7253, "step": 23659 }, { "epoch": 0.64, "learning_rate": 0.0006185834430617161, "loss": 2.4574, "step": 23660 }, { "epoch": 0.64, "learning_rate": 0.0006185029851912007, "loss": 2.7076, "step": 23661 }, { "epoch": 0.64, "learning_rate": 0.0006184225302108386, "loss": 2.2776, "step": 23662 }, { "epoch": 0.64, "learning_rate": 0.0006183420781212389, "loss": 2.7832, "step": 23663 }, { "epoch": 0.64, "learning_rate": 0.0006182616289230114, "loss": 2.4608, "step": 23664 }, { "epoch": 0.64, "learning_rate": 0.0006181811826167658, "loss": 2.6354, "step": 23665 }, { "epoch": 0.64, "learning_rate": 0.0006181007392031112, "loss": 2.4764, "step": 23666 }, { "epoch": 0.64, "learning_rate": 0.000618020298682657, "loss": 2.2948, "step": 23667 }, { "epoch": 0.64, "learning_rate": 0.0006179398610560129, "loss": 2.7735, "step": 23668 }, { "epoch": 0.64, "learning_rate": 0.000617859426323788, "loss": 2.7098, "step": 23669 }, { "epoch": 0.64, "learning_rate": 0.0006177789944865922, "loss": 2.4799, "step": 23670 }, { "epoch": 0.64, "learning_rate": 0.0006176985655450335, "loss": 2.784, "step": 23671 }, { "epoch": 0.64, "learning_rate": 0.0006176181394997227, "loss": 2.2754, "step": 23672 }, { "epoch": 0.64, "learning_rate": 0.0006175377163512688, "loss": 2.4471, "step": 23673 }, { "epoch": 0.64, "learning_rate": 0.0006174572961002802, "loss": 2.5741, "step": 23674 }, { "epoch": 0.64, "learning_rate": 0.0006173768787473667, "loss": 2.5161, "step": 23675 }, { "epoch": 0.64, "learning_rate": 0.0006172964642931381, "loss": 2.9882, "step": 23676 }, { "epoch": 0.64, "learning_rate": 0.0006172160527382027, "loss": 1.9969, "step": 23677 }, { "epoch": 0.64, "learning_rate": 0.0006171356440831704, "loss": 2.3943, "step": 23678 }, { "epoch": 0.64, "learning_rate": 0.0006170552383286495, "loss": 2.6358, "step": 23679 }, { "epoch": 0.64, "learning_rate": 0.0006169748354752498, "loss": 2.5355, "step": 23680 }, { "epoch": 0.64, "learning_rate": 0.0006168944355235805, "loss": 2.5208, "step": 23681 }, { "epoch": 0.64, "learning_rate": 0.0006168140384742502, "loss": 2.2701, "step": 23682 }, { "epoch": 0.64, "learning_rate": 0.0006167336443278684, "loss": 2.0333, "step": 23683 }, { "epoch": 0.64, "learning_rate": 0.0006166532530850439, "loss": 2.3386, "step": 23684 }, { "epoch": 0.64, "learning_rate": 0.0006165728647463858, "loss": 2.7174, "step": 23685 }, { "epoch": 0.64, "learning_rate": 0.0006164924793125035, "loss": 2.1583, "step": 23686 }, { "epoch": 0.64, "learning_rate": 0.0006164120967840052, "loss": 2.7961, "step": 23687 }, { "epoch": 0.64, "learning_rate": 0.0006163317171615001, "loss": 2.598, "step": 23688 }, { "epoch": 0.64, "learning_rate": 0.0006162513404455981, "loss": 2.6926, "step": 23689 }, { "epoch": 0.64, "learning_rate": 0.0006161709666369067, "loss": 2.6269, "step": 23690 }, { "epoch": 0.64, "learning_rate": 0.0006160905957360354, "loss": 2.5913, "step": 23691 }, { "epoch": 0.64, "learning_rate": 0.0006160102277435935, "loss": 2.7931, "step": 23692 }, { "epoch": 0.64, "learning_rate": 0.000615929862660189, "loss": 2.8909, "step": 23693 }, { "epoch": 0.64, "learning_rate": 0.0006158495004864316, "loss": 2.7634, "step": 23694 }, { "epoch": 0.64, "learning_rate": 0.0006157691412229295, "loss": 2.2526, "step": 23695 }, { "epoch": 0.64, "learning_rate": 0.0006156887848702917, "loss": 2.4216, "step": 23696 }, { "epoch": 0.64, "learning_rate": 0.000615608431429127, "loss": 2.4653, "step": 23697 }, { "epoch": 0.64, "learning_rate": 0.0006155280809000441, "loss": 2.5775, "step": 23698 }, { "epoch": 0.64, "learning_rate": 0.0006154477332836516, "loss": 2.7758, "step": 23699 }, { "epoch": 0.64, "learning_rate": 0.0006153673885805587, "loss": 2.5061, "step": 23700 }, { "epoch": 0.64, "learning_rate": 0.0006152870467913731, "loss": 2.2168, "step": 23701 }, { "epoch": 0.64, "learning_rate": 0.0006152067079167047, "loss": 2.7856, "step": 23702 }, { "epoch": 0.64, "learning_rate": 0.0006151263719571612, "loss": 2.3954, "step": 23703 }, { "epoch": 0.64, "learning_rate": 0.0006150460389133514, "loss": 2.5647, "step": 23704 }, { "epoch": 0.64, "learning_rate": 0.0006149657087858842, "loss": 2.5196, "step": 23705 }, { "epoch": 0.64, "learning_rate": 0.0006148853815753677, "loss": 2.2209, "step": 23706 }, { "epoch": 0.64, "learning_rate": 0.0006148050572824106, "loss": 2.4819, "step": 23707 }, { "epoch": 0.64, "learning_rate": 0.0006147247359076219, "loss": 2.2528, "step": 23708 }, { "epoch": 0.64, "learning_rate": 0.0006146444174516094, "loss": 2.243, "step": 23709 }, { "epoch": 0.64, "learning_rate": 0.000614564101914982, "loss": 2.7462, "step": 23710 }, { "epoch": 0.64, "learning_rate": 0.0006144837892983482, "loss": 2.6912, "step": 23711 }, { "epoch": 0.64, "learning_rate": 0.0006144034796023161, "loss": 2.4337, "step": 23712 }, { "epoch": 0.64, "learning_rate": 0.0006143231728274947, "loss": 2.1809, "step": 23713 }, { "epoch": 0.64, "learning_rate": 0.0006142428689744914, "loss": 2.4379, "step": 23714 }, { "epoch": 0.64, "learning_rate": 0.0006141625680439153, "loss": 2.34, "step": 23715 }, { "epoch": 0.64, "learning_rate": 0.000614082270036375, "loss": 2.3796, "step": 23716 }, { "epoch": 0.64, "learning_rate": 0.0006140019749524782, "loss": 2.6227, "step": 23717 }, { "epoch": 0.64, "learning_rate": 0.0006139216827928331, "loss": 2.1206, "step": 23718 }, { "epoch": 0.64, "learning_rate": 0.000613841393558049, "loss": 3.0352, "step": 23719 }, { "epoch": 0.64, "learning_rate": 0.0006137611072487329, "loss": 2.3587, "step": 23720 }, { "epoch": 0.64, "learning_rate": 0.0006136808238654939, "loss": 2.6106, "step": 23721 }, { "epoch": 0.64, "learning_rate": 0.0006136005434089397, "loss": 2.4175, "step": 23722 }, { "epoch": 0.64, "learning_rate": 0.0006135202658796787, "loss": 2.9931, "step": 23723 }, { "epoch": 0.64, "learning_rate": 0.0006134399912783193, "loss": 2.2239, "step": 23724 }, { "epoch": 0.64, "learning_rate": 0.0006133597196054691, "loss": 2.2495, "step": 23725 }, { "epoch": 0.64, "learning_rate": 0.0006132794508617365, "loss": 3.165, "step": 23726 }, { "epoch": 0.64, "learning_rate": 0.0006131991850477301, "loss": 2.8749, "step": 23727 }, { "epoch": 0.64, "learning_rate": 0.0006131189221640572, "loss": 2.4025, "step": 23728 }, { "epoch": 0.64, "learning_rate": 0.0006130386622113265, "loss": 2.1401, "step": 23729 }, { "epoch": 0.64, "learning_rate": 0.0006129584051901454, "loss": 2.5145, "step": 23730 }, { "epoch": 0.64, "learning_rate": 0.0006128781511011219, "loss": 2.6806, "step": 23731 }, { "epoch": 0.64, "learning_rate": 0.0006127978999448652, "loss": 2.0151, "step": 23732 }, { "epoch": 0.64, "learning_rate": 0.0006127176517219816, "loss": 2.2255, "step": 23733 }, { "epoch": 0.64, "learning_rate": 0.0006126374064330801, "loss": 2.5367, "step": 23734 }, { "epoch": 0.64, "learning_rate": 0.0006125571640787684, "loss": 2.6611, "step": 23735 }, { "epoch": 0.64, "learning_rate": 0.0006124769246596542, "loss": 2.6317, "step": 23736 }, { "epoch": 0.64, "learning_rate": 0.0006123966881763458, "loss": 2.6031, "step": 23737 }, { "epoch": 0.64, "learning_rate": 0.0006123164546294506, "loss": 2.5864, "step": 23738 }, { "epoch": 0.64, "learning_rate": 0.0006122362240195767, "loss": 2.597, "step": 23739 }, { "epoch": 0.64, "learning_rate": 0.0006121559963473318, "loss": 2.4769, "step": 23740 }, { "epoch": 0.64, "learning_rate": 0.0006120757716133237, "loss": 2.4844, "step": 23741 }, { "epoch": 0.64, "learning_rate": 0.0006119955498181602, "loss": 2.6763, "step": 23742 }, { "epoch": 0.64, "learning_rate": 0.0006119153309624495, "loss": 2.5095, "step": 23743 }, { "epoch": 0.64, "learning_rate": 0.000611835115046798, "loss": 2.6431, "step": 23744 }, { "epoch": 0.64, "learning_rate": 0.0006117549020718148, "loss": 2.1823, "step": 23745 }, { "epoch": 0.64, "learning_rate": 0.0006116746920381073, "loss": 2.9738, "step": 23746 }, { "epoch": 0.64, "learning_rate": 0.0006115944849462825, "loss": 1.9449, "step": 23747 }, { "epoch": 0.64, "learning_rate": 0.0006115142807969486, "loss": 2.5418, "step": 23748 }, { "epoch": 0.64, "learning_rate": 0.0006114340795907129, "loss": 2.3252, "step": 23749 }, { "epoch": 0.64, "learning_rate": 0.0006113538813281831, "loss": 2.4655, "step": 23750 }, { "epoch": 0.64, "learning_rate": 0.000611273686009967, "loss": 2.7435, "step": 23751 }, { "epoch": 0.64, "learning_rate": 0.0006111934936366719, "loss": 2.4113, "step": 23752 }, { "epoch": 0.64, "learning_rate": 0.0006111133042089053, "loss": 2.3529, "step": 23753 }, { "epoch": 0.64, "learning_rate": 0.000611033117727275, "loss": 2.5245, "step": 23754 }, { "epoch": 0.64, "learning_rate": 0.000610952934192388, "loss": 2.2106, "step": 23755 }, { "epoch": 0.64, "learning_rate": 0.0006108727536048525, "loss": 2.3648, "step": 23756 }, { "epoch": 0.64, "learning_rate": 0.0006107925759652748, "loss": 2.547, "step": 23757 }, { "epoch": 0.64, "learning_rate": 0.0006107124012742631, "loss": 2.4258, "step": 23758 }, { "epoch": 0.64, "learning_rate": 0.0006106322295324251, "loss": 2.4625, "step": 23759 }, { "epoch": 0.64, "learning_rate": 0.0006105520607403672, "loss": 2.4615, "step": 23760 }, { "epoch": 0.64, "learning_rate": 0.0006104718948986974, "loss": 2.4394, "step": 23761 }, { "epoch": 0.64, "learning_rate": 0.0006103917320080233, "loss": 2.5791, "step": 23762 }, { "epoch": 0.64, "learning_rate": 0.0006103115720689513, "loss": 2.4313, "step": 23763 }, { "epoch": 0.64, "learning_rate": 0.0006102314150820894, "loss": 2.6677, "step": 23764 }, { "epoch": 0.64, "learning_rate": 0.0006101512610480444, "loss": 2.2984, "step": 23765 }, { "epoch": 0.64, "learning_rate": 0.0006100711099674238, "loss": 2.0494, "step": 23766 }, { "epoch": 0.64, "learning_rate": 0.000609990961840835, "loss": 2.6326, "step": 23767 }, { "epoch": 0.64, "learning_rate": 0.0006099108166688847, "loss": 2.3496, "step": 23768 }, { "epoch": 0.64, "learning_rate": 0.0006098306744521802, "loss": 2.3946, "step": 23769 }, { "epoch": 0.64, "learning_rate": 0.000609750535191329, "loss": 2.0497, "step": 23770 }, { "epoch": 0.64, "learning_rate": 0.0006096703988869379, "loss": 2.3367, "step": 23771 }, { "epoch": 0.64, "learning_rate": 0.0006095902655396144, "loss": 2.8973, "step": 23772 }, { "epoch": 0.64, "learning_rate": 0.0006095101351499646, "loss": 2.5587, "step": 23773 }, { "epoch": 0.64, "learning_rate": 0.0006094300077185966, "loss": 3.0196, "step": 23774 }, { "epoch": 0.64, "learning_rate": 0.0006093498832461173, "loss": 2.7352, "step": 23775 }, { "epoch": 0.64, "learning_rate": 0.0006092697617331329, "loss": 2.7079, "step": 23776 }, { "epoch": 0.64, "learning_rate": 0.0006091896431802508, "loss": 2.8503, "step": 23777 }, { "epoch": 0.64, "learning_rate": 0.000609109527588079, "loss": 2.3576, "step": 23778 }, { "epoch": 0.64, "learning_rate": 0.0006090294149572227, "loss": 2.4005, "step": 23779 }, { "epoch": 0.64, "learning_rate": 0.00060894930528829, "loss": 2.1699, "step": 23780 }, { "epoch": 0.64, "learning_rate": 0.0006088691985818874, "loss": 2.4109, "step": 23781 }, { "epoch": 0.64, "learning_rate": 0.0006087890948386216, "loss": 2.5532, "step": 23782 }, { "epoch": 0.64, "learning_rate": 0.0006087089940591, "loss": 2.3836, "step": 23783 }, { "epoch": 0.64, "learning_rate": 0.0006086288962439291, "loss": 2.9845, "step": 23784 }, { "epoch": 0.64, "learning_rate": 0.0006085488013937154, "loss": 2.6461, "step": 23785 }, { "epoch": 0.64, "learning_rate": 0.0006084687095090662, "loss": 2.6062, "step": 23786 }, { "epoch": 0.64, "learning_rate": 0.000608388620590588, "loss": 2.1737, "step": 23787 }, { "epoch": 0.64, "learning_rate": 0.0006083085346388875, "loss": 2.363, "step": 23788 }, { "epoch": 0.64, "learning_rate": 0.000608228451654572, "loss": 2.4894, "step": 23789 }, { "epoch": 0.64, "learning_rate": 0.0006081483716382471, "loss": 2.0407, "step": 23790 }, { "epoch": 0.64, "learning_rate": 0.0006080682945905207, "loss": 2.2416, "step": 23791 }, { "epoch": 0.64, "learning_rate": 0.0006079882205119984, "loss": 2.5384, "step": 23792 }, { "epoch": 0.64, "learning_rate": 0.0006079081494032872, "loss": 1.9749, "step": 23793 }, { "epoch": 0.64, "learning_rate": 0.000607828081264994, "loss": 2.8404, "step": 23794 }, { "epoch": 0.64, "learning_rate": 0.0006077480160977249, "loss": 2.4045, "step": 23795 }, { "epoch": 0.64, "learning_rate": 0.0006076679539020869, "loss": 2.3887, "step": 23796 }, { "epoch": 0.64, "learning_rate": 0.0006075878946786863, "loss": 2.7106, "step": 23797 }, { "epoch": 0.64, "learning_rate": 0.0006075078384281295, "loss": 2.7184, "step": 23798 }, { "epoch": 0.64, "learning_rate": 0.0006074277851510235, "loss": 2.3798, "step": 23799 }, { "epoch": 0.64, "learning_rate": 0.000607347734847974, "loss": 2.7203, "step": 23800 }, { "epoch": 0.64, "learning_rate": 0.0006072676875195879, "loss": 2.5924, "step": 23801 }, { "epoch": 0.64, "learning_rate": 0.0006071876431664721, "loss": 2.7894, "step": 23802 }, { "epoch": 0.64, "learning_rate": 0.0006071076017892319, "loss": 2.5023, "step": 23803 }, { "epoch": 0.64, "learning_rate": 0.0006070275633884743, "loss": 2.5459, "step": 23804 }, { "epoch": 0.64, "learning_rate": 0.0006069475279648062, "loss": 2.3776, "step": 23805 }, { "epoch": 0.64, "learning_rate": 0.0006068674955188329, "loss": 2.8249, "step": 23806 }, { "epoch": 0.64, "learning_rate": 0.0006067874660511613, "loss": 2.7934, "step": 23807 }, { "epoch": 0.64, "learning_rate": 0.0006067074395623974, "loss": 2.3503, "step": 23808 }, { "epoch": 0.64, "learning_rate": 0.0006066274160531475, "loss": 2.3564, "step": 23809 }, { "epoch": 0.64, "learning_rate": 0.0006065473955240184, "loss": 2.3774, "step": 23810 }, { "epoch": 0.64, "learning_rate": 0.0006064673779756156, "loss": 2.8161, "step": 23811 }, { "epoch": 0.64, "learning_rate": 0.0006063873634085455, "loss": 2.162, "step": 23812 }, { "epoch": 0.64, "learning_rate": 0.0006063073518234146, "loss": 2.3786, "step": 23813 }, { "epoch": 0.64, "learning_rate": 0.0006062273432208287, "loss": 2.5763, "step": 23814 }, { "epoch": 0.64, "learning_rate": 0.0006061473376013945, "loss": 2.7324, "step": 23815 }, { "epoch": 0.64, "learning_rate": 0.0006060673349657169, "loss": 2.457, "step": 23816 }, { "epoch": 0.64, "learning_rate": 0.000605987335314403, "loss": 2.1905, "step": 23817 }, { "epoch": 0.64, "learning_rate": 0.0006059073386480591, "loss": 2.502, "step": 23818 }, { "epoch": 0.64, "learning_rate": 0.0006058273449672902, "loss": 2.549, "step": 23819 }, { "epoch": 0.64, "learning_rate": 0.0006057473542727027, "loss": 2.7421, "step": 23820 }, { "epoch": 0.64, "learning_rate": 0.0006056673665649033, "loss": 2.5808, "step": 23821 }, { "epoch": 0.64, "learning_rate": 0.0006055873818444971, "loss": 2.3166, "step": 23822 }, { "epoch": 0.64, "learning_rate": 0.0006055074001120904, "loss": 2.5704, "step": 23823 }, { "epoch": 0.64, "learning_rate": 0.0006054274213682893, "loss": 2.4186, "step": 23824 }, { "epoch": 0.64, "learning_rate": 0.0006053474456136994, "loss": 2.3482, "step": 23825 }, { "epoch": 0.64, "learning_rate": 0.0006052674728489267, "loss": 2.5362, "step": 23826 }, { "epoch": 0.64, "learning_rate": 0.000605187503074577, "loss": 2.3624, "step": 23827 }, { "epoch": 0.64, "learning_rate": 0.0006051075362912561, "loss": 2.605, "step": 23828 }, { "epoch": 0.64, "learning_rate": 0.0006050275724995702, "loss": 2.2417, "step": 23829 }, { "epoch": 0.64, "learning_rate": 0.0006049476117001245, "loss": 2.4819, "step": 23830 }, { "epoch": 0.64, "learning_rate": 0.0006048676538935251, "loss": 2.1356, "step": 23831 }, { "epoch": 0.64, "learning_rate": 0.0006047876990803781, "loss": 2.2007, "step": 23832 }, { "epoch": 0.64, "learning_rate": 0.0006047077472612883, "loss": 2.6506, "step": 23833 }, { "epoch": 0.64, "learning_rate": 0.0006046277984368625, "loss": 2.3867, "step": 23834 }, { "epoch": 0.64, "learning_rate": 0.0006045478526077052, "loss": 3.0319, "step": 23835 }, { "epoch": 0.64, "learning_rate": 0.000604467909774423, "loss": 2.6032, "step": 23836 }, { "epoch": 0.64, "learning_rate": 0.0006043879699376214, "loss": 2.7335, "step": 23837 }, { "epoch": 0.64, "learning_rate": 0.0006043080330979054, "loss": 2.807, "step": 23838 }, { "epoch": 0.64, "learning_rate": 0.000604228099255881, "loss": 2.9542, "step": 23839 }, { "epoch": 0.64, "learning_rate": 0.0006041481684121541, "loss": 2.7864, "step": 23840 }, { "epoch": 0.64, "learning_rate": 0.0006040682405673297, "loss": 2.577, "step": 23841 }, { "epoch": 0.64, "learning_rate": 0.0006039883157220136, "loss": 2.5894, "step": 23842 }, { "epoch": 0.64, "learning_rate": 0.0006039083938768111, "loss": 2.4695, "step": 23843 }, { "epoch": 0.64, "learning_rate": 0.0006038284750323278, "loss": 2.6923, "step": 23844 }, { "epoch": 0.64, "learning_rate": 0.0006037485591891694, "loss": 2.3619, "step": 23845 }, { "epoch": 0.64, "learning_rate": 0.0006036686463479406, "loss": 2.1807, "step": 23846 }, { "epoch": 0.64, "learning_rate": 0.0006035887365092476, "loss": 2.106, "step": 23847 }, { "epoch": 0.64, "learning_rate": 0.0006035088296736957, "loss": 2.5215, "step": 23848 }, { "epoch": 0.64, "learning_rate": 0.0006034289258418897, "loss": 2.0829, "step": 23849 }, { "epoch": 0.64, "learning_rate": 0.0006033490250144354, "loss": 2.4617, "step": 23850 }, { "epoch": 0.64, "learning_rate": 0.0006032691271919377, "loss": 2.3809, "step": 23851 }, { "epoch": 0.64, "learning_rate": 0.0006031892323750023, "loss": 2.8749, "step": 23852 }, { "epoch": 0.64, "learning_rate": 0.0006031093405642345, "loss": 2.9161, "step": 23853 }, { "epoch": 0.64, "learning_rate": 0.0006030294517602392, "loss": 2.3223, "step": 23854 }, { "epoch": 0.64, "learning_rate": 0.0006029495659636218, "loss": 1.8368, "step": 23855 }, { "epoch": 0.64, "learning_rate": 0.0006028696831749876, "loss": 2.6039, "step": 23856 }, { "epoch": 0.64, "learning_rate": 0.0006027898033949415, "loss": 2.5916, "step": 23857 }, { "epoch": 0.64, "learning_rate": 0.000602709926624089, "loss": 2.2806, "step": 23858 }, { "epoch": 0.64, "learning_rate": 0.0006026300528630351, "loss": 2.5827, "step": 23859 }, { "epoch": 0.64, "learning_rate": 0.0006025501821123846, "loss": 2.8285, "step": 23860 }, { "epoch": 0.64, "learning_rate": 0.0006024703143727435, "loss": 2.2626, "step": 23861 }, { "epoch": 0.64, "learning_rate": 0.0006023904496447156, "loss": 2.4368, "step": 23862 }, { "epoch": 0.64, "learning_rate": 0.0006023105879289066, "loss": 2.3312, "step": 23863 }, { "epoch": 0.64, "learning_rate": 0.0006022307292259219, "loss": 2.4811, "step": 23864 }, { "epoch": 0.64, "learning_rate": 0.0006021508735363659, "loss": 2.583, "step": 23865 }, { "epoch": 0.64, "learning_rate": 0.0006020710208608436, "loss": 2.8661, "step": 23866 }, { "epoch": 0.64, "learning_rate": 0.0006019911711999602, "loss": 2.3522, "step": 23867 }, { "epoch": 0.64, "learning_rate": 0.0006019113245543204, "loss": 2.8414, "step": 23868 }, { "epoch": 0.64, "learning_rate": 0.0006018314809245295, "loss": 2.4115, "step": 23869 }, { "epoch": 0.64, "learning_rate": 0.0006017516403111919, "loss": 2.3749, "step": 23870 }, { "epoch": 0.64, "learning_rate": 0.0006016718027149126, "loss": 2.6208, "step": 23871 }, { "epoch": 0.64, "learning_rate": 0.0006015919681362968, "loss": 2.4994, "step": 23872 }, { "epoch": 0.64, "learning_rate": 0.0006015121365759488, "loss": 2.6452, "step": 23873 }, { "epoch": 0.64, "learning_rate": 0.0006014323080344735, "loss": 2.5307, "step": 23874 }, { "epoch": 0.64, "learning_rate": 0.0006013524825124764, "loss": 2.5486, "step": 23875 }, { "epoch": 0.64, "learning_rate": 0.0006012726600105609, "loss": 2.629, "step": 23876 }, { "epoch": 0.64, "learning_rate": 0.0006011928405293329, "loss": 2.3316, "step": 23877 }, { "epoch": 0.64, "learning_rate": 0.0006011130240693964, "loss": 2.4474, "step": 23878 }, { "epoch": 0.64, "learning_rate": 0.0006010332106313563, "loss": 2.5026, "step": 23879 }, { "epoch": 0.64, "learning_rate": 0.0006009534002158175, "loss": 2.4868, "step": 23880 }, { "epoch": 0.64, "learning_rate": 0.0006008735928233842, "loss": 2.8514, "step": 23881 }, { "epoch": 0.64, "learning_rate": 0.0006007937884546611, "loss": 2.7817, "step": 23882 }, { "epoch": 0.64, "learning_rate": 0.0006007139871102531, "loss": 2.2072, "step": 23883 }, { "epoch": 0.64, "learning_rate": 0.0006006341887907644, "loss": 2.4028, "step": 23884 }, { "epoch": 0.64, "learning_rate": 0.0006005543934967999, "loss": 3.0695, "step": 23885 }, { "epoch": 0.64, "learning_rate": 0.0006004746012289637, "loss": 2.2332, "step": 23886 }, { "epoch": 0.64, "learning_rate": 0.0006003948119878605, "loss": 2.363, "step": 23887 }, { "epoch": 0.64, "learning_rate": 0.0006003150257740951, "loss": 2.4865, "step": 23888 }, { "epoch": 0.64, "learning_rate": 0.0006002352425882712, "loss": 2.7684, "step": 23889 }, { "epoch": 0.64, "learning_rate": 0.0006001554624309935, "loss": 2.4568, "step": 23890 }, { "epoch": 0.64, "learning_rate": 0.0006000756853028671, "loss": 2.3895, "step": 23891 }, { "epoch": 0.64, "learning_rate": 0.0005999959112044955, "loss": 2.5146, "step": 23892 }, { "epoch": 0.64, "learning_rate": 0.000599916140136483, "loss": 2.0891, "step": 23893 }, { "epoch": 0.64, "learning_rate": 0.0005998363720994351, "loss": 2.3572, "step": 23894 }, { "epoch": 0.64, "learning_rate": 0.0005997566070939547, "loss": 2.1819, "step": 23895 }, { "epoch": 0.64, "learning_rate": 0.0005996768451206469, "loss": 2.3837, "step": 23896 }, { "epoch": 0.64, "learning_rate": 0.0005995970861801157, "loss": 1.9437, "step": 23897 }, { "epoch": 0.64, "learning_rate": 0.0005995173302729653, "loss": 2.7042, "step": 23898 }, { "epoch": 0.64, "learning_rate": 0.0005994375773998003, "loss": 2.474, "step": 23899 }, { "epoch": 0.64, "learning_rate": 0.0005993578275612241, "loss": 2.3011, "step": 23900 }, { "epoch": 0.64, "learning_rate": 0.0005992780807578418, "loss": 2.6379, "step": 23901 }, { "epoch": 0.64, "learning_rate": 0.000599198336990257, "loss": 2.0212, "step": 23902 }, { "epoch": 0.64, "learning_rate": 0.0005991185962590737, "loss": 2.2275, "step": 23903 }, { "epoch": 0.64, "learning_rate": 0.0005990388585648969, "loss": 2.4511, "step": 23904 }, { "epoch": 0.64, "learning_rate": 0.0005989591239083294, "loss": 2.9103, "step": 23905 }, { "epoch": 0.64, "learning_rate": 0.0005988793922899758, "loss": 2.5886, "step": 23906 }, { "epoch": 0.64, "learning_rate": 0.0005987996637104409, "loss": 2.5014, "step": 23907 }, { "epoch": 0.64, "learning_rate": 0.0005987199381703274, "loss": 2.6078, "step": 23908 }, { "epoch": 0.64, "learning_rate": 0.00059864021567024, "loss": 2.7879, "step": 23909 }, { "epoch": 0.64, "learning_rate": 0.0005985604962107829, "loss": 2.2349, "step": 23910 }, { "epoch": 0.64, "learning_rate": 0.0005984807797925593, "loss": 2.3389, "step": 23911 }, { "epoch": 0.64, "learning_rate": 0.0005984010664161739, "loss": 2.5055, "step": 23912 }, { "epoch": 0.64, "learning_rate": 0.00059832135608223, "loss": 2.6172, "step": 23913 }, { "epoch": 0.64, "learning_rate": 0.0005982416487913315, "loss": 2.5173, "step": 23914 }, { "epoch": 0.64, "learning_rate": 0.0005981619445440829, "loss": 2.6721, "step": 23915 }, { "epoch": 0.64, "learning_rate": 0.0005980822433410872, "loss": 2.3724, "step": 23916 }, { "epoch": 0.64, "learning_rate": 0.0005980025451829486, "loss": 2.5594, "step": 23917 }, { "epoch": 0.64, "learning_rate": 0.0005979228500702712, "loss": 2.3645, "step": 23918 }, { "epoch": 0.64, "learning_rate": 0.0005978431580036579, "loss": 2.046, "step": 23919 }, { "epoch": 0.64, "learning_rate": 0.0005977634689837135, "loss": 2.3993, "step": 23920 }, { "epoch": 0.64, "learning_rate": 0.0005976837830110409, "loss": 2.5103, "step": 23921 }, { "epoch": 0.64, "learning_rate": 0.0005976041000862438, "loss": 2.596, "step": 23922 }, { "epoch": 0.64, "learning_rate": 0.0005975244202099264, "loss": 2.6002, "step": 23923 }, { "epoch": 0.64, "learning_rate": 0.0005974447433826917, "loss": 2.5639, "step": 23924 }, { "epoch": 0.64, "learning_rate": 0.0005973650696051438, "loss": 2.7445, "step": 23925 }, { "epoch": 0.64, "learning_rate": 0.0005972853988778864, "loss": 2.5336, "step": 23926 }, { "epoch": 0.64, "learning_rate": 0.0005972057312015225, "loss": 2.6502, "step": 23927 }, { "epoch": 0.64, "learning_rate": 0.000597126066576656, "loss": 2.3054, "step": 23928 }, { "epoch": 0.64, "learning_rate": 0.0005970464050038906, "loss": 2.6616, "step": 23929 }, { "epoch": 0.64, "learning_rate": 0.0005969667464838293, "loss": 2.1497, "step": 23930 }, { "epoch": 0.64, "learning_rate": 0.0005968870910170763, "loss": 2.209, "step": 23931 }, { "epoch": 0.64, "learning_rate": 0.0005968074386042342, "loss": 2.8436, "step": 23932 }, { "epoch": 0.64, "learning_rate": 0.0005967277892459068, "loss": 2.8055, "step": 23933 }, { "epoch": 0.64, "learning_rate": 0.0005966481429426982, "loss": 2.7504, "step": 23934 }, { "epoch": 0.64, "learning_rate": 0.0005965684996952106, "loss": 2.3971, "step": 23935 }, { "epoch": 0.64, "learning_rate": 0.000596488859504048, "loss": 2.4444, "step": 23936 }, { "epoch": 0.64, "learning_rate": 0.000596409222369814, "loss": 2.9027, "step": 23937 }, { "epoch": 0.64, "learning_rate": 0.0005963295882931112, "loss": 2.5064, "step": 23938 }, { "epoch": 0.64, "learning_rate": 0.0005962499572745436, "loss": 2.3899, "step": 23939 }, { "epoch": 0.64, "learning_rate": 0.0005961703293147138, "loss": 2.3363, "step": 23940 }, { "epoch": 0.64, "learning_rate": 0.0005960907044142254, "loss": 2.6835, "step": 23941 }, { "epoch": 0.64, "learning_rate": 0.0005960110825736819, "loss": 2.2178, "step": 23942 }, { "epoch": 0.64, "learning_rate": 0.0005959314637936859, "loss": 2.5079, "step": 23943 }, { "epoch": 0.64, "learning_rate": 0.0005958518480748409, "loss": 2.6326, "step": 23944 }, { "epoch": 0.64, "learning_rate": 0.0005957722354177503, "loss": 2.5179, "step": 23945 }, { "epoch": 0.64, "learning_rate": 0.0005956926258230169, "loss": 2.0012, "step": 23946 }, { "epoch": 0.64, "learning_rate": 0.0005956130192912441, "loss": 2.7195, "step": 23947 }, { "epoch": 0.64, "learning_rate": 0.0005955334158230341, "loss": 2.6868, "step": 23948 }, { "epoch": 0.64, "learning_rate": 0.000595453815418991, "loss": 2.5954, "step": 23949 }, { "epoch": 0.64, "learning_rate": 0.0005953742180797178, "loss": 2.3005, "step": 23950 }, { "epoch": 0.64, "learning_rate": 0.0005952946238058168, "loss": 2.5742, "step": 23951 }, { "epoch": 0.64, "learning_rate": 0.0005952150325978911, "loss": 2.3033, "step": 23952 }, { "epoch": 0.64, "learning_rate": 0.0005951354444565447, "loss": 2.5866, "step": 23953 }, { "epoch": 0.64, "learning_rate": 0.0005950558593823793, "loss": 2.4635, "step": 23954 }, { "epoch": 0.64, "learning_rate": 0.0005949762773759986, "loss": 2.7751, "step": 23955 }, { "epoch": 0.64, "learning_rate": 0.0005948966984380048, "loss": 2.5959, "step": 23956 }, { "epoch": 0.64, "learning_rate": 0.0005948171225690014, "loss": 2.7652, "step": 23957 }, { "epoch": 0.64, "learning_rate": 0.0005947375497695911, "loss": 2.5829, "step": 23958 }, { "epoch": 0.64, "learning_rate": 0.0005946579800403765, "loss": 2.7721, "step": 23959 }, { "epoch": 0.64, "learning_rate": 0.0005945784133819606, "loss": 2.252, "step": 23960 }, { "epoch": 0.64, "learning_rate": 0.0005944988497949464, "loss": 2.6299, "step": 23961 }, { "epoch": 0.64, "learning_rate": 0.0005944192892799362, "loss": 2.9826, "step": 23962 }, { "epoch": 0.64, "learning_rate": 0.0005943397318375333, "loss": 2.2493, "step": 23963 }, { "epoch": 0.64, "learning_rate": 0.0005942601774683396, "loss": 2.1999, "step": 23964 }, { "epoch": 0.64, "learning_rate": 0.0005941806261729582, "loss": 2.2492, "step": 23965 }, { "epoch": 0.64, "learning_rate": 0.0005941010779519924, "loss": 2.985, "step": 23966 }, { "epoch": 0.64, "learning_rate": 0.0005940215328060439, "loss": 2.6466, "step": 23967 }, { "epoch": 0.64, "learning_rate": 0.0005939419907357155, "loss": 2.8923, "step": 23968 }, { "epoch": 0.64, "learning_rate": 0.0005938624517416104, "loss": 2.6159, "step": 23969 }, { "epoch": 0.64, "learning_rate": 0.0005937829158243304, "loss": 2.32, "step": 23970 }, { "epoch": 0.64, "learning_rate": 0.0005937033829844784, "loss": 2.4183, "step": 23971 }, { "epoch": 0.64, "learning_rate": 0.0005936238532226572, "loss": 2.6502, "step": 23972 }, { "epoch": 0.64, "learning_rate": 0.0005935443265394689, "loss": 2.6002, "step": 23973 }, { "epoch": 0.64, "learning_rate": 0.0005934648029355163, "loss": 2.3773, "step": 23974 }, { "epoch": 0.64, "learning_rate": 0.0005933852824114014, "loss": 2.3001, "step": 23975 }, { "epoch": 0.64, "learning_rate": 0.0005933057649677269, "loss": 2.7018, "step": 23976 }, { "epoch": 0.64, "learning_rate": 0.0005932262506050956, "loss": 2.7014, "step": 23977 }, { "epoch": 0.64, "learning_rate": 0.000593146739324109, "loss": 2.836, "step": 23978 }, { "epoch": 0.64, "learning_rate": 0.00059306723112537, "loss": 2.6801, "step": 23979 }, { "epoch": 0.64, "learning_rate": 0.0005929877260094815, "loss": 2.525, "step": 23980 }, { "epoch": 0.64, "learning_rate": 0.0005929082239770447, "loss": 2.2362, "step": 23981 }, { "epoch": 0.64, "learning_rate": 0.0005928287250286625, "loss": 2.5777, "step": 23982 }, { "epoch": 0.64, "learning_rate": 0.0005927492291649372, "loss": 2.2093, "step": 23983 }, { "epoch": 0.64, "learning_rate": 0.0005926697363864707, "loss": 3.0417, "step": 23984 }, { "epoch": 0.64, "learning_rate": 0.0005925902466938658, "loss": 2.3857, "step": 23985 }, { "epoch": 0.64, "learning_rate": 0.000592510760087724, "loss": 2.2443, "step": 23986 }, { "epoch": 0.64, "learning_rate": 0.0005924312765686479, "loss": 2.3696, "step": 23987 }, { "epoch": 0.64, "learning_rate": 0.0005923517961372398, "loss": 2.3346, "step": 23988 }, { "epoch": 0.64, "learning_rate": 0.0005922723187941013, "loss": 1.9166, "step": 23989 }, { "epoch": 0.64, "learning_rate": 0.0005921928445398353, "loss": 2.203, "step": 23990 }, { "epoch": 0.64, "learning_rate": 0.0005921133733750428, "loss": 2.6425, "step": 23991 }, { "epoch": 0.64, "learning_rate": 0.0005920339053003267, "loss": 2.7651, "step": 23992 }, { "epoch": 0.64, "learning_rate": 0.0005919544403162891, "loss": 2.4739, "step": 23993 }, { "epoch": 0.64, "learning_rate": 0.0005918749784235314, "loss": 2.4579, "step": 23994 }, { "epoch": 0.64, "learning_rate": 0.0005917955196226557, "loss": 2.0093, "step": 23995 }, { "epoch": 0.64, "learning_rate": 0.0005917160639142647, "loss": 2.8966, "step": 23996 }, { "epoch": 0.64, "learning_rate": 0.0005916366112989594, "loss": 2.665, "step": 23997 }, { "epoch": 0.64, "learning_rate": 0.0005915571617773423, "loss": 2.5407, "step": 23998 }, { "epoch": 0.64, "learning_rate": 0.0005914777153500151, "loss": 2.4963, "step": 23999 }, { "epoch": 0.64, "learning_rate": 0.0005913982720175795, "loss": 1.9595, "step": 24000 }, { "epoch": 0.64, "learning_rate": 0.0005913188317806378, "loss": 2.5185, "step": 24001 }, { "epoch": 0.65, "learning_rate": 0.0005912393946397914, "loss": 2.5051, "step": 24002 }, { "epoch": 0.65, "learning_rate": 0.0005911599605956423, "loss": 2.6475, "step": 24003 }, { "epoch": 0.65, "learning_rate": 0.0005910805296487923, "loss": 2.6099, "step": 24004 }, { "epoch": 0.65, "learning_rate": 0.000591001101799843, "loss": 2.5539, "step": 24005 }, { "epoch": 0.65, "learning_rate": 0.0005909216770493962, "loss": 2.3436, "step": 24006 }, { "epoch": 0.65, "learning_rate": 0.0005908422553980541, "loss": 2.3238, "step": 24007 }, { "epoch": 0.65, "learning_rate": 0.0005907628368464172, "loss": 2.3518, "step": 24008 }, { "epoch": 0.65, "learning_rate": 0.0005906834213950887, "loss": 2.1574, "step": 24009 }, { "epoch": 0.65, "learning_rate": 0.0005906040090446687, "loss": 2.3098, "step": 24010 }, { "epoch": 0.65, "learning_rate": 0.0005905245997957598, "loss": 2.5291, "step": 24011 }, { "epoch": 0.65, "learning_rate": 0.0005904451936489634, "loss": 2.2175, "step": 24012 }, { "epoch": 0.65, "learning_rate": 0.000590365790604881, "loss": 2.5743, "step": 24013 }, { "epoch": 0.65, "learning_rate": 0.0005902863906641138, "loss": 2.1687, "step": 24014 }, { "epoch": 0.65, "learning_rate": 0.0005902069938272641, "loss": 2.4483, "step": 24015 }, { "epoch": 0.65, "learning_rate": 0.0005901276000949326, "loss": 2.4275, "step": 24016 }, { "epoch": 0.65, "learning_rate": 0.0005900482094677214, "loss": 2.443, "step": 24017 }, { "epoch": 0.65, "learning_rate": 0.0005899688219462315, "loss": 2.5434, "step": 24018 }, { "epoch": 0.65, "learning_rate": 0.0005898894375310643, "loss": 2.5717, "step": 24019 }, { "epoch": 0.65, "learning_rate": 0.0005898100562228222, "loss": 2.4934, "step": 24020 }, { "epoch": 0.65, "learning_rate": 0.0005897306780221048, "loss": 2.7922, "step": 24021 }, { "epoch": 0.65, "learning_rate": 0.0005896513029295148, "loss": 2.7071, "step": 24022 }, { "epoch": 0.65, "learning_rate": 0.0005895719309456536, "loss": 2.4838, "step": 24023 }, { "epoch": 0.65, "learning_rate": 0.0005894925620711216, "loss": 2.7302, "step": 24024 }, { "epoch": 0.65, "learning_rate": 0.0005894131963065208, "loss": 2.7345, "step": 24025 }, { "epoch": 0.65, "learning_rate": 0.0005893338336524518, "loss": 2.0988, "step": 24026 }, { "epoch": 0.65, "learning_rate": 0.0005892544741095166, "loss": 2.3243, "step": 24027 }, { "epoch": 0.65, "learning_rate": 0.0005891751176783161, "loss": 2.3062, "step": 24028 }, { "epoch": 0.65, "learning_rate": 0.0005890957643594513, "loss": 2.47, "step": 24029 }, { "epoch": 0.65, "learning_rate": 0.0005890164141535235, "loss": 2.4075, "step": 24030 }, { "epoch": 0.65, "learning_rate": 0.0005889370670611341, "loss": 2.428, "step": 24031 }, { "epoch": 0.65, "learning_rate": 0.0005888577230828837, "loss": 2.4471, "step": 24032 }, { "epoch": 0.65, "learning_rate": 0.0005887783822193742, "loss": 2.4927, "step": 24033 }, { "epoch": 0.65, "learning_rate": 0.0005886990444712055, "loss": 2.6759, "step": 24034 }, { "epoch": 0.65, "learning_rate": 0.0005886197098389793, "loss": 2.7055, "step": 24035 }, { "epoch": 0.65, "learning_rate": 0.0005885403783232974, "loss": 2.5022, "step": 24036 }, { "epoch": 0.65, "learning_rate": 0.0005884610499247595, "loss": 2.7656, "step": 24037 }, { "epoch": 0.65, "learning_rate": 0.0005883817246439669, "loss": 2.4354, "step": 24038 }, { "epoch": 0.65, "learning_rate": 0.0005883024024815214, "loss": 2.5452, "step": 24039 }, { "epoch": 0.65, "learning_rate": 0.0005882230834380227, "loss": 2.2728, "step": 24040 }, { "epoch": 0.65, "learning_rate": 0.0005881437675140725, "loss": 2.342, "step": 24041 }, { "epoch": 0.65, "learning_rate": 0.0005880644547102716, "loss": 2.3374, "step": 24042 }, { "epoch": 0.65, "learning_rate": 0.0005879851450272206, "loss": 2.5139, "step": 24043 }, { "epoch": 0.65, "learning_rate": 0.0005879058384655206, "loss": 2.4559, "step": 24044 }, { "epoch": 0.65, "learning_rate": 0.0005878265350257721, "loss": 2.6019, "step": 24045 }, { "epoch": 0.65, "learning_rate": 0.0005877472347085762, "loss": 2.5944, "step": 24046 }, { "epoch": 0.65, "learning_rate": 0.0005876679375145336, "loss": 2.5335, "step": 24047 }, { "epoch": 0.65, "learning_rate": 0.0005875886434442449, "loss": 2.5012, "step": 24048 }, { "epoch": 0.65, "learning_rate": 0.0005875093524983109, "loss": 2.7368, "step": 24049 }, { "epoch": 0.65, "learning_rate": 0.0005874300646773326, "loss": 2.6602, "step": 24050 }, { "epoch": 0.65, "learning_rate": 0.0005873507799819097, "loss": 2.4795, "step": 24051 }, { "epoch": 0.65, "learning_rate": 0.0005872714984126444, "loss": 2.086, "step": 24052 }, { "epoch": 0.65, "learning_rate": 0.0005871922199701358, "loss": 2.4113, "step": 24053 }, { "epoch": 0.65, "learning_rate": 0.0005871129446549852, "loss": 2.2457, "step": 24054 }, { "epoch": 0.65, "learning_rate": 0.0005870336724677934, "loss": 2.0803, "step": 24055 }, { "epoch": 0.65, "learning_rate": 0.0005869544034091606, "loss": 2.655, "step": 24056 }, { "epoch": 0.65, "learning_rate": 0.000586875137479687, "loss": 2.6863, "step": 24057 }, { "epoch": 0.65, "learning_rate": 0.0005867958746799739, "loss": 2.2629, "step": 24058 }, { "epoch": 0.65, "learning_rate": 0.0005867166150106211, "loss": 2.4949, "step": 24059 }, { "epoch": 0.65, "learning_rate": 0.0005866373584722298, "loss": 2.4127, "step": 24060 }, { "epoch": 0.65, "learning_rate": 0.0005865581050653995, "loss": 2.5235, "step": 24061 }, { "epoch": 0.65, "learning_rate": 0.0005864788547907311, "loss": 2.2348, "step": 24062 }, { "epoch": 0.65, "learning_rate": 0.0005863996076488254, "loss": 2.4312, "step": 24063 }, { "epoch": 0.65, "learning_rate": 0.0005863203636402818, "loss": 2.3863, "step": 24064 }, { "epoch": 0.65, "learning_rate": 0.0005862411227657014, "loss": 2.1936, "step": 24065 }, { "epoch": 0.65, "learning_rate": 0.0005861618850256844, "loss": 2.3234, "step": 24066 }, { "epoch": 0.65, "learning_rate": 0.0005860826504208309, "loss": 2.4014, "step": 24067 }, { "epoch": 0.65, "learning_rate": 0.0005860034189517413, "loss": 2.6956, "step": 24068 }, { "epoch": 0.65, "learning_rate": 0.0005859241906190156, "loss": 2.5756, "step": 24069 }, { "epoch": 0.65, "learning_rate": 0.0005858449654232542, "loss": 2.4108, "step": 24070 }, { "epoch": 0.65, "learning_rate": 0.0005857657433650575, "loss": 2.2212, "step": 24071 }, { "epoch": 0.65, "learning_rate": 0.0005856865244450253, "loss": 2.8346, "step": 24072 }, { "epoch": 0.65, "learning_rate": 0.0005856073086637579, "loss": 2.4437, "step": 24073 }, { "epoch": 0.65, "learning_rate": 0.0005855280960218556, "loss": 2.6415, "step": 24074 }, { "epoch": 0.65, "learning_rate": 0.0005854488865199182, "loss": 2.7808, "step": 24075 }, { "epoch": 0.65, "learning_rate": 0.0005853696801585458, "loss": 2.6595, "step": 24076 }, { "epoch": 0.65, "learning_rate": 0.0005852904769383389, "loss": 2.9234, "step": 24077 }, { "epoch": 0.65, "learning_rate": 0.000585211276859897, "loss": 2.84, "step": 24078 }, { "epoch": 0.65, "learning_rate": 0.0005851320799238206, "loss": 1.9419, "step": 24079 }, { "epoch": 0.65, "learning_rate": 0.000585052886130709, "loss": 2.301, "step": 24080 }, { "epoch": 0.65, "learning_rate": 0.0005849736954811624, "loss": 2.242, "step": 24081 }, { "epoch": 0.65, "learning_rate": 0.0005848945079757816, "loss": 2.3986, "step": 24082 }, { "epoch": 0.65, "learning_rate": 0.0005848153236151653, "loss": 2.2293, "step": 24083 }, { "epoch": 0.65, "learning_rate": 0.0005847361423999138, "loss": 2.4173, "step": 24084 }, { "epoch": 0.65, "learning_rate": 0.0005846569643306274, "loss": 2.3588, "step": 24085 }, { "epoch": 0.65, "learning_rate": 0.0005845777894079053, "loss": 2.3525, "step": 24086 }, { "epoch": 0.65, "learning_rate": 0.0005844986176323477, "loss": 2.5773, "step": 24087 }, { "epoch": 0.65, "learning_rate": 0.0005844194490045542, "loss": 2.6023, "step": 24088 }, { "epoch": 0.65, "learning_rate": 0.0005843402835251247, "loss": 2.0439, "step": 24089 }, { "epoch": 0.65, "learning_rate": 0.000584261121194659, "loss": 2.2857, "step": 24090 }, { "epoch": 0.65, "learning_rate": 0.0005841819620137565, "loss": 2.3609, "step": 24091 }, { "epoch": 0.65, "learning_rate": 0.0005841028059830173, "loss": 2.6869, "step": 24092 }, { "epoch": 0.65, "learning_rate": 0.0005840236531030412, "loss": 2.7871, "step": 24093 }, { "epoch": 0.65, "learning_rate": 0.0005839445033744269, "loss": 2.7524, "step": 24094 }, { "epoch": 0.65, "learning_rate": 0.0005838653567977752, "loss": 2.4872, "step": 24095 }, { "epoch": 0.65, "learning_rate": 0.0005837862133736848, "loss": 2.2214, "step": 24096 }, { "epoch": 0.65, "learning_rate": 0.0005837070731027557, "loss": 2.7853, "step": 24097 }, { "epoch": 0.65, "learning_rate": 0.0005836279359855872, "loss": 2.2728, "step": 24098 }, { "epoch": 0.65, "learning_rate": 0.0005835488020227793, "loss": 2.4086, "step": 24099 }, { "epoch": 0.65, "learning_rate": 0.000583469671214931, "loss": 2.0969, "step": 24100 }, { "epoch": 0.65, "learning_rate": 0.0005833905435626424, "loss": 2.8264, "step": 24101 }, { "epoch": 0.65, "learning_rate": 0.0005833114190665123, "loss": 2.4449, "step": 24102 }, { "epoch": 0.65, "learning_rate": 0.0005832322977271407, "loss": 2.4247, "step": 24103 }, { "epoch": 0.65, "learning_rate": 0.0005831531795451264, "loss": 2.3909, "step": 24104 }, { "epoch": 0.65, "learning_rate": 0.0005830740645210689, "loss": 2.3283, "step": 24105 }, { "epoch": 0.65, "learning_rate": 0.0005829949526555679, "loss": 2.2739, "step": 24106 }, { "epoch": 0.65, "learning_rate": 0.0005829158439492226, "loss": 2.3018, "step": 24107 }, { "epoch": 0.65, "learning_rate": 0.0005828367384026322, "loss": 2.3887, "step": 24108 }, { "epoch": 0.65, "learning_rate": 0.0005827576360163965, "loss": 2.138, "step": 24109 }, { "epoch": 0.65, "learning_rate": 0.000582678536791114, "loss": 2.2605, "step": 24110 }, { "epoch": 0.65, "learning_rate": 0.0005825994407273842, "loss": 2.8864, "step": 24111 }, { "epoch": 0.65, "learning_rate": 0.0005825203478258066, "loss": 2.1368, "step": 24112 }, { "epoch": 0.65, "learning_rate": 0.00058244125808698, "loss": 2.485, "step": 24113 }, { "epoch": 0.65, "learning_rate": 0.0005823621715115044, "loss": 2.4509, "step": 24114 }, { "epoch": 0.65, "learning_rate": 0.0005822830880999777, "loss": 2.251, "step": 24115 }, { "epoch": 0.65, "learning_rate": 0.0005822040078529997, "loss": 2.2753, "step": 24116 }, { "epoch": 0.65, "learning_rate": 0.00058212493077117, "loss": 2.5528, "step": 24117 }, { "epoch": 0.65, "learning_rate": 0.0005820458568550866, "loss": 2.9293, "step": 24118 }, { "epoch": 0.65, "learning_rate": 0.0005819667861053486, "loss": 2.4318, "step": 24119 }, { "epoch": 0.65, "learning_rate": 0.0005818877185225563, "loss": 2.4422, "step": 24120 }, { "epoch": 0.65, "learning_rate": 0.0005818086541073076, "loss": 2.504, "step": 24121 }, { "epoch": 0.65, "learning_rate": 0.0005817295928602022, "loss": 2.1758, "step": 24122 }, { "epoch": 0.65, "learning_rate": 0.0005816505347818381, "loss": 2.4601, "step": 24123 }, { "epoch": 0.65, "learning_rate": 0.0005815714798728148, "loss": 2.6233, "step": 24124 }, { "epoch": 0.65, "learning_rate": 0.0005814924281337311, "loss": 2.3469, "step": 24125 }, { "epoch": 0.65, "learning_rate": 0.0005814133795651861, "loss": 2.4536, "step": 24126 }, { "epoch": 0.65, "learning_rate": 0.0005813343341677784, "loss": 2.5963, "step": 24127 }, { "epoch": 0.65, "learning_rate": 0.0005812552919421072, "loss": 2.6862, "step": 24128 }, { "epoch": 0.65, "learning_rate": 0.0005811762528887709, "loss": 2.9796, "step": 24129 }, { "epoch": 0.65, "learning_rate": 0.0005810972170083686, "loss": 2.4821, "step": 24130 }, { "epoch": 0.65, "learning_rate": 0.0005810181843014986, "loss": 2.2362, "step": 24131 }, { "epoch": 0.65, "learning_rate": 0.0005809391547687596, "loss": 2.3563, "step": 24132 }, { "epoch": 0.65, "learning_rate": 0.0005808601284107513, "loss": 2.253, "step": 24133 }, { "epoch": 0.65, "learning_rate": 0.0005807811052280715, "loss": 2.4402, "step": 24134 }, { "epoch": 0.65, "learning_rate": 0.0005807020852213189, "loss": 2.4058, "step": 24135 }, { "epoch": 0.65, "learning_rate": 0.0005806230683910929, "loss": 2.66, "step": 24136 }, { "epoch": 0.65, "learning_rate": 0.000580544054737991, "loss": 2.3342, "step": 24137 }, { "epoch": 0.65, "learning_rate": 0.0005804650442626125, "loss": 2.715, "step": 24138 }, { "epoch": 0.65, "learning_rate": 0.0005803860369655558, "loss": 2.5884, "step": 24139 }, { "epoch": 0.65, "learning_rate": 0.0005803070328474194, "loss": 2.9577, "step": 24140 }, { "epoch": 0.65, "learning_rate": 0.0005802280319088023, "loss": 2.5247, "step": 24141 }, { "epoch": 0.65, "learning_rate": 0.0005801490341503022, "loss": 2.7323, "step": 24142 }, { "epoch": 0.65, "learning_rate": 0.000580070039572518, "loss": 2.5843, "step": 24143 }, { "epoch": 0.65, "learning_rate": 0.0005799910481760484, "loss": 2.6195, "step": 24144 }, { "epoch": 0.65, "learning_rate": 0.0005799120599614909, "loss": 2.7923, "step": 24145 }, { "epoch": 0.65, "learning_rate": 0.0005798330749294451, "loss": 2.2421, "step": 24146 }, { "epoch": 0.65, "learning_rate": 0.0005797540930805085, "loss": 2.5068, "step": 24147 }, { "epoch": 0.65, "learning_rate": 0.0005796751144152799, "loss": 2.8951, "step": 24148 }, { "epoch": 0.65, "learning_rate": 0.0005795961389343577, "loss": 2.7784, "step": 24149 }, { "epoch": 0.65, "learning_rate": 0.0005795171666383396, "loss": 2.7808, "step": 24150 }, { "epoch": 0.65, "learning_rate": 0.0005794381975278243, "loss": 2.881, "step": 24151 }, { "epoch": 0.65, "learning_rate": 0.0005793592316034101, "loss": 2.6563, "step": 24152 }, { "epoch": 0.65, "learning_rate": 0.0005792802688656951, "loss": 2.3901, "step": 24153 }, { "epoch": 0.65, "learning_rate": 0.0005792013093152776, "loss": 2.684, "step": 24154 }, { "epoch": 0.65, "learning_rate": 0.0005791223529527561, "loss": 2.2991, "step": 24155 }, { "epoch": 0.65, "learning_rate": 0.0005790433997787281, "loss": 2.5063, "step": 24156 }, { "epoch": 0.65, "learning_rate": 0.0005789644497937922, "loss": 1.984, "step": 24157 }, { "epoch": 0.65, "learning_rate": 0.0005788855029985458, "loss": 2.2258, "step": 24158 }, { "epoch": 0.65, "learning_rate": 0.0005788065593935878, "loss": 2.2649, "step": 24159 }, { "epoch": 0.65, "learning_rate": 0.0005787276189795165, "loss": 2.3778, "step": 24160 }, { "epoch": 0.65, "learning_rate": 0.0005786486817569291, "loss": 3.0734, "step": 24161 }, { "epoch": 0.65, "learning_rate": 0.0005785697477264238, "loss": 2.4461, "step": 24162 }, { "epoch": 0.65, "learning_rate": 0.0005784908168885993, "loss": 2.3513, "step": 24163 }, { "epoch": 0.65, "learning_rate": 0.0005784118892440524, "loss": 2.5931, "step": 24164 }, { "epoch": 0.65, "learning_rate": 0.0005783329647933819, "loss": 2.315, "step": 24165 }, { "epoch": 0.65, "learning_rate": 0.0005782540435371853, "loss": 2.6788, "step": 24166 }, { "epoch": 0.65, "learning_rate": 0.0005781751254760607, "loss": 2.3684, "step": 24167 }, { "epoch": 0.65, "learning_rate": 0.0005780962106106065, "loss": 2.2653, "step": 24168 }, { "epoch": 0.65, "learning_rate": 0.0005780172989414193, "loss": 2.281, "step": 24169 }, { "epoch": 0.65, "learning_rate": 0.0005779383904690978, "loss": 2.4151, "step": 24170 }, { "epoch": 0.65, "learning_rate": 0.0005778594851942395, "loss": 2.3914, "step": 24171 }, { "epoch": 0.65, "learning_rate": 0.0005777805831174423, "loss": 2.7063, "step": 24172 }, { "epoch": 0.65, "learning_rate": 0.0005777016842393043, "loss": 2.0812, "step": 24173 }, { "epoch": 0.65, "learning_rate": 0.0005776227885604224, "loss": 2.2721, "step": 24174 }, { "epoch": 0.65, "learning_rate": 0.0005775438960813948, "loss": 2.3085, "step": 24175 }, { "epoch": 0.65, "learning_rate": 0.0005774650068028196, "loss": 2.3916, "step": 24176 }, { "epoch": 0.65, "learning_rate": 0.0005773861207252935, "loss": 2.7171, "step": 24177 }, { "epoch": 0.65, "learning_rate": 0.0005773072378494141, "loss": 2.3972, "step": 24178 }, { "epoch": 0.65, "learning_rate": 0.0005772283581757803, "loss": 2.8931, "step": 24179 }, { "epoch": 0.65, "learning_rate": 0.0005771494817049886, "loss": 2.8114, "step": 24180 }, { "epoch": 0.65, "learning_rate": 0.0005770706084376371, "loss": 2.3944, "step": 24181 }, { "epoch": 0.65, "learning_rate": 0.0005769917383743228, "loss": 2.7341, "step": 24182 }, { "epoch": 0.65, "learning_rate": 0.0005769128715156434, "loss": 2.65, "step": 24183 }, { "epoch": 0.65, "learning_rate": 0.0005768340078621964, "loss": 2.9559, "step": 24184 }, { "epoch": 0.65, "learning_rate": 0.0005767551474145793, "loss": 2.3949, "step": 24185 }, { "epoch": 0.65, "learning_rate": 0.0005766762901733895, "loss": 2.505, "step": 24186 }, { "epoch": 0.65, "learning_rate": 0.000576597436139225, "loss": 2.2615, "step": 24187 }, { "epoch": 0.65, "learning_rate": 0.0005765185853126822, "loss": 2.6974, "step": 24188 }, { "epoch": 0.65, "learning_rate": 0.0005764397376943587, "loss": 2.2595, "step": 24189 }, { "epoch": 0.65, "learning_rate": 0.0005763608932848525, "loss": 2.6096, "step": 24190 }, { "epoch": 0.65, "learning_rate": 0.0005762820520847598, "loss": 2.2062, "step": 24191 }, { "epoch": 0.65, "learning_rate": 0.0005762032140946791, "loss": 2.5109, "step": 24192 }, { "epoch": 0.65, "learning_rate": 0.0005761243793152069, "loss": 2.2744, "step": 24193 }, { "epoch": 0.65, "learning_rate": 0.0005760455477469404, "loss": 2.5126, "step": 24194 }, { "epoch": 0.65, "learning_rate": 0.0005759667193904777, "loss": 2.6115, "step": 24195 }, { "epoch": 0.65, "learning_rate": 0.0005758878942464146, "loss": 2.4025, "step": 24196 }, { "epoch": 0.65, "learning_rate": 0.0005758090723153492, "loss": 2.5962, "step": 24197 }, { "epoch": 0.65, "learning_rate": 0.0005757302535978784, "loss": 2.5263, "step": 24198 }, { "epoch": 0.65, "learning_rate": 0.0005756514380945993, "loss": 2.0193, "step": 24199 }, { "epoch": 0.65, "learning_rate": 0.0005755726258061095, "loss": 2.6943, "step": 24200 }, { "epoch": 0.65, "learning_rate": 0.0005754938167330051, "loss": 2.8151, "step": 24201 }, { "epoch": 0.65, "learning_rate": 0.0005754150108758838, "loss": 2.5379, "step": 24202 }, { "epoch": 0.65, "learning_rate": 0.0005753362082353427, "loss": 2.6505, "step": 24203 }, { "epoch": 0.65, "learning_rate": 0.0005752574088119779, "loss": 2.7228, "step": 24204 }, { "epoch": 0.65, "learning_rate": 0.0005751786126063874, "loss": 2.2484, "step": 24205 }, { "epoch": 0.65, "learning_rate": 0.0005750998196191681, "loss": 2.9633, "step": 24206 }, { "epoch": 0.65, "learning_rate": 0.0005750210298509162, "loss": 2.2731, "step": 24207 }, { "epoch": 0.65, "learning_rate": 0.0005749422433022295, "loss": 2.3007, "step": 24208 }, { "epoch": 0.65, "learning_rate": 0.0005748634599737039, "loss": 2.9515, "step": 24209 }, { "epoch": 0.65, "learning_rate": 0.0005747846798659368, "loss": 2.2742, "step": 24210 }, { "epoch": 0.65, "learning_rate": 0.0005747059029795249, "loss": 2.4074, "step": 24211 }, { "epoch": 0.65, "learning_rate": 0.0005746271293150651, "loss": 2.6049, "step": 24212 }, { "epoch": 0.65, "learning_rate": 0.0005745483588731541, "loss": 2.5325, "step": 24213 }, { "epoch": 0.65, "learning_rate": 0.000574469591654389, "loss": 2.2806, "step": 24214 }, { "epoch": 0.65, "learning_rate": 0.0005743908276593658, "loss": 2.4313, "step": 24215 }, { "epoch": 0.65, "learning_rate": 0.0005743120668886821, "loss": 2.4501, "step": 24216 }, { "epoch": 0.65, "learning_rate": 0.000574233309342933, "loss": 2.0421, "step": 24217 }, { "epoch": 0.65, "learning_rate": 0.0005741545550227169, "loss": 2.2623, "step": 24218 }, { "epoch": 0.65, "learning_rate": 0.0005740758039286301, "loss": 2.624, "step": 24219 }, { "epoch": 0.65, "learning_rate": 0.0005739970560612685, "loss": 2.5722, "step": 24220 }, { "epoch": 0.65, "learning_rate": 0.000573918311421229, "loss": 2.58, "step": 24221 }, { "epoch": 0.65, "learning_rate": 0.0005738395700091086, "loss": 2.4897, "step": 24222 }, { "epoch": 0.65, "learning_rate": 0.000573760831825503, "loss": 2.939, "step": 24223 }, { "epoch": 0.65, "learning_rate": 0.0005736820968710091, "loss": 2.5464, "step": 24224 }, { "epoch": 0.65, "learning_rate": 0.0005736033651462235, "loss": 2.6507, "step": 24225 }, { "epoch": 0.65, "learning_rate": 0.0005735246366517425, "loss": 2.4293, "step": 24226 }, { "epoch": 0.65, "learning_rate": 0.0005734459113881631, "loss": 2.4776, "step": 24227 }, { "epoch": 0.65, "learning_rate": 0.0005733671893560807, "loss": 2.6346, "step": 24228 }, { "epoch": 0.65, "learning_rate": 0.0005732884705560923, "loss": 2.8255, "step": 24229 }, { "epoch": 0.65, "learning_rate": 0.000573209754988794, "loss": 2.5639, "step": 24230 }, { "epoch": 0.65, "learning_rate": 0.0005731310426547824, "loss": 2.6753, "step": 24231 }, { "epoch": 0.65, "learning_rate": 0.0005730523335546538, "loss": 2.7501, "step": 24232 }, { "epoch": 0.65, "learning_rate": 0.0005729736276890048, "loss": 2.3296, "step": 24233 }, { "epoch": 0.65, "learning_rate": 0.0005728949250584306, "loss": 2.2208, "step": 24234 }, { "epoch": 0.65, "learning_rate": 0.0005728162256635286, "loss": 2.6105, "step": 24235 }, { "epoch": 0.65, "learning_rate": 0.0005727375295048942, "loss": 2.6659, "step": 24236 }, { "epoch": 0.65, "learning_rate": 0.0005726588365831238, "loss": 2.5658, "step": 24237 }, { "epoch": 0.65, "learning_rate": 0.0005725801468988137, "loss": 2.3711, "step": 24238 }, { "epoch": 0.65, "learning_rate": 0.00057250146045256, "loss": 2.2587, "step": 24239 }, { "epoch": 0.65, "learning_rate": 0.0005724227772449589, "loss": 2.3055, "step": 24240 }, { "epoch": 0.65, "learning_rate": 0.0005723440972766065, "loss": 2.185, "step": 24241 }, { "epoch": 0.65, "learning_rate": 0.0005722654205480986, "loss": 2.4663, "step": 24242 }, { "epoch": 0.65, "learning_rate": 0.0005721867470600313, "loss": 2.4617, "step": 24243 }, { "epoch": 0.65, "learning_rate": 0.0005721080768130007, "loss": 2.0016, "step": 24244 }, { "epoch": 0.65, "learning_rate": 0.0005720294098076028, "loss": 2.4812, "step": 24245 }, { "epoch": 0.65, "learning_rate": 0.0005719507460444342, "loss": 3.0231, "step": 24246 }, { "epoch": 0.65, "learning_rate": 0.0005718720855240896, "loss": 2.4648, "step": 24247 }, { "epoch": 0.65, "learning_rate": 0.0005717934282471657, "loss": 2.4096, "step": 24248 }, { "epoch": 0.65, "learning_rate": 0.0005717147742142585, "loss": 2.3951, "step": 24249 }, { "epoch": 0.65, "learning_rate": 0.0005716361234259633, "loss": 2.4289, "step": 24250 }, { "epoch": 0.65, "learning_rate": 0.0005715574758828761, "loss": 2.6103, "step": 24251 }, { "epoch": 0.65, "learning_rate": 0.000571478831585593, "loss": 2.9363, "step": 24252 }, { "epoch": 0.65, "learning_rate": 0.0005714001905347094, "loss": 2.9213, "step": 24253 }, { "epoch": 0.65, "learning_rate": 0.0005713215527308221, "loss": 2.6962, "step": 24254 }, { "epoch": 0.65, "learning_rate": 0.0005712429181745256, "loss": 2.5101, "step": 24255 }, { "epoch": 0.65, "learning_rate": 0.000571164286866416, "loss": 2.5837, "step": 24256 }, { "epoch": 0.65, "learning_rate": 0.000571085658807089, "loss": 2.697, "step": 24257 }, { "epoch": 0.65, "learning_rate": 0.0005710070339971405, "loss": 2.4429, "step": 24258 }, { "epoch": 0.65, "learning_rate": 0.0005709284124371663, "loss": 2.3571, "step": 24259 }, { "epoch": 0.65, "learning_rate": 0.0005708497941277615, "loss": 2.6973, "step": 24260 }, { "epoch": 0.65, "learning_rate": 0.0005707711790695218, "loss": 2.5504, "step": 24261 }, { "epoch": 0.65, "learning_rate": 0.0005706925672630434, "loss": 3.0285, "step": 24262 }, { "epoch": 0.65, "learning_rate": 0.0005706139587089209, "loss": 2.5188, "step": 24263 }, { "epoch": 0.65, "learning_rate": 0.0005705353534077498, "loss": 2.2614, "step": 24264 }, { "epoch": 0.65, "learning_rate": 0.0005704567513601271, "loss": 2.7659, "step": 24265 }, { "epoch": 0.65, "learning_rate": 0.0005703781525666467, "loss": 2.4435, "step": 24266 }, { "epoch": 0.65, "learning_rate": 0.0005702995570279046, "loss": 2.5157, "step": 24267 }, { "epoch": 0.65, "learning_rate": 0.0005702209647444967, "loss": 2.7622, "step": 24268 }, { "epoch": 0.65, "learning_rate": 0.0005701423757170175, "loss": 2.275, "step": 24269 }, { "epoch": 0.65, "learning_rate": 0.0005700637899460628, "loss": 2.5258, "step": 24270 }, { "epoch": 0.65, "learning_rate": 0.000569985207432228, "loss": 1.8591, "step": 24271 }, { "epoch": 0.65, "learning_rate": 0.0005699066281761084, "loss": 2.1528, "step": 24272 }, { "epoch": 0.65, "learning_rate": 0.0005698280521782997, "loss": 2.5511, "step": 24273 }, { "epoch": 0.65, "learning_rate": 0.0005697494794393962, "loss": 3.4242, "step": 24274 }, { "epoch": 0.65, "learning_rate": 0.000569670909959994, "loss": 2.7073, "step": 24275 }, { "epoch": 0.65, "learning_rate": 0.0005695923437406882, "loss": 2.4056, "step": 24276 }, { "epoch": 0.65, "learning_rate": 0.0005695137807820731, "loss": 2.625, "step": 24277 }, { "epoch": 0.65, "learning_rate": 0.0005694352210847455, "loss": 2.7771, "step": 24278 }, { "epoch": 0.65, "learning_rate": 0.0005693566646492994, "loss": 2.3573, "step": 24279 }, { "epoch": 0.65, "learning_rate": 0.0005692781114763301, "loss": 2.5352, "step": 24280 }, { "epoch": 0.65, "learning_rate": 0.0005691995615664332, "loss": 2.0307, "step": 24281 }, { "epoch": 0.65, "learning_rate": 0.0005691210149202031, "loss": 2.4174, "step": 24282 }, { "epoch": 0.65, "learning_rate": 0.000569042471538235, "loss": 2.5097, "step": 24283 }, { "epoch": 0.65, "learning_rate": 0.0005689639314211242, "loss": 2.7685, "step": 24284 }, { "epoch": 0.65, "learning_rate": 0.0005688853945694655, "loss": 2.7061, "step": 24285 }, { "epoch": 0.65, "learning_rate": 0.0005688068609838545, "loss": 2.3697, "step": 24286 }, { "epoch": 0.65, "learning_rate": 0.0005687283306648851, "loss": 2.5404, "step": 24287 }, { "epoch": 0.65, "learning_rate": 0.0005686498036131529, "loss": 2.2944, "step": 24288 }, { "epoch": 0.65, "learning_rate": 0.0005685712798292529, "loss": 2.7296, "step": 24289 }, { "epoch": 0.65, "learning_rate": 0.000568492759313779, "loss": 2.6766, "step": 24290 }, { "epoch": 0.65, "learning_rate": 0.0005684142420673273, "loss": 2.8338, "step": 24291 }, { "epoch": 0.65, "learning_rate": 0.0005683357280904926, "loss": 2.4836, "step": 24292 }, { "epoch": 0.65, "learning_rate": 0.0005682572173838687, "loss": 2.3135, "step": 24293 }, { "epoch": 0.65, "learning_rate": 0.0005681787099480513, "loss": 2.3936, "step": 24294 }, { "epoch": 0.65, "learning_rate": 0.0005681002057836345, "loss": 2.5092, "step": 24295 }, { "epoch": 0.65, "learning_rate": 0.0005680217048912133, "loss": 2.4515, "step": 24296 }, { "epoch": 0.65, "learning_rate": 0.0005679432072713825, "loss": 2.1724, "step": 24297 }, { "epoch": 0.65, "learning_rate": 0.0005678647129247367, "loss": 2.4392, "step": 24298 }, { "epoch": 0.65, "learning_rate": 0.0005677862218518705, "loss": 1.8743, "step": 24299 }, { "epoch": 0.65, "learning_rate": 0.0005677077340533789, "loss": 2.552, "step": 24300 }, { "epoch": 0.65, "learning_rate": 0.000567629249529856, "loss": 2.369, "step": 24301 }, { "epoch": 0.65, "learning_rate": 0.0005675507682818965, "loss": 2.3288, "step": 24302 }, { "epoch": 0.65, "learning_rate": 0.0005674722903100953, "loss": 2.2207, "step": 24303 }, { "epoch": 0.65, "learning_rate": 0.0005673938156150464, "loss": 2.4512, "step": 24304 }, { "epoch": 0.65, "learning_rate": 0.0005673153441973451, "loss": 2.7388, "step": 24305 }, { "epoch": 0.65, "learning_rate": 0.0005672368760575851, "loss": 2.702, "step": 24306 }, { "epoch": 0.65, "learning_rate": 0.000567158411196361, "loss": 2.3629, "step": 24307 }, { "epoch": 0.65, "learning_rate": 0.000567079949614268, "loss": 2.5312, "step": 24308 }, { "epoch": 0.65, "learning_rate": 0.0005670014913118994, "loss": 2.4611, "step": 24309 }, { "epoch": 0.65, "learning_rate": 0.0005669230362898501, "loss": 2.6537, "step": 24310 }, { "epoch": 0.65, "learning_rate": 0.0005668445845487144, "loss": 2.3259, "step": 24311 }, { "epoch": 0.65, "learning_rate": 0.0005667661360890866, "loss": 2.5384, "step": 24312 }, { "epoch": 0.65, "learning_rate": 0.0005666876909115616, "loss": 2.77, "step": 24313 }, { "epoch": 0.65, "learning_rate": 0.0005666092490167328, "loss": 2.643, "step": 24314 }, { "epoch": 0.65, "learning_rate": 0.000566530810405195, "loss": 2.1489, "step": 24315 }, { "epoch": 0.65, "learning_rate": 0.000566452375077542, "loss": 2.7633, "step": 24316 }, { "epoch": 0.65, "learning_rate": 0.0005663739430343684, "loss": 2.417, "step": 24317 }, { "epoch": 0.65, "learning_rate": 0.0005662955142762682, "loss": 2.7919, "step": 24318 }, { "epoch": 0.65, "learning_rate": 0.0005662170888038363, "loss": 2.3473, "step": 24319 }, { "epoch": 0.65, "learning_rate": 0.0005661386666176656, "loss": 2.2368, "step": 24320 }, { "epoch": 0.65, "learning_rate": 0.0005660602477183512, "loss": 2.7229, "step": 24321 }, { "epoch": 0.65, "learning_rate": 0.0005659818321064865, "loss": 2.7453, "step": 24322 }, { "epoch": 0.65, "learning_rate": 0.0005659034197826655, "loss": 2.6991, "step": 24323 }, { "epoch": 0.65, "learning_rate": 0.0005658250107474829, "loss": 2.6489, "step": 24324 }, { "epoch": 0.65, "learning_rate": 0.0005657466050015323, "loss": 2.6231, "step": 24325 }, { "epoch": 0.65, "learning_rate": 0.0005656682025454078, "loss": 2.2994, "step": 24326 }, { "epoch": 0.65, "learning_rate": 0.0005655898033797038, "loss": 2.8903, "step": 24327 }, { "epoch": 0.65, "learning_rate": 0.0005655114075050134, "loss": 2.3876, "step": 24328 }, { "epoch": 0.65, "learning_rate": 0.0005654330149219309, "loss": 2.4222, "step": 24329 }, { "epoch": 0.65, "learning_rate": 0.00056535462563105, "loss": 2.4577, "step": 24330 }, { "epoch": 0.65, "learning_rate": 0.0005652762396329649, "loss": 2.425, "step": 24331 }, { "epoch": 0.65, "learning_rate": 0.0005651978569282696, "loss": 2.7847, "step": 24332 }, { "epoch": 0.65, "learning_rate": 0.0005651194775175573, "loss": 2.4234, "step": 24333 }, { "epoch": 0.65, "learning_rate": 0.000565041101401422, "loss": 1.9597, "step": 24334 }, { "epoch": 0.65, "learning_rate": 0.000564962728580458, "loss": 2.4154, "step": 24335 }, { "epoch": 0.65, "learning_rate": 0.0005648843590552583, "loss": 2.6976, "step": 24336 }, { "epoch": 0.65, "learning_rate": 0.0005648059928264163, "loss": 2.5788, "step": 24337 }, { "epoch": 0.65, "learning_rate": 0.0005647276298945272, "loss": 2.3739, "step": 24338 }, { "epoch": 0.65, "learning_rate": 0.0005646492702601833, "loss": 2.8002, "step": 24339 }, { "epoch": 0.65, "learning_rate": 0.0005645709139239792, "loss": 2.4552, "step": 24340 }, { "epoch": 0.65, "learning_rate": 0.0005644925608865075, "loss": 2.1928, "step": 24341 }, { "epoch": 0.65, "learning_rate": 0.0005644142111483623, "loss": 2.6565, "step": 24342 }, { "epoch": 0.65, "learning_rate": 0.0005643358647101373, "loss": 2.6524, "step": 24343 }, { "epoch": 0.65, "learning_rate": 0.0005642575215724258, "loss": 2.2932, "step": 24344 }, { "epoch": 0.65, "learning_rate": 0.0005641791817358215, "loss": 2.6845, "step": 24345 }, { "epoch": 0.65, "learning_rate": 0.0005641008452009179, "loss": 2.6845, "step": 24346 }, { "epoch": 0.65, "learning_rate": 0.0005640225119683083, "loss": 2.6279, "step": 24347 }, { "epoch": 0.65, "learning_rate": 0.0005639441820385864, "loss": 2.9878, "step": 24348 }, { "epoch": 0.65, "learning_rate": 0.0005638658554123448, "loss": 2.0949, "step": 24349 }, { "epoch": 0.65, "learning_rate": 0.0005637875320901777, "loss": 2.2254, "step": 24350 }, { "epoch": 0.65, "learning_rate": 0.0005637092120726789, "loss": 2.5069, "step": 24351 }, { "epoch": 0.65, "learning_rate": 0.0005636308953604406, "loss": 2.3105, "step": 24352 }, { "epoch": 0.65, "learning_rate": 0.0005635525819540566, "loss": 2.3519, "step": 24353 }, { "epoch": 0.65, "learning_rate": 0.0005634742718541206, "loss": 2.5059, "step": 24354 }, { "epoch": 0.65, "learning_rate": 0.000563395965061225, "loss": 2.704, "step": 24355 }, { "epoch": 0.65, "learning_rate": 0.0005633176615759636, "loss": 2.3978, "step": 24356 }, { "epoch": 0.65, "learning_rate": 0.0005632393613989298, "loss": 2.0552, "step": 24357 }, { "epoch": 0.65, "learning_rate": 0.0005631610645307161, "loss": 2.8649, "step": 24358 }, { "epoch": 0.65, "learning_rate": 0.0005630827709719166, "loss": 2.5355, "step": 24359 }, { "epoch": 0.65, "learning_rate": 0.0005630044807231236, "loss": 2.7065, "step": 24360 }, { "epoch": 0.65, "learning_rate": 0.0005629261937849304, "loss": 2.404, "step": 24361 }, { "epoch": 0.65, "learning_rate": 0.0005628479101579303, "loss": 2.4771, "step": 24362 }, { "epoch": 0.65, "learning_rate": 0.0005627696298427162, "loss": 2.4159, "step": 24363 }, { "epoch": 0.65, "learning_rate": 0.0005626913528398816, "loss": 2.9031, "step": 24364 }, { "epoch": 0.65, "learning_rate": 0.0005626130791500188, "loss": 2.4597, "step": 24365 }, { "epoch": 0.65, "learning_rate": 0.0005625348087737212, "loss": 2.5621, "step": 24366 }, { "epoch": 0.65, "learning_rate": 0.0005624565417115819, "loss": 2.4946, "step": 24367 }, { "epoch": 0.65, "learning_rate": 0.0005623782779641933, "loss": 2.2732, "step": 24368 }, { "epoch": 0.65, "learning_rate": 0.0005623000175321486, "loss": 2.7746, "step": 24369 }, { "epoch": 0.65, "learning_rate": 0.0005622217604160408, "loss": 2.3566, "step": 24370 }, { "epoch": 0.65, "learning_rate": 0.0005621435066164626, "loss": 2.7441, "step": 24371 }, { "epoch": 0.65, "learning_rate": 0.0005620652561340074, "loss": 2.3047, "step": 24372 }, { "epoch": 0.65, "learning_rate": 0.0005619870089692671, "loss": 2.4012, "step": 24373 }, { "epoch": 0.66, "learning_rate": 0.0005619087651228347, "loss": 2.5205, "step": 24374 }, { "epoch": 0.66, "learning_rate": 0.0005618305245953033, "loss": 2.857, "step": 24375 }, { "epoch": 0.66, "learning_rate": 0.0005617522873872656, "loss": 2.4701, "step": 24376 }, { "epoch": 0.66, "learning_rate": 0.0005616740534993142, "loss": 2.3709, "step": 24377 }, { "epoch": 0.66, "learning_rate": 0.0005615958229320422, "loss": 2.4166, "step": 24378 }, { "epoch": 0.66, "learning_rate": 0.0005615175956860414, "loss": 2.0267, "step": 24379 }, { "epoch": 0.66, "learning_rate": 0.0005614393717619048, "loss": 2.7864, "step": 24380 }, { "epoch": 0.66, "learning_rate": 0.0005613611511602257, "loss": 2.3752, "step": 24381 }, { "epoch": 0.66, "learning_rate": 0.0005612829338815957, "loss": 2.3589, "step": 24382 }, { "epoch": 0.66, "learning_rate": 0.0005612047199266077, "loss": 2.5084, "step": 24383 }, { "epoch": 0.66, "learning_rate": 0.0005611265092958543, "loss": 2.6969, "step": 24384 }, { "epoch": 0.66, "learning_rate": 0.0005610483019899279, "loss": 2.6856, "step": 24385 }, { "epoch": 0.66, "learning_rate": 0.0005609700980094217, "loss": 2.4936, "step": 24386 }, { "epoch": 0.66, "learning_rate": 0.0005608918973549271, "loss": 2.5603, "step": 24387 }, { "epoch": 0.66, "learning_rate": 0.0005608137000270368, "loss": 2.2071, "step": 24388 }, { "epoch": 0.66, "learning_rate": 0.0005607355060263435, "loss": 2.6929, "step": 24389 }, { "epoch": 0.66, "learning_rate": 0.0005606573153534395, "loss": 2.4176, "step": 24390 }, { "epoch": 0.66, "learning_rate": 0.0005605791280089174, "loss": 2.4792, "step": 24391 }, { "epoch": 0.66, "learning_rate": 0.0005605009439933691, "loss": 2.771, "step": 24392 }, { "epoch": 0.66, "learning_rate": 0.0005604227633073868, "loss": 2.5764, "step": 24393 }, { "epoch": 0.66, "learning_rate": 0.0005603445859515637, "loss": 2.6398, "step": 24394 }, { "epoch": 0.66, "learning_rate": 0.0005602664119264909, "loss": 2.407, "step": 24395 }, { "epoch": 0.66, "learning_rate": 0.0005601882412327607, "loss": 2.3803, "step": 24396 }, { "epoch": 0.66, "learning_rate": 0.0005601100738709667, "loss": 2.768, "step": 24397 }, { "epoch": 0.66, "learning_rate": 0.0005600319098416997, "loss": 2.579, "step": 24398 }, { "epoch": 0.66, "learning_rate": 0.0005599537491455526, "loss": 2.5379, "step": 24399 }, { "epoch": 0.66, "learning_rate": 0.0005598755917831169, "loss": 2.0957, "step": 24400 }, { "epoch": 0.66, "learning_rate": 0.0005597974377549849, "loss": 2.4885, "step": 24401 }, { "epoch": 0.66, "learning_rate": 0.0005597192870617489, "loss": 2.3277, "step": 24402 }, { "epoch": 0.66, "learning_rate": 0.0005596411397040009, "loss": 2.7297, "step": 24403 }, { "epoch": 0.66, "learning_rate": 0.0005595629956823329, "loss": 2.7265, "step": 24404 }, { "epoch": 0.66, "learning_rate": 0.0005594848549973372, "loss": 2.369, "step": 24405 }, { "epoch": 0.66, "learning_rate": 0.0005594067176496051, "loss": 2.4932, "step": 24406 }, { "epoch": 0.66, "learning_rate": 0.0005593285836397295, "loss": 2.496, "step": 24407 }, { "epoch": 0.66, "learning_rate": 0.0005592504529683013, "loss": 2.6782, "step": 24408 }, { "epoch": 0.66, "learning_rate": 0.0005591723256359124, "loss": 2.6133, "step": 24409 }, { "epoch": 0.66, "learning_rate": 0.000559094201643156, "loss": 2.0634, "step": 24410 }, { "epoch": 0.66, "learning_rate": 0.0005590160809906226, "loss": 2.7532, "step": 24411 }, { "epoch": 0.66, "learning_rate": 0.0005589379636789046, "loss": 2.786, "step": 24412 }, { "epoch": 0.66, "learning_rate": 0.0005588598497085942, "loss": 2.5891, "step": 24413 }, { "epoch": 0.66, "learning_rate": 0.0005587817390802822, "loss": 3.08, "step": 24414 }, { "epoch": 0.66, "learning_rate": 0.0005587036317945608, "loss": 2.4042, "step": 24415 }, { "epoch": 0.66, "learning_rate": 0.0005586255278520221, "loss": 2.5296, "step": 24416 }, { "epoch": 0.66, "learning_rate": 0.0005585474272532571, "loss": 2.4717, "step": 24417 }, { "epoch": 0.66, "learning_rate": 0.0005584693299988586, "loss": 2.3187, "step": 24418 }, { "epoch": 0.66, "learning_rate": 0.0005583912360894169, "loss": 2.2058, "step": 24419 }, { "epoch": 0.66, "learning_rate": 0.0005583131455255244, "loss": 2.4979, "step": 24420 }, { "epoch": 0.66, "learning_rate": 0.0005582350583077728, "loss": 2.4763, "step": 24421 }, { "epoch": 0.66, "learning_rate": 0.0005581569744367526, "loss": 2.2992, "step": 24422 }, { "epoch": 0.66, "learning_rate": 0.0005580788939130567, "loss": 2.7512, "step": 24423 }, { "epoch": 0.66, "learning_rate": 0.0005580008167372765, "loss": 2.7428, "step": 24424 }, { "epoch": 0.66, "learning_rate": 0.0005579227429100026, "loss": 2.484, "step": 24425 }, { "epoch": 0.66, "learning_rate": 0.0005578446724318274, "loss": 2.7047, "step": 24426 }, { "epoch": 0.66, "learning_rate": 0.0005577666053033414, "loss": 2.4599, "step": 24427 }, { "epoch": 0.66, "learning_rate": 0.0005576885415251367, "loss": 2.5671, "step": 24428 }, { "epoch": 0.66, "learning_rate": 0.0005576104810978044, "loss": 2.9956, "step": 24429 }, { "epoch": 0.66, "learning_rate": 0.0005575324240219362, "loss": 2.282, "step": 24430 }, { "epoch": 0.66, "learning_rate": 0.000557454370298123, "loss": 2.2815, "step": 24431 }, { "epoch": 0.66, "learning_rate": 0.0005573763199269569, "loss": 2.675, "step": 24432 }, { "epoch": 0.66, "learning_rate": 0.0005572982729090284, "loss": 2.5909, "step": 24433 }, { "epoch": 0.66, "learning_rate": 0.0005572202292449291, "loss": 2.4188, "step": 24434 }, { "epoch": 0.66, "learning_rate": 0.0005571421889352497, "loss": 2.3953, "step": 24435 }, { "epoch": 0.66, "learning_rate": 0.0005570641519805821, "loss": 2.5775, "step": 24436 }, { "epoch": 0.66, "learning_rate": 0.0005569861183815178, "loss": 2.0679, "step": 24437 }, { "epoch": 0.66, "learning_rate": 0.000556908088138647, "loss": 2.5743, "step": 24438 }, { "epoch": 0.66, "learning_rate": 0.0005568300612525614, "loss": 2.1899, "step": 24439 }, { "epoch": 0.66, "learning_rate": 0.0005567520377238525, "loss": 2.6491, "step": 24440 }, { "epoch": 0.66, "learning_rate": 0.0005566740175531102, "loss": 2.4037, "step": 24441 }, { "epoch": 0.66, "learning_rate": 0.0005565960007409265, "loss": 2.3572, "step": 24442 }, { "epoch": 0.66, "learning_rate": 0.0005565179872878921, "loss": 2.5392, "step": 24443 }, { "epoch": 0.66, "learning_rate": 0.0005564399771945983, "loss": 2.1737, "step": 24444 }, { "epoch": 0.66, "learning_rate": 0.0005563619704616363, "loss": 2.7929, "step": 24445 }, { "epoch": 0.66, "learning_rate": 0.0005562839670895963, "loss": 2.9127, "step": 24446 }, { "epoch": 0.66, "learning_rate": 0.0005562059670790695, "loss": 2.1304, "step": 24447 }, { "epoch": 0.66, "learning_rate": 0.0005561279704306471, "loss": 3.065, "step": 24448 }, { "epoch": 0.66, "learning_rate": 0.0005560499771449197, "loss": 2.8211, "step": 24449 }, { "epoch": 0.66, "learning_rate": 0.0005559719872224784, "loss": 3.0067, "step": 24450 }, { "epoch": 0.66, "learning_rate": 0.0005558940006639144, "loss": 2.2972, "step": 24451 }, { "epoch": 0.66, "learning_rate": 0.0005558160174698176, "loss": 2.3918, "step": 24452 }, { "epoch": 0.66, "learning_rate": 0.0005557380376407797, "loss": 2.4048, "step": 24453 }, { "epoch": 0.66, "learning_rate": 0.0005556600611773904, "loss": 2.5092, "step": 24454 }, { "epoch": 0.66, "learning_rate": 0.0005555820880802411, "loss": 2.7801, "step": 24455 }, { "epoch": 0.66, "learning_rate": 0.0005555041183499225, "loss": 2.746, "step": 24456 }, { "epoch": 0.66, "learning_rate": 0.0005554261519870254, "loss": 2.3783, "step": 24457 }, { "epoch": 0.66, "learning_rate": 0.0005553481889921401, "loss": 2.3271, "step": 24458 }, { "epoch": 0.66, "learning_rate": 0.0005552702293658578, "loss": 2.4322, "step": 24459 }, { "epoch": 0.66, "learning_rate": 0.0005551922731087684, "loss": 2.3523, "step": 24460 }, { "epoch": 0.66, "learning_rate": 0.0005551143202214628, "loss": 2.4365, "step": 24461 }, { "epoch": 0.66, "learning_rate": 0.0005550363707045316, "loss": 2.5439, "step": 24462 }, { "epoch": 0.66, "learning_rate": 0.0005549584245585653, "loss": 2.3678, "step": 24463 }, { "epoch": 0.66, "learning_rate": 0.0005548804817841547, "loss": 2.1824, "step": 24464 }, { "epoch": 0.66, "learning_rate": 0.0005548025423818897, "loss": 2.2573, "step": 24465 }, { "epoch": 0.66, "learning_rate": 0.000554724606352361, "loss": 2.5948, "step": 24466 }, { "epoch": 0.66, "learning_rate": 0.0005546466736961595, "loss": 2.6797, "step": 24467 }, { "epoch": 0.66, "learning_rate": 0.0005545687444138747, "loss": 2.3296, "step": 24468 }, { "epoch": 0.66, "learning_rate": 0.0005544908185060975, "loss": 2.5902, "step": 24469 }, { "epoch": 0.66, "learning_rate": 0.0005544128959734183, "loss": 2.576, "step": 24470 }, { "epoch": 0.66, "learning_rate": 0.0005543349768164273, "loss": 2.9296, "step": 24471 }, { "epoch": 0.66, "learning_rate": 0.0005542570610357152, "loss": 2.3932, "step": 24472 }, { "epoch": 0.66, "learning_rate": 0.0005541791486318715, "loss": 2.2887, "step": 24473 }, { "epoch": 0.66, "learning_rate": 0.000554101239605487, "loss": 2.4368, "step": 24474 }, { "epoch": 0.66, "learning_rate": 0.0005540233339571517, "loss": 2.1445, "step": 24475 }, { "epoch": 0.66, "learning_rate": 0.0005539454316874557, "loss": 2.6509, "step": 24476 }, { "epoch": 0.66, "learning_rate": 0.00055386753279699, "loss": 2.7497, "step": 24477 }, { "epoch": 0.66, "learning_rate": 0.0005537896372863435, "loss": 2.8344, "step": 24478 }, { "epoch": 0.66, "learning_rate": 0.0005537117451561071, "loss": 1.9599, "step": 24479 }, { "epoch": 0.66, "learning_rate": 0.0005536338564068713, "loss": 2.3114, "step": 24480 }, { "epoch": 0.66, "learning_rate": 0.0005535559710392248, "loss": 2.4124, "step": 24481 }, { "epoch": 0.66, "learning_rate": 0.0005534780890537583, "loss": 2.7954, "step": 24482 }, { "epoch": 0.66, "learning_rate": 0.0005534002104510627, "loss": 2.9243, "step": 24483 }, { "epoch": 0.66, "learning_rate": 0.0005533223352317269, "loss": 3.0573, "step": 24484 }, { "epoch": 0.66, "learning_rate": 0.0005532444633963416, "loss": 2.3926, "step": 24485 }, { "epoch": 0.66, "learning_rate": 0.0005531665949454961, "loss": 2.6634, "step": 24486 }, { "epoch": 0.66, "learning_rate": 0.0005530887298797804, "loss": 2.1695, "step": 24487 }, { "epoch": 0.66, "learning_rate": 0.0005530108681997848, "loss": 2.5465, "step": 24488 }, { "epoch": 0.66, "learning_rate": 0.0005529330099060988, "loss": 2.2612, "step": 24489 }, { "epoch": 0.66, "learning_rate": 0.0005528551549993123, "loss": 2.0557, "step": 24490 }, { "epoch": 0.66, "learning_rate": 0.0005527773034800156, "loss": 2.0901, "step": 24491 }, { "epoch": 0.66, "learning_rate": 0.0005526994553487979, "loss": 2.2887, "step": 24492 }, { "epoch": 0.66, "learning_rate": 0.0005526216106062489, "loss": 2.534, "step": 24493 }, { "epoch": 0.66, "learning_rate": 0.0005525437692529592, "loss": 2.8509, "step": 24494 }, { "epoch": 0.66, "learning_rate": 0.0005524659312895171, "loss": 2.7705, "step": 24495 }, { "epoch": 0.66, "learning_rate": 0.0005523880967165138, "loss": 2.9122, "step": 24496 }, { "epoch": 0.66, "learning_rate": 0.0005523102655345379, "loss": 2.6759, "step": 24497 }, { "epoch": 0.66, "learning_rate": 0.0005522324377441794, "loss": 2.7305, "step": 24498 }, { "epoch": 0.66, "learning_rate": 0.0005521546133460283, "loss": 2.3869, "step": 24499 }, { "epoch": 0.66, "learning_rate": 0.0005520767923406733, "loss": 2.7871, "step": 24500 }, { "epoch": 0.66, "learning_rate": 0.0005519989747287045, "loss": 2.2077, "step": 24501 }, { "epoch": 0.66, "learning_rate": 0.0005519211605107114, "loss": 2.7466, "step": 24502 }, { "epoch": 0.66, "learning_rate": 0.0005518433496872835, "loss": 2.1294, "step": 24503 }, { "epoch": 0.66, "learning_rate": 0.0005517655422590105, "loss": 2.5862, "step": 24504 }, { "epoch": 0.66, "learning_rate": 0.0005516877382264813, "loss": 2.2056, "step": 24505 }, { "epoch": 0.66, "learning_rate": 0.0005516099375902858, "loss": 2.5031, "step": 24506 }, { "epoch": 0.66, "learning_rate": 0.0005515321403510134, "loss": 2.2565, "step": 24507 }, { "epoch": 0.66, "learning_rate": 0.0005514543465092528, "loss": 2.7544, "step": 24508 }, { "epoch": 0.66, "learning_rate": 0.0005513765560655941, "loss": 2.6881, "step": 24509 }, { "epoch": 0.66, "learning_rate": 0.0005512987690206268, "loss": 2.2785, "step": 24510 }, { "epoch": 0.66, "learning_rate": 0.0005512209853749395, "loss": 2.7949, "step": 24511 }, { "epoch": 0.66, "learning_rate": 0.000551143205129122, "loss": 2.6141, "step": 24512 }, { "epoch": 0.66, "learning_rate": 0.000551065428283763, "loss": 2.6993, "step": 24513 }, { "epoch": 0.66, "learning_rate": 0.0005509876548394522, "loss": 2.6346, "step": 24514 }, { "epoch": 0.66, "learning_rate": 0.0005509098847967785, "loss": 2.4451, "step": 24515 }, { "epoch": 0.66, "learning_rate": 0.0005508321181563313, "loss": 2.9208, "step": 24516 }, { "epoch": 0.66, "learning_rate": 0.0005507543549186997, "loss": 2.5907, "step": 24517 }, { "epoch": 0.66, "learning_rate": 0.000550676595084473, "loss": 2.8274, "step": 24518 }, { "epoch": 0.66, "learning_rate": 0.0005505988386542399, "loss": 2.2613, "step": 24519 }, { "epoch": 0.66, "learning_rate": 0.0005505210856285896, "loss": 2.3982, "step": 24520 }, { "epoch": 0.66, "learning_rate": 0.0005504433360081112, "loss": 2.9738, "step": 24521 }, { "epoch": 0.66, "learning_rate": 0.0005503655897933935, "loss": 2.1059, "step": 24522 }, { "epoch": 0.66, "learning_rate": 0.0005502878469850263, "loss": 2.6809, "step": 24523 }, { "epoch": 0.66, "learning_rate": 0.0005502101075835977, "loss": 2.1139, "step": 24524 }, { "epoch": 0.66, "learning_rate": 0.0005501323715896967, "loss": 2.6296, "step": 24525 }, { "epoch": 0.66, "learning_rate": 0.000550054639003913, "loss": 2.6926, "step": 24526 }, { "epoch": 0.66, "learning_rate": 0.0005499769098268343, "loss": 2.4879, "step": 24527 }, { "epoch": 0.66, "learning_rate": 0.0005498991840590498, "loss": 2.9677, "step": 24528 }, { "epoch": 0.66, "learning_rate": 0.0005498214617011494, "loss": 2.9057, "step": 24529 }, { "epoch": 0.66, "learning_rate": 0.0005497437427537206, "loss": 2.8545, "step": 24530 }, { "epoch": 0.66, "learning_rate": 0.0005496660272173532, "loss": 2.827, "step": 24531 }, { "epoch": 0.66, "learning_rate": 0.0005495883150926351, "loss": 2.7232, "step": 24532 }, { "epoch": 0.66, "learning_rate": 0.0005495106063801554, "loss": 2.4727, "step": 24533 }, { "epoch": 0.66, "learning_rate": 0.0005494329010805028, "loss": 2.4257, "step": 24534 }, { "epoch": 0.66, "learning_rate": 0.000549355199194266, "loss": 2.7287, "step": 24535 }, { "epoch": 0.66, "learning_rate": 0.0005492775007220336, "loss": 2.4987, "step": 24536 }, { "epoch": 0.66, "learning_rate": 0.0005491998056643947, "loss": 2.2988, "step": 24537 }, { "epoch": 0.66, "learning_rate": 0.000549122114021937, "loss": 2.6287, "step": 24538 }, { "epoch": 0.66, "learning_rate": 0.00054904442579525, "loss": 2.4896, "step": 24539 }, { "epoch": 0.66, "learning_rate": 0.0005489667409849215, "loss": 2.8905, "step": 24540 }, { "epoch": 0.66, "learning_rate": 0.0005488890595915399, "loss": 2.157, "step": 24541 }, { "epoch": 0.66, "learning_rate": 0.0005488113816156947, "loss": 2.774, "step": 24542 }, { "epoch": 0.66, "learning_rate": 0.0005487337070579736, "loss": 2.3519, "step": 24543 }, { "epoch": 0.66, "learning_rate": 0.0005486560359189654, "loss": 2.3748, "step": 24544 }, { "epoch": 0.66, "learning_rate": 0.0005485783681992587, "loss": 2.9987, "step": 24545 }, { "epoch": 0.66, "learning_rate": 0.000548500703899441, "loss": 2.4385, "step": 24546 }, { "epoch": 0.66, "learning_rate": 0.0005484230430201014, "loss": 2.6705, "step": 24547 }, { "epoch": 0.66, "learning_rate": 0.0005483453855618281, "loss": 2.5901, "step": 24548 }, { "epoch": 0.66, "learning_rate": 0.0005482677315252094, "loss": 2.5116, "step": 24549 }, { "epoch": 0.66, "learning_rate": 0.0005481900809108337, "loss": 1.9597, "step": 24550 }, { "epoch": 0.66, "learning_rate": 0.0005481124337192892, "loss": 2.3142, "step": 24551 }, { "epoch": 0.66, "learning_rate": 0.0005480347899511639, "loss": 2.5626, "step": 24552 }, { "epoch": 0.66, "learning_rate": 0.0005479571496070468, "loss": 2.4803, "step": 24553 }, { "epoch": 0.66, "learning_rate": 0.0005478795126875244, "loss": 2.4077, "step": 24554 }, { "epoch": 0.66, "learning_rate": 0.0005478018791931871, "loss": 2.2418, "step": 24555 }, { "epoch": 0.66, "learning_rate": 0.0005477242491246214, "loss": 2.4129, "step": 24556 }, { "epoch": 0.66, "learning_rate": 0.0005476466224824159, "loss": 2.4933, "step": 24557 }, { "epoch": 0.66, "learning_rate": 0.000547568999267159, "loss": 2.2265, "step": 24558 }, { "epoch": 0.66, "learning_rate": 0.0005474913794794383, "loss": 2.4838, "step": 24559 }, { "epoch": 0.66, "learning_rate": 0.0005474137631198419, "loss": 2.4176, "step": 24560 }, { "epoch": 0.66, "learning_rate": 0.000547336150188958, "loss": 2.397, "step": 24561 }, { "epoch": 0.66, "learning_rate": 0.0005472585406873744, "loss": 2.6182, "step": 24562 }, { "epoch": 0.66, "learning_rate": 0.0005471809346156792, "loss": 2.6249, "step": 24563 }, { "epoch": 0.66, "learning_rate": 0.0005471033319744607, "loss": 2.3079, "step": 24564 }, { "epoch": 0.66, "learning_rate": 0.0005470257327643059, "loss": 2.4917, "step": 24565 }, { "epoch": 0.66, "learning_rate": 0.0005469481369858036, "loss": 2.5673, "step": 24566 }, { "epoch": 0.66, "learning_rate": 0.0005468705446395405, "loss": 2.1022, "step": 24567 }, { "epoch": 0.66, "learning_rate": 0.0005467929557261054, "loss": 2.6368, "step": 24568 }, { "epoch": 0.66, "learning_rate": 0.0005467153702460863, "loss": 2.5845, "step": 24569 }, { "epoch": 0.66, "learning_rate": 0.0005466377882000702, "loss": 2.3479, "step": 24570 }, { "epoch": 0.66, "learning_rate": 0.000546560209588645, "loss": 2.7896, "step": 24571 }, { "epoch": 0.66, "learning_rate": 0.0005464826344123992, "loss": 2.4971, "step": 24572 }, { "epoch": 0.66, "learning_rate": 0.0005464050626719192, "loss": 2.2201, "step": 24573 }, { "epoch": 0.66, "learning_rate": 0.0005463274943677937, "loss": 2.3789, "step": 24574 }, { "epoch": 0.66, "learning_rate": 0.0005462499295006098, "loss": 2.5822, "step": 24575 }, { "epoch": 0.66, "learning_rate": 0.0005461723680709553, "loss": 2.6725, "step": 24576 }, { "epoch": 0.66, "learning_rate": 0.000546094810079418, "loss": 2.7732, "step": 24577 }, { "epoch": 0.66, "learning_rate": 0.0005460172555265852, "loss": 2.9906, "step": 24578 }, { "epoch": 0.66, "learning_rate": 0.0005459397044130446, "loss": 2.1444, "step": 24579 }, { "epoch": 0.66, "learning_rate": 0.0005458621567393833, "loss": 2.6295, "step": 24580 }, { "epoch": 0.66, "learning_rate": 0.0005457846125061891, "loss": 2.2693, "step": 24581 }, { "epoch": 0.66, "learning_rate": 0.00054570707171405, "loss": 2.491, "step": 24582 }, { "epoch": 0.66, "learning_rate": 0.0005456295343635526, "loss": 2.4906, "step": 24583 }, { "epoch": 0.66, "learning_rate": 0.0005455520004552845, "loss": 2.9464, "step": 24584 }, { "epoch": 0.66, "learning_rate": 0.0005454744699898335, "loss": 2.3267, "step": 24585 }, { "epoch": 0.66, "learning_rate": 0.0005453969429677865, "loss": 2.1211, "step": 24586 }, { "epoch": 0.66, "learning_rate": 0.0005453194193897308, "loss": 2.7007, "step": 24587 }, { "epoch": 0.66, "learning_rate": 0.000545241899256254, "loss": 2.5809, "step": 24588 }, { "epoch": 0.66, "learning_rate": 0.0005451643825679431, "loss": 2.2727, "step": 24589 }, { "epoch": 0.66, "learning_rate": 0.0005450868693253861, "loss": 2.4514, "step": 24590 }, { "epoch": 0.66, "learning_rate": 0.0005450093595291692, "loss": 2.7511, "step": 24591 }, { "epoch": 0.66, "learning_rate": 0.00054493185317988, "loss": 2.6606, "step": 24592 }, { "epoch": 0.66, "learning_rate": 0.0005448543502781057, "loss": 2.4612, "step": 24593 }, { "epoch": 0.66, "learning_rate": 0.0005447768508244335, "loss": 2.3663, "step": 24594 }, { "epoch": 0.66, "learning_rate": 0.0005446993548194506, "loss": 2.2518, "step": 24595 }, { "epoch": 0.66, "learning_rate": 0.0005446218622637443, "loss": 2.7571, "step": 24596 }, { "epoch": 0.66, "learning_rate": 0.0005445443731579008, "loss": 2.1793, "step": 24597 }, { "epoch": 0.66, "learning_rate": 0.0005444668875025079, "loss": 2.8519, "step": 24598 }, { "epoch": 0.66, "learning_rate": 0.0005443894052981527, "loss": 2.2447, "step": 24599 }, { "epoch": 0.66, "learning_rate": 0.0005443119265454216, "loss": 2.535, "step": 24600 }, { "epoch": 0.66, "learning_rate": 0.0005442344512449019, "loss": 2.4171, "step": 24601 }, { "epoch": 0.66, "learning_rate": 0.0005441569793971805, "loss": 2.7996, "step": 24602 }, { "epoch": 0.66, "learning_rate": 0.0005440795110028443, "loss": 2.4824, "step": 24603 }, { "epoch": 0.66, "learning_rate": 0.0005440020460624806, "loss": 2.369, "step": 24604 }, { "epoch": 0.66, "learning_rate": 0.0005439245845766754, "loss": 2.6018, "step": 24605 }, { "epoch": 0.66, "learning_rate": 0.000543847126546016, "loss": 2.3395, "step": 24606 }, { "epoch": 0.66, "learning_rate": 0.0005437696719710894, "loss": 2.4094, "step": 24607 }, { "epoch": 0.66, "learning_rate": 0.0005436922208524822, "loss": 2.7481, "step": 24608 }, { "epoch": 0.66, "learning_rate": 0.0005436147731907815, "loss": 2.5672, "step": 24609 }, { "epoch": 0.66, "learning_rate": 0.0005435373289865732, "loss": 2.6438, "step": 24610 }, { "epoch": 0.66, "learning_rate": 0.0005434598882404445, "loss": 2.5498, "step": 24611 }, { "epoch": 0.66, "learning_rate": 0.0005433824509529824, "loss": 2.7179, "step": 24612 }, { "epoch": 0.66, "learning_rate": 0.000543305017124773, "loss": 2.4676, "step": 24613 }, { "epoch": 0.66, "learning_rate": 0.0005432275867564028, "loss": 2.429, "step": 24614 }, { "epoch": 0.66, "learning_rate": 0.0005431501598484592, "loss": 3.0709, "step": 24615 }, { "epoch": 0.66, "learning_rate": 0.0005430727364015282, "loss": 2.4061, "step": 24616 }, { "epoch": 0.66, "learning_rate": 0.0005429953164161967, "loss": 2.4257, "step": 24617 }, { "epoch": 0.66, "learning_rate": 0.0005429178998930507, "loss": 2.6303, "step": 24618 }, { "epoch": 0.66, "learning_rate": 0.0005428404868326769, "loss": 2.8137, "step": 24619 }, { "epoch": 0.66, "learning_rate": 0.0005427630772356618, "loss": 2.8232, "step": 24620 }, { "epoch": 0.66, "learning_rate": 0.0005426856711025919, "loss": 2.6411, "step": 24621 }, { "epoch": 0.66, "learning_rate": 0.0005426082684340536, "loss": 2.4079, "step": 24622 }, { "epoch": 0.66, "learning_rate": 0.0005425308692306338, "loss": 2.7986, "step": 24623 }, { "epoch": 0.66, "learning_rate": 0.0005424534734929179, "loss": 2.256, "step": 24624 }, { "epoch": 0.66, "learning_rate": 0.0005423760812214931, "loss": 2.3876, "step": 24625 }, { "epoch": 0.66, "learning_rate": 0.0005422986924169447, "loss": 2.7173, "step": 24626 }, { "epoch": 0.66, "learning_rate": 0.0005422213070798594, "loss": 2.6029, "step": 24627 }, { "epoch": 0.66, "learning_rate": 0.0005421439252108242, "loss": 2.4508, "step": 24628 }, { "epoch": 0.66, "learning_rate": 0.0005420665468104246, "loss": 2.6036, "step": 24629 }, { "epoch": 0.66, "learning_rate": 0.0005419891718792469, "loss": 2.5214, "step": 24630 }, { "epoch": 0.66, "learning_rate": 0.0005419118004178778, "loss": 2.3967, "step": 24631 }, { "epoch": 0.66, "learning_rate": 0.0005418344324269025, "loss": 2.6236, "step": 24632 }, { "epoch": 0.66, "learning_rate": 0.0005417570679069076, "loss": 2.4606, "step": 24633 }, { "epoch": 0.66, "learning_rate": 0.0005416797068584793, "loss": 2.1572, "step": 24634 }, { "epoch": 0.66, "learning_rate": 0.0005416023492822035, "loss": 2.7657, "step": 24635 }, { "epoch": 0.66, "learning_rate": 0.000541524995178667, "loss": 2.3496, "step": 24636 }, { "epoch": 0.66, "learning_rate": 0.0005414476445484546, "loss": 2.6037, "step": 24637 }, { "epoch": 0.66, "learning_rate": 0.0005413702973921528, "loss": 2.9325, "step": 24638 }, { "epoch": 0.66, "learning_rate": 0.0005412929537103482, "loss": 2.7341, "step": 24639 }, { "epoch": 0.66, "learning_rate": 0.0005412156135036252, "loss": 2.6344, "step": 24640 }, { "epoch": 0.66, "learning_rate": 0.0005411382767725713, "loss": 2.4257, "step": 24641 }, { "epoch": 0.66, "learning_rate": 0.0005410609435177719, "loss": 2.3763, "step": 24642 }, { "epoch": 0.66, "learning_rate": 0.0005409836137398125, "loss": 2.4199, "step": 24643 }, { "epoch": 0.66, "learning_rate": 0.0005409062874392796, "loss": 2.6381, "step": 24644 }, { "epoch": 0.66, "learning_rate": 0.0005408289646167581, "loss": 2.2546, "step": 24645 }, { "epoch": 0.66, "learning_rate": 0.0005407516452728343, "loss": 2.5799, "step": 24646 }, { "epoch": 0.66, "learning_rate": 0.000540674329408094, "loss": 2.5842, "step": 24647 }, { "epoch": 0.66, "learning_rate": 0.0005405970170231228, "loss": 2.5267, "step": 24648 }, { "epoch": 0.66, "learning_rate": 0.0005405197081185065, "loss": 2.4742, "step": 24649 }, { "epoch": 0.66, "learning_rate": 0.0005404424026948312, "loss": 2.4331, "step": 24650 }, { "epoch": 0.66, "learning_rate": 0.0005403651007526815, "loss": 2.5396, "step": 24651 }, { "epoch": 0.66, "learning_rate": 0.0005402878022926441, "loss": 2.4466, "step": 24652 }, { "epoch": 0.66, "learning_rate": 0.0005402105073153034, "loss": 2.7566, "step": 24653 }, { "epoch": 0.66, "learning_rate": 0.0005401332158212461, "loss": 2.6545, "step": 24654 }, { "epoch": 0.66, "learning_rate": 0.0005400559278110577, "loss": 2.6737, "step": 24655 }, { "epoch": 0.66, "learning_rate": 0.0005399786432853229, "loss": 2.8814, "step": 24656 }, { "epoch": 0.66, "learning_rate": 0.0005399013622446277, "loss": 2.2335, "step": 24657 }, { "epoch": 0.66, "learning_rate": 0.0005398240846895579, "loss": 2.8269, "step": 24658 }, { "epoch": 0.66, "learning_rate": 0.0005397468106206982, "loss": 2.7367, "step": 24659 }, { "epoch": 0.66, "learning_rate": 0.0005396695400386345, "loss": 2.3389, "step": 24660 }, { "epoch": 0.66, "learning_rate": 0.0005395922729439518, "loss": 1.7356, "step": 24661 }, { "epoch": 0.66, "learning_rate": 0.0005395150093372358, "loss": 2.3539, "step": 24662 }, { "epoch": 0.66, "learning_rate": 0.0005394377492190723, "loss": 2.4665, "step": 24663 }, { "epoch": 0.66, "learning_rate": 0.0005393604925900457, "loss": 2.0678, "step": 24664 }, { "epoch": 0.66, "learning_rate": 0.0005392832394507415, "loss": 2.8423, "step": 24665 }, { "epoch": 0.66, "learning_rate": 0.0005392059898017452, "loss": 2.3604, "step": 24666 }, { "epoch": 0.66, "learning_rate": 0.0005391287436436418, "loss": 3.031, "step": 24667 }, { "epoch": 0.66, "learning_rate": 0.0005390515009770172, "loss": 2.976, "step": 24668 }, { "epoch": 0.66, "learning_rate": 0.0005389742618024556, "loss": 2.5098, "step": 24669 }, { "epoch": 0.66, "learning_rate": 0.0005388970261205425, "loss": 2.2671, "step": 24670 }, { "epoch": 0.66, "learning_rate": 0.0005388197939318636, "loss": 2.5246, "step": 24671 }, { "epoch": 0.66, "learning_rate": 0.000538742565237003, "loss": 2.5875, "step": 24672 }, { "epoch": 0.66, "learning_rate": 0.0005386653400365462, "loss": 2.2974, "step": 24673 }, { "epoch": 0.66, "learning_rate": 0.0005385881183310783, "loss": 2.3142, "step": 24674 }, { "epoch": 0.66, "learning_rate": 0.0005385109001211846, "loss": 2.9201, "step": 24675 }, { "epoch": 0.66, "learning_rate": 0.0005384336854074494, "loss": 2.1587, "step": 24676 }, { "epoch": 0.66, "learning_rate": 0.0005383564741904587, "loss": 2.4211, "step": 24677 }, { "epoch": 0.66, "learning_rate": 0.0005382792664707965, "loss": 2.5268, "step": 24678 }, { "epoch": 0.66, "learning_rate": 0.000538202062249048, "loss": 2.3499, "step": 24679 }, { "epoch": 0.66, "learning_rate": 0.000538124861525798, "loss": 2.2457, "step": 24680 }, { "epoch": 0.66, "learning_rate": 0.0005380476643016314, "loss": 2.2229, "step": 24681 }, { "epoch": 0.66, "learning_rate": 0.0005379704705771338, "loss": 2.5814, "step": 24682 }, { "epoch": 0.66, "learning_rate": 0.0005378932803528887, "loss": 2.5187, "step": 24683 }, { "epoch": 0.66, "learning_rate": 0.0005378160936294815, "loss": 2.4795, "step": 24684 }, { "epoch": 0.66, "learning_rate": 0.0005377389104074975, "loss": 2.4368, "step": 24685 }, { "epoch": 0.66, "learning_rate": 0.0005376617306875199, "loss": 2.492, "step": 24686 }, { "epoch": 0.66, "learning_rate": 0.0005375845544701352, "loss": 2.202, "step": 24687 }, { "epoch": 0.66, "learning_rate": 0.0005375073817559268, "loss": 2.5451, "step": 24688 }, { "epoch": 0.66, "learning_rate": 0.00053743021254548, "loss": 2.4068, "step": 24689 }, { "epoch": 0.66, "learning_rate": 0.0005373530468393793, "loss": 2.9323, "step": 24690 }, { "epoch": 0.66, "learning_rate": 0.0005372758846382091, "loss": 2.5674, "step": 24691 }, { "epoch": 0.66, "learning_rate": 0.0005371987259425539, "loss": 2.2099, "step": 24692 }, { "epoch": 0.66, "learning_rate": 0.0005371215707529984, "loss": 2.6119, "step": 24693 }, { "epoch": 0.66, "learning_rate": 0.0005370444190701271, "loss": 2.4659, "step": 24694 }, { "epoch": 0.66, "learning_rate": 0.000536967270894525, "loss": 2.6579, "step": 24695 }, { "epoch": 0.66, "learning_rate": 0.0005368901262267758, "loss": 2.3384, "step": 24696 }, { "epoch": 0.66, "learning_rate": 0.000536812985067464, "loss": 2.3163, "step": 24697 }, { "epoch": 0.66, "learning_rate": 0.0005367358474171746, "loss": 2.2209, "step": 24698 }, { "epoch": 0.66, "learning_rate": 0.000536658713276491, "loss": 2.6449, "step": 24699 }, { "epoch": 0.66, "learning_rate": 0.0005365815826459983, "loss": 2.5667, "step": 24700 }, { "epoch": 0.66, "learning_rate": 0.0005365044555262812, "loss": 2.1997, "step": 24701 }, { "epoch": 0.66, "learning_rate": 0.0005364273319179232, "loss": 2.2386, "step": 24702 }, { "epoch": 0.66, "learning_rate": 0.0005363502118215091, "loss": 2.3054, "step": 24703 }, { "epoch": 0.66, "learning_rate": 0.0005362730952376226, "loss": 2.3126, "step": 24704 }, { "epoch": 0.66, "learning_rate": 0.0005361959821668481, "loss": 2.6013, "step": 24705 }, { "epoch": 0.66, "learning_rate": 0.0005361188726097701, "loss": 2.4858, "step": 24706 }, { "epoch": 0.66, "learning_rate": 0.0005360417665669723, "loss": 2.3558, "step": 24707 }, { "epoch": 0.66, "learning_rate": 0.0005359646640390395, "loss": 2.4458, "step": 24708 }, { "epoch": 0.66, "learning_rate": 0.0005358875650265556, "loss": 2.6037, "step": 24709 }, { "epoch": 0.66, "learning_rate": 0.0005358104695301042, "loss": 2.1726, "step": 24710 }, { "epoch": 0.66, "learning_rate": 0.0005357333775502696, "loss": 2.6564, "step": 24711 }, { "epoch": 0.66, "learning_rate": 0.000535656289087636, "loss": 2.31, "step": 24712 }, { "epoch": 0.66, "learning_rate": 0.0005355792041427874, "loss": 2.58, "step": 24713 }, { "epoch": 0.66, "learning_rate": 0.0005355021227163079, "loss": 2.7936, "step": 24714 }, { "epoch": 0.66, "learning_rate": 0.0005354250448087812, "loss": 2.8206, "step": 24715 }, { "epoch": 0.66, "learning_rate": 0.0005353479704207911, "loss": 2.3185, "step": 24716 }, { "epoch": 0.66, "learning_rate": 0.0005352708995529221, "loss": 2.1458, "step": 24717 }, { "epoch": 0.66, "learning_rate": 0.0005351938322057572, "loss": 2.1856, "step": 24718 }, { "epoch": 0.66, "learning_rate": 0.000535116768379881, "loss": 2.5726, "step": 24719 }, { "epoch": 0.66, "learning_rate": 0.0005350397080758769, "loss": 2.4479, "step": 24720 }, { "epoch": 0.66, "learning_rate": 0.0005349626512943288, "loss": 2.5504, "step": 24721 }, { "epoch": 0.66, "learning_rate": 0.000534885598035821, "loss": 2.3361, "step": 24722 }, { "epoch": 0.66, "learning_rate": 0.0005348085483009361, "loss": 2.5295, "step": 24723 }, { "epoch": 0.66, "learning_rate": 0.0005347315020902588, "loss": 2.3983, "step": 24724 }, { "epoch": 0.66, "learning_rate": 0.0005346544594043723, "loss": 2.5478, "step": 24725 }, { "epoch": 0.66, "learning_rate": 0.0005345774202438605, "loss": 2.6537, "step": 24726 }, { "epoch": 0.66, "learning_rate": 0.0005345003846093068, "loss": 2.2522, "step": 24727 }, { "epoch": 0.66, "learning_rate": 0.0005344233525012956, "loss": 2.1963, "step": 24728 }, { "epoch": 0.66, "learning_rate": 0.0005343463239204093, "loss": 2.1872, "step": 24729 }, { "epoch": 0.66, "learning_rate": 0.0005342692988672324, "loss": 2.3075, "step": 24730 }, { "epoch": 0.66, "learning_rate": 0.0005341922773423475, "loss": 2.2891, "step": 24731 }, { "epoch": 0.66, "learning_rate": 0.0005341152593463388, "loss": 2.0232, "step": 24732 }, { "epoch": 0.66, "learning_rate": 0.0005340382448797896, "loss": 2.3277, "step": 24733 }, { "epoch": 0.66, "learning_rate": 0.0005339612339432834, "loss": 2.4205, "step": 24734 }, { "epoch": 0.66, "learning_rate": 0.0005338842265374035, "loss": 2.6097, "step": 24735 }, { "epoch": 0.66, "learning_rate": 0.0005338072226627337, "loss": 2.4586, "step": 24736 }, { "epoch": 0.66, "learning_rate": 0.0005337302223198568, "loss": 2.5654, "step": 24737 }, { "epoch": 0.66, "learning_rate": 0.0005336532255093562, "loss": 2.8495, "step": 24738 }, { "epoch": 0.66, "learning_rate": 0.0005335762322318154, "loss": 2.7614, "step": 24739 }, { "epoch": 0.66, "learning_rate": 0.0005334992424878178, "loss": 2.5783, "step": 24740 }, { "epoch": 0.66, "learning_rate": 0.0005334222562779469, "loss": 2.608, "step": 24741 }, { "epoch": 0.66, "learning_rate": 0.000533345273602785, "loss": 2.3094, "step": 24742 }, { "epoch": 0.66, "learning_rate": 0.0005332682944629161, "loss": 2.2829, "step": 24743 }, { "epoch": 0.66, "learning_rate": 0.0005331913188589234, "loss": 2.4781, "step": 24744 }, { "epoch": 0.66, "learning_rate": 0.0005331143467913894, "loss": 2.678, "step": 24745 }, { "epoch": 0.67, "learning_rate": 0.0005330373782608975, "loss": 2.7654, "step": 24746 }, { "epoch": 0.67, "learning_rate": 0.0005329604132680314, "loss": 2.6965, "step": 24747 }, { "epoch": 0.67, "learning_rate": 0.0005328834518133737, "loss": 2.86, "step": 24748 }, { "epoch": 0.67, "learning_rate": 0.0005328064938975075, "loss": 2.856, "step": 24749 }, { "epoch": 0.67, "learning_rate": 0.0005327295395210154, "loss": 2.2042, "step": 24750 }, { "epoch": 0.67, "learning_rate": 0.0005326525886844809, "loss": 2.2542, "step": 24751 }, { "epoch": 0.67, "learning_rate": 0.0005325756413884869, "loss": 2.8151, "step": 24752 }, { "epoch": 0.67, "learning_rate": 0.0005324986976336161, "loss": 2.9185, "step": 24753 }, { "epoch": 0.67, "learning_rate": 0.0005324217574204517, "loss": 2.3809, "step": 24754 }, { "epoch": 0.67, "learning_rate": 0.0005323448207495769, "loss": 2.7333, "step": 24755 }, { "epoch": 0.67, "learning_rate": 0.0005322678876215737, "loss": 2.4967, "step": 24756 }, { "epoch": 0.67, "learning_rate": 0.0005321909580370257, "loss": 2.5712, "step": 24757 }, { "epoch": 0.67, "learning_rate": 0.000532114031996515, "loss": 2.6284, "step": 24758 }, { "epoch": 0.67, "learning_rate": 0.0005320371095006242, "loss": 2.3635, "step": 24759 }, { "epoch": 0.67, "learning_rate": 0.0005319601905499376, "loss": 2.8117, "step": 24760 }, { "epoch": 0.67, "learning_rate": 0.0005318832751450365, "loss": 2.4981, "step": 24761 }, { "epoch": 0.67, "learning_rate": 0.0005318063632865039, "loss": 2.2456, "step": 24762 }, { "epoch": 0.67, "learning_rate": 0.000531729454974923, "loss": 2.4188, "step": 24763 }, { "epoch": 0.67, "learning_rate": 0.0005316525502108757, "loss": 2.7719, "step": 24764 }, { "epoch": 0.67, "learning_rate": 0.000531575648994945, "loss": 2.5907, "step": 24765 }, { "epoch": 0.67, "learning_rate": 0.0005314987513277133, "loss": 2.6022, "step": 24766 }, { "epoch": 0.67, "learning_rate": 0.0005314218572097634, "loss": 2.5714, "step": 24767 }, { "epoch": 0.67, "learning_rate": 0.000531344966641678, "loss": 2.5575, "step": 24768 }, { "epoch": 0.67, "learning_rate": 0.000531268079624039, "loss": 2.8799, "step": 24769 }, { "epoch": 0.67, "learning_rate": 0.0005311911961574294, "loss": 2.7016, "step": 24770 }, { "epoch": 0.67, "learning_rate": 0.0005311143162424317, "loss": 2.4575, "step": 24771 }, { "epoch": 0.67, "learning_rate": 0.0005310374398796273, "loss": 2.2315, "step": 24772 }, { "epoch": 0.67, "learning_rate": 0.0005309605670696003, "loss": 2.0144, "step": 24773 }, { "epoch": 0.67, "learning_rate": 0.0005308836978129318, "loss": 2.5622, "step": 24774 }, { "epoch": 0.67, "learning_rate": 0.0005308068321102044, "loss": 2.7773, "step": 24775 }, { "epoch": 0.67, "learning_rate": 0.0005307299699620012, "loss": 2.3486, "step": 24776 }, { "epoch": 0.67, "learning_rate": 0.0005306531113689032, "loss": 2.5637, "step": 24777 }, { "epoch": 0.67, "learning_rate": 0.0005305762563314935, "loss": 2.2638, "step": 24778 }, { "epoch": 0.67, "learning_rate": 0.000530499404850354, "loss": 2.5946, "step": 24779 }, { "epoch": 0.67, "learning_rate": 0.0005304225569260672, "loss": 2.445, "step": 24780 }, { "epoch": 0.67, "learning_rate": 0.0005303457125592155, "loss": 2.5065, "step": 24781 }, { "epoch": 0.67, "learning_rate": 0.0005302688717503803, "loss": 2.5381, "step": 24782 }, { "epoch": 0.67, "learning_rate": 0.0005301920345001442, "loss": 2.3936, "step": 24783 }, { "epoch": 0.67, "learning_rate": 0.0005301152008090896, "loss": 2.3586, "step": 24784 }, { "epoch": 0.67, "learning_rate": 0.0005300383706777974, "loss": 2.684, "step": 24785 }, { "epoch": 0.67, "learning_rate": 0.0005299615441068511, "loss": 2.4578, "step": 24786 }, { "epoch": 0.67, "learning_rate": 0.0005298847210968323, "loss": 2.5536, "step": 24787 }, { "epoch": 0.67, "learning_rate": 0.0005298079016483224, "loss": 2.947, "step": 24788 }, { "epoch": 0.67, "learning_rate": 0.0005297310857619037, "loss": 2.5454, "step": 24789 }, { "epoch": 0.67, "learning_rate": 0.0005296542734381589, "loss": 2.6867, "step": 24790 }, { "epoch": 0.67, "learning_rate": 0.0005295774646776686, "loss": 2.384, "step": 24791 }, { "epoch": 0.67, "learning_rate": 0.0005295006594810154, "loss": 2.8795, "step": 24792 }, { "epoch": 0.67, "learning_rate": 0.0005294238578487812, "loss": 2.5521, "step": 24793 }, { "epoch": 0.67, "learning_rate": 0.0005293470597815475, "loss": 2.1965, "step": 24794 }, { "epoch": 0.67, "learning_rate": 0.0005292702652798969, "loss": 2.2676, "step": 24795 }, { "epoch": 0.67, "learning_rate": 0.00052919347434441, "loss": 2.5869, "step": 24796 }, { "epoch": 0.67, "learning_rate": 0.0005291166869756694, "loss": 2.0948, "step": 24797 }, { "epoch": 0.67, "learning_rate": 0.0005290399031742564, "loss": 2.768, "step": 24798 }, { "epoch": 0.67, "learning_rate": 0.000528963122940753, "loss": 2.6545, "step": 24799 }, { "epoch": 0.67, "learning_rate": 0.0005288863462757412, "loss": 2.2389, "step": 24800 }, { "epoch": 0.67, "learning_rate": 0.0005288095731798017, "loss": 2.2132, "step": 24801 }, { "epoch": 0.67, "learning_rate": 0.0005287328036535169, "loss": 2.9805, "step": 24802 }, { "epoch": 0.67, "learning_rate": 0.0005286560376974683, "loss": 2.4209, "step": 24803 }, { "epoch": 0.67, "learning_rate": 0.0005285792753122369, "loss": 2.7414, "step": 24804 }, { "epoch": 0.67, "learning_rate": 0.0005285025164984046, "loss": 2.5701, "step": 24805 }, { "epoch": 0.67, "learning_rate": 0.000528425761256553, "loss": 2.8071, "step": 24806 }, { "epoch": 0.67, "learning_rate": 0.0005283490095872635, "loss": 2.6334, "step": 24807 }, { "epoch": 0.67, "learning_rate": 0.0005282722614911179, "loss": 2.322, "step": 24808 }, { "epoch": 0.67, "learning_rate": 0.0005281955169686972, "loss": 2.1915, "step": 24809 }, { "epoch": 0.67, "learning_rate": 0.0005281187760205827, "loss": 2.2293, "step": 24810 }, { "epoch": 0.67, "learning_rate": 0.0005280420386473559, "loss": 3.0115, "step": 24811 }, { "epoch": 0.67, "learning_rate": 0.0005279653048495985, "loss": 2.4596, "step": 24812 }, { "epoch": 0.67, "learning_rate": 0.0005278885746278913, "loss": 2.6486, "step": 24813 }, { "epoch": 0.67, "learning_rate": 0.0005278118479828163, "loss": 2.2298, "step": 24814 }, { "epoch": 0.67, "learning_rate": 0.000527735124914954, "loss": 2.4404, "step": 24815 }, { "epoch": 0.67, "learning_rate": 0.0005276584054248863, "loss": 2.7141, "step": 24816 }, { "epoch": 0.67, "learning_rate": 0.0005275816895131938, "loss": 2.1117, "step": 24817 }, { "epoch": 0.67, "learning_rate": 0.0005275049771804579, "loss": 2.3855, "step": 24818 }, { "epoch": 0.67, "learning_rate": 0.0005274282684272597, "loss": 2.3436, "step": 24819 }, { "epoch": 0.67, "learning_rate": 0.0005273515632541805, "loss": 2.6407, "step": 24820 }, { "epoch": 0.67, "learning_rate": 0.0005272748616618015, "loss": 1.91, "step": 24821 }, { "epoch": 0.67, "learning_rate": 0.000527198163650704, "loss": 2.2655, "step": 24822 }, { "epoch": 0.67, "learning_rate": 0.0005271214692214681, "loss": 2.5886, "step": 24823 }, { "epoch": 0.67, "learning_rate": 0.0005270447783746754, "loss": 2.4951, "step": 24824 }, { "epoch": 0.67, "learning_rate": 0.0005269680911109072, "loss": 2.1709, "step": 24825 }, { "epoch": 0.67, "learning_rate": 0.0005268914074307439, "loss": 2.7498, "step": 24826 }, { "epoch": 0.67, "learning_rate": 0.0005268147273347672, "loss": 2.7222, "step": 24827 }, { "epoch": 0.67, "learning_rate": 0.0005267380508235572, "loss": 2.7655, "step": 24828 }, { "epoch": 0.67, "learning_rate": 0.000526661377897695, "loss": 2.5048, "step": 24829 }, { "epoch": 0.67, "learning_rate": 0.000526584708557762, "loss": 2.3381, "step": 24830 }, { "epoch": 0.67, "learning_rate": 0.0005265080428043383, "loss": 2.9287, "step": 24831 }, { "epoch": 0.67, "learning_rate": 0.0005264313806380046, "loss": 2.2444, "step": 24832 }, { "epoch": 0.67, "learning_rate": 0.0005263547220593428, "loss": 2.775, "step": 24833 }, { "epoch": 0.67, "learning_rate": 0.0005262780670689326, "loss": 2.4951, "step": 24834 }, { "epoch": 0.67, "learning_rate": 0.0005262014156673554, "loss": 2.9419, "step": 24835 }, { "epoch": 0.67, "learning_rate": 0.0005261247678551912, "loss": 2.924, "step": 24836 }, { "epoch": 0.67, "learning_rate": 0.0005260481236330211, "loss": 2.7403, "step": 24837 }, { "epoch": 0.67, "learning_rate": 0.0005259714830014257, "loss": 2.6902, "step": 24838 }, { "epoch": 0.67, "learning_rate": 0.0005258948459609856, "loss": 2.7632, "step": 24839 }, { "epoch": 0.67, "learning_rate": 0.0005258182125122813, "loss": 2.1833, "step": 24840 }, { "epoch": 0.67, "learning_rate": 0.0005257415826558937, "loss": 2.3445, "step": 24841 }, { "epoch": 0.67, "learning_rate": 0.000525664956392403, "loss": 2.2277, "step": 24842 }, { "epoch": 0.67, "learning_rate": 0.00052558833372239, "loss": 2.4646, "step": 24843 }, { "epoch": 0.67, "learning_rate": 0.0005255117146464346, "loss": 2.2072, "step": 24844 }, { "epoch": 0.67, "learning_rate": 0.0005254350991651172, "loss": 2.0333, "step": 24845 }, { "epoch": 0.67, "learning_rate": 0.0005253584872790196, "loss": 2.5733, "step": 24846 }, { "epoch": 0.67, "learning_rate": 0.0005252818789887206, "loss": 1.7871, "step": 24847 }, { "epoch": 0.67, "learning_rate": 0.0005252052742948013, "loss": 2.4971, "step": 24848 }, { "epoch": 0.67, "learning_rate": 0.0005251286731978424, "loss": 2.4703, "step": 24849 }, { "epoch": 0.67, "learning_rate": 0.0005250520756984234, "loss": 2.5799, "step": 24850 }, { "epoch": 0.67, "learning_rate": 0.0005249754817971249, "loss": 2.0636, "step": 24851 }, { "epoch": 0.67, "learning_rate": 0.0005248988914945272, "loss": 2.4349, "step": 24852 }, { "epoch": 0.67, "learning_rate": 0.0005248223047912106, "loss": 2.6802, "step": 24853 }, { "epoch": 0.67, "learning_rate": 0.0005247457216877557, "loss": 2.5567, "step": 24854 }, { "epoch": 0.67, "learning_rate": 0.0005246691421847418, "loss": 2.3238, "step": 24855 }, { "epoch": 0.67, "learning_rate": 0.0005245925662827496, "loss": 2.2105, "step": 24856 }, { "epoch": 0.67, "learning_rate": 0.0005245159939823589, "loss": 2.7434, "step": 24857 }, { "epoch": 0.67, "learning_rate": 0.0005244394252841503, "loss": 2.3396, "step": 24858 }, { "epoch": 0.67, "learning_rate": 0.0005243628601887034, "loss": 2.4132, "step": 24859 }, { "epoch": 0.67, "learning_rate": 0.0005242862986965988, "loss": 2.4498, "step": 24860 }, { "epoch": 0.67, "learning_rate": 0.0005242097408084159, "loss": 2.5671, "step": 24861 }, { "epoch": 0.67, "learning_rate": 0.0005241331865247352, "loss": 2.6535, "step": 24862 }, { "epoch": 0.67, "learning_rate": 0.000524056635846136, "loss": 2.43, "step": 24863 }, { "epoch": 0.67, "learning_rate": 0.0005239800887731988, "loss": 2.4668, "step": 24864 }, { "epoch": 0.67, "learning_rate": 0.0005239035453065033, "loss": 2.4234, "step": 24865 }, { "epoch": 0.67, "learning_rate": 0.0005238270054466293, "loss": 2.8278, "step": 24866 }, { "epoch": 0.67, "learning_rate": 0.0005237504691941569, "loss": 3.1707, "step": 24867 }, { "epoch": 0.67, "learning_rate": 0.0005236739365496662, "loss": 2.4019, "step": 24868 }, { "epoch": 0.67, "learning_rate": 0.0005235974075137361, "loss": 2.4035, "step": 24869 }, { "epoch": 0.67, "learning_rate": 0.0005235208820869469, "loss": 2.8789, "step": 24870 }, { "epoch": 0.67, "learning_rate": 0.0005234443602698782, "loss": 2.4112, "step": 24871 }, { "epoch": 0.67, "learning_rate": 0.0005233678420631101, "loss": 2.1167, "step": 24872 }, { "epoch": 0.67, "learning_rate": 0.0005232913274672222, "loss": 2.3668, "step": 24873 }, { "epoch": 0.67, "learning_rate": 0.0005232148164827936, "loss": 1.896, "step": 24874 }, { "epoch": 0.67, "learning_rate": 0.0005231383091104045, "loss": 2.4554, "step": 24875 }, { "epoch": 0.67, "learning_rate": 0.0005230618053506344, "loss": 2.3183, "step": 24876 }, { "epoch": 0.67, "learning_rate": 0.0005229853052040627, "loss": 1.8794, "step": 24877 }, { "epoch": 0.67, "learning_rate": 0.0005229088086712688, "loss": 2.2954, "step": 24878 }, { "epoch": 0.67, "learning_rate": 0.0005228323157528326, "loss": 2.5827, "step": 24879 }, { "epoch": 0.67, "learning_rate": 0.0005227558264493335, "loss": 2.5504, "step": 24880 }, { "epoch": 0.67, "learning_rate": 0.0005226793407613513, "loss": 2.8802, "step": 24881 }, { "epoch": 0.67, "learning_rate": 0.0005226028586894646, "loss": 2.6399, "step": 24882 }, { "epoch": 0.67, "learning_rate": 0.0005225263802342534, "loss": 2.5294, "step": 24883 }, { "epoch": 0.67, "learning_rate": 0.0005224499053962969, "loss": 2.5317, "step": 24884 }, { "epoch": 0.67, "learning_rate": 0.0005223734341761745, "loss": 2.3319, "step": 24885 }, { "epoch": 0.67, "learning_rate": 0.0005222969665744661, "loss": 2.7074, "step": 24886 }, { "epoch": 0.67, "learning_rate": 0.0005222205025917499, "loss": 2.2702, "step": 24887 }, { "epoch": 0.67, "learning_rate": 0.0005221440422286059, "loss": 2.4181, "step": 24888 }, { "epoch": 0.67, "learning_rate": 0.0005220675854856136, "loss": 2.5747, "step": 24889 }, { "epoch": 0.67, "learning_rate": 0.0005219911323633514, "loss": 2.2094, "step": 24890 }, { "epoch": 0.67, "learning_rate": 0.0005219146828623985, "loss": 2.6014, "step": 24891 }, { "epoch": 0.67, "learning_rate": 0.0005218382369833354, "loss": 2.4265, "step": 24892 }, { "epoch": 0.67, "learning_rate": 0.0005217617947267396, "loss": 2.7744, "step": 24893 }, { "epoch": 0.67, "learning_rate": 0.0005216853560931917, "loss": 2.703, "step": 24894 }, { "epoch": 0.67, "learning_rate": 0.0005216089210832696, "loss": 2.7307, "step": 24895 }, { "epoch": 0.67, "learning_rate": 0.0005215324896975526, "loss": 2.3464, "step": 24896 }, { "epoch": 0.67, "learning_rate": 0.00052145606193662, "loss": 2.7837, "step": 24897 }, { "epoch": 0.67, "learning_rate": 0.0005213796378010507, "loss": 2.7489, "step": 24898 }, { "epoch": 0.67, "learning_rate": 0.0005213032172914239, "loss": 2.1828, "step": 24899 }, { "epoch": 0.67, "learning_rate": 0.0005212268004083185, "loss": 2.0186, "step": 24900 }, { "epoch": 0.67, "learning_rate": 0.0005211503871523129, "loss": 2.43, "step": 24901 }, { "epoch": 0.67, "learning_rate": 0.0005210739775239863, "loss": 2.6265, "step": 24902 }, { "epoch": 0.67, "learning_rate": 0.0005209975715239182, "loss": 2.6272, "step": 24903 }, { "epoch": 0.67, "learning_rate": 0.0005209211691526858, "loss": 2.4167, "step": 24904 }, { "epoch": 0.67, "learning_rate": 0.0005208447704108701, "loss": 2.623, "step": 24905 }, { "epoch": 0.67, "learning_rate": 0.0005207683752990481, "loss": 2.62, "step": 24906 }, { "epoch": 0.67, "learning_rate": 0.0005206919838177992, "loss": 2.7394, "step": 24907 }, { "epoch": 0.67, "learning_rate": 0.0005206155959677028, "loss": 2.3074, "step": 24908 }, { "epoch": 0.67, "learning_rate": 0.0005205392117493364, "loss": 2.6507, "step": 24909 }, { "epoch": 0.67, "learning_rate": 0.0005204628311632791, "loss": 3.0143, "step": 24910 }, { "epoch": 0.67, "learning_rate": 0.0005203864542101098, "loss": 2.6788, "step": 24911 }, { "epoch": 0.67, "learning_rate": 0.0005203100808904069, "loss": 2.4745, "step": 24912 }, { "epoch": 0.67, "learning_rate": 0.0005202337112047495, "loss": 2.6232, "step": 24913 }, { "epoch": 0.67, "learning_rate": 0.0005201573451537153, "loss": 2.3938, "step": 24914 }, { "epoch": 0.67, "learning_rate": 0.0005200809827378833, "loss": 2.6647, "step": 24915 }, { "epoch": 0.67, "learning_rate": 0.0005200046239578325, "loss": 2.6863, "step": 24916 }, { "epoch": 0.67, "learning_rate": 0.0005199282688141398, "loss": 2.4369, "step": 24917 }, { "epoch": 0.67, "learning_rate": 0.0005198519173073852, "loss": 2.2478, "step": 24918 }, { "epoch": 0.67, "learning_rate": 0.000519775569438147, "loss": 2.3697, "step": 24919 }, { "epoch": 0.67, "learning_rate": 0.000519699225207003, "loss": 2.4502, "step": 24920 }, { "epoch": 0.67, "learning_rate": 0.000519622884614532, "loss": 2.1251, "step": 24921 }, { "epoch": 0.67, "learning_rate": 0.0005195465476613118, "loss": 2.072, "step": 24922 }, { "epoch": 0.67, "learning_rate": 0.0005194702143479211, "loss": 2.6535, "step": 24923 }, { "epoch": 0.67, "learning_rate": 0.0005193938846749382, "loss": 2.7946, "step": 24924 }, { "epoch": 0.67, "learning_rate": 0.0005193175586429412, "loss": 2.4046, "step": 24925 }, { "epoch": 0.67, "learning_rate": 0.0005192412362525085, "loss": 2.4343, "step": 24926 }, { "epoch": 0.67, "learning_rate": 0.0005191649175042186, "loss": 2.4246, "step": 24927 }, { "epoch": 0.67, "learning_rate": 0.000519088602398649, "loss": 2.5601, "step": 24928 }, { "epoch": 0.67, "learning_rate": 0.0005190122909363784, "loss": 2.5714, "step": 24929 }, { "epoch": 0.67, "learning_rate": 0.000518935983117984, "loss": 2.4629, "step": 24930 }, { "epoch": 0.67, "learning_rate": 0.000518859678944045, "loss": 2.5154, "step": 24931 }, { "epoch": 0.67, "learning_rate": 0.0005187833784151395, "loss": 2.4713, "step": 24932 }, { "epoch": 0.67, "learning_rate": 0.0005187070815318445, "loss": 2.152, "step": 24933 }, { "epoch": 0.67, "learning_rate": 0.0005186307882947388, "loss": 2.4379, "step": 24934 }, { "epoch": 0.67, "learning_rate": 0.0005185544987044004, "loss": 2.1334, "step": 24935 }, { "epoch": 0.67, "learning_rate": 0.0005184782127614069, "loss": 2.5789, "step": 24936 }, { "epoch": 0.67, "learning_rate": 0.0005184019304663361, "loss": 2.4148, "step": 24937 }, { "epoch": 0.67, "learning_rate": 0.0005183256518197663, "loss": 2.7322, "step": 24938 }, { "epoch": 0.67, "learning_rate": 0.0005182493768222753, "loss": 2.6571, "step": 24939 }, { "epoch": 0.67, "learning_rate": 0.0005181731054744412, "loss": 2.2795, "step": 24940 }, { "epoch": 0.67, "learning_rate": 0.0005180968377768412, "loss": 2.3505, "step": 24941 }, { "epoch": 0.67, "learning_rate": 0.0005180205737300534, "loss": 2.0991, "step": 24942 }, { "epoch": 0.67, "learning_rate": 0.0005179443133346555, "loss": 2.4082, "step": 24943 }, { "epoch": 0.67, "learning_rate": 0.0005178680565912253, "loss": 3.1203, "step": 24944 }, { "epoch": 0.67, "learning_rate": 0.0005177918035003405, "loss": 2.2103, "step": 24945 }, { "epoch": 0.67, "learning_rate": 0.0005177155540625792, "loss": 2.3308, "step": 24946 }, { "epoch": 0.67, "learning_rate": 0.0005176393082785182, "loss": 2.4549, "step": 24947 }, { "epoch": 0.67, "learning_rate": 0.0005175630661487361, "loss": 2.6179, "step": 24948 }, { "epoch": 0.67, "learning_rate": 0.0005174868276738094, "loss": 2.8211, "step": 24949 }, { "epoch": 0.67, "learning_rate": 0.0005174105928543163, "loss": 2.5679, "step": 24950 }, { "epoch": 0.67, "learning_rate": 0.0005173343616908342, "loss": 2.7371, "step": 24951 }, { "epoch": 0.67, "learning_rate": 0.0005172581341839408, "loss": 2.5417, "step": 24952 }, { "epoch": 0.67, "learning_rate": 0.0005171819103342134, "loss": 2.73, "step": 24953 }, { "epoch": 0.67, "learning_rate": 0.00051710569014223, "loss": 2.5873, "step": 24954 }, { "epoch": 0.67, "learning_rate": 0.000517029473608567, "loss": 2.9488, "step": 24955 }, { "epoch": 0.67, "learning_rate": 0.0005169532607338025, "loss": 2.5582, "step": 24956 }, { "epoch": 0.67, "learning_rate": 0.0005168770515185137, "loss": 2.8933, "step": 24957 }, { "epoch": 0.67, "learning_rate": 0.000516800845963278, "loss": 2.0771, "step": 24958 }, { "epoch": 0.67, "learning_rate": 0.000516724644068673, "loss": 2.2759, "step": 24959 }, { "epoch": 0.67, "learning_rate": 0.0005166484458352755, "loss": 2.1143, "step": 24960 }, { "epoch": 0.67, "learning_rate": 0.0005165722512636628, "loss": 2.5047, "step": 24961 }, { "epoch": 0.67, "learning_rate": 0.0005164960603544127, "loss": 2.7102, "step": 24962 }, { "epoch": 0.67, "learning_rate": 0.0005164198731081017, "loss": 2.4898, "step": 24963 }, { "epoch": 0.67, "learning_rate": 0.0005163436895253073, "loss": 2.7024, "step": 24964 }, { "epoch": 0.67, "learning_rate": 0.0005162675096066065, "loss": 2.7097, "step": 24965 }, { "epoch": 0.67, "learning_rate": 0.0005161913333525766, "loss": 2.5917, "step": 24966 }, { "epoch": 0.67, "learning_rate": 0.000516115160763795, "loss": 2.6148, "step": 24967 }, { "epoch": 0.67, "learning_rate": 0.0005160389918408382, "loss": 2.306, "step": 24968 }, { "epoch": 0.67, "learning_rate": 0.0005159628265842835, "loss": 2.7638, "step": 24969 }, { "epoch": 0.67, "learning_rate": 0.0005158866649947078, "loss": 2.3932, "step": 24970 }, { "epoch": 0.67, "learning_rate": 0.0005158105070726881, "loss": 2.4592, "step": 24971 }, { "epoch": 0.67, "learning_rate": 0.0005157343528188014, "loss": 2.6376, "step": 24972 }, { "epoch": 0.67, "learning_rate": 0.0005156582022336251, "loss": 2.2605, "step": 24973 }, { "epoch": 0.67, "learning_rate": 0.0005155820553177355, "loss": 2.3883, "step": 24974 }, { "epoch": 0.67, "learning_rate": 0.0005155059120717098, "loss": 2.1277, "step": 24975 }, { "epoch": 0.67, "learning_rate": 0.0005154297724961243, "loss": 2.4246, "step": 24976 }, { "epoch": 0.67, "learning_rate": 0.0005153536365915559, "loss": 2.5206, "step": 24977 }, { "epoch": 0.67, "learning_rate": 0.0005152775043585824, "loss": 2.6503, "step": 24978 }, { "epoch": 0.67, "learning_rate": 0.0005152013757977796, "loss": 2.577, "step": 24979 }, { "epoch": 0.67, "learning_rate": 0.0005151252509097244, "loss": 2.2586, "step": 24980 }, { "epoch": 0.67, "learning_rate": 0.0005150491296949942, "loss": 2.5442, "step": 24981 }, { "epoch": 0.67, "learning_rate": 0.0005149730121541645, "loss": 2.1952, "step": 24982 }, { "epoch": 0.67, "learning_rate": 0.0005148968982878127, "loss": 2.4916, "step": 24983 }, { "epoch": 0.67, "learning_rate": 0.000514820788096515, "loss": 2.65, "step": 24984 }, { "epoch": 0.67, "learning_rate": 0.0005147446815808484, "loss": 2.3738, "step": 24985 }, { "epoch": 0.67, "learning_rate": 0.0005146685787413898, "loss": 2.8569, "step": 24986 }, { "epoch": 0.67, "learning_rate": 0.0005145924795787149, "loss": 2.7023, "step": 24987 }, { "epoch": 0.67, "learning_rate": 0.0005145163840934004, "loss": 1.9093, "step": 24988 }, { "epoch": 0.67, "learning_rate": 0.0005144402922860236, "loss": 2.5446, "step": 24989 }, { "epoch": 0.67, "learning_rate": 0.0005143642041571595, "loss": 2.4227, "step": 24990 }, { "epoch": 0.67, "learning_rate": 0.000514288119707386, "loss": 2.81, "step": 24991 }, { "epoch": 0.67, "learning_rate": 0.0005142120389372786, "loss": 2.5501, "step": 24992 }, { "epoch": 0.67, "learning_rate": 0.000514135961847414, "loss": 2.7523, "step": 24993 }, { "epoch": 0.67, "learning_rate": 0.0005140598884383688, "loss": 2.2956, "step": 24994 }, { "epoch": 0.67, "learning_rate": 0.0005139838187107187, "loss": 2.5966, "step": 24995 }, { "epoch": 0.67, "learning_rate": 0.0005139077526650401, "loss": 2.3486, "step": 24996 }, { "epoch": 0.67, "learning_rate": 0.0005138316903019096, "loss": 1.9878, "step": 24997 }, { "epoch": 0.67, "learning_rate": 0.0005137556316219032, "loss": 2.3819, "step": 24998 }, { "epoch": 0.67, "learning_rate": 0.0005136795766255977, "loss": 2.9104, "step": 24999 }, { "epoch": 0.67, "learning_rate": 0.0005136035253135683, "loss": 2.3825, "step": 25000 }, { "epoch": 0.67, "learning_rate": 0.0005135274776863917, "loss": 2.3739, "step": 25001 }, { "epoch": 0.67, "learning_rate": 0.0005134514337446444, "loss": 2.2954, "step": 25002 }, { "epoch": 0.67, "learning_rate": 0.0005133753934889011, "loss": 2.4732, "step": 25003 }, { "epoch": 0.67, "learning_rate": 0.0005132993569197395, "loss": 2.1737, "step": 25004 }, { "epoch": 0.67, "learning_rate": 0.0005132233240377351, "loss": 2.4307, "step": 25005 }, { "epoch": 0.67, "learning_rate": 0.0005131472948434635, "loss": 2.7166, "step": 25006 }, { "epoch": 0.67, "learning_rate": 0.0005130712693375008, "loss": 2.4511, "step": 25007 }, { "epoch": 0.67, "learning_rate": 0.0005129952475204236, "loss": 2.1571, "step": 25008 }, { "epoch": 0.67, "learning_rate": 0.000512919229392807, "loss": 2.085, "step": 25009 }, { "epoch": 0.67, "learning_rate": 0.0005128432149552271, "loss": 2.6371, "step": 25010 }, { "epoch": 0.67, "learning_rate": 0.00051276720420826, "loss": 2.7007, "step": 25011 }, { "epoch": 0.67, "learning_rate": 0.0005126911971524814, "loss": 2.6136, "step": 25012 }, { "epoch": 0.67, "learning_rate": 0.0005126151937884677, "loss": 2.0742, "step": 25013 }, { "epoch": 0.67, "learning_rate": 0.0005125391941167936, "loss": 2.3569, "step": 25014 }, { "epoch": 0.67, "learning_rate": 0.0005124631981380355, "loss": 2.4688, "step": 25015 }, { "epoch": 0.67, "learning_rate": 0.000512387205852769, "loss": 2.5425, "step": 25016 }, { "epoch": 0.67, "learning_rate": 0.00051231121726157, "loss": 2.6378, "step": 25017 }, { "epoch": 0.67, "learning_rate": 0.0005122352323650143, "loss": 2.4703, "step": 25018 }, { "epoch": 0.67, "learning_rate": 0.0005121592511636768, "loss": 2.8223, "step": 25019 }, { "epoch": 0.67, "learning_rate": 0.0005120832736581337, "loss": 2.512, "step": 25020 }, { "epoch": 0.67, "learning_rate": 0.0005120072998489609, "loss": 2.5169, "step": 25021 }, { "epoch": 0.67, "learning_rate": 0.0005119313297367331, "loss": 2.1509, "step": 25022 }, { "epoch": 0.67, "learning_rate": 0.0005118553633220259, "loss": 2.2883, "step": 25023 }, { "epoch": 0.67, "learning_rate": 0.000511779400605416, "loss": 2.7249, "step": 25024 }, { "epoch": 0.67, "learning_rate": 0.0005117034415874776, "loss": 2.4581, "step": 25025 }, { "epoch": 0.67, "learning_rate": 0.0005116274862687871, "loss": 2.3503, "step": 25026 }, { "epoch": 0.67, "learning_rate": 0.0005115515346499191, "loss": 2.476, "step": 25027 }, { "epoch": 0.67, "learning_rate": 0.0005114755867314493, "loss": 2.1977, "step": 25028 }, { "epoch": 0.67, "learning_rate": 0.0005113996425139531, "loss": 2.7896, "step": 25029 }, { "epoch": 0.67, "learning_rate": 0.0005113237019980058, "loss": 2.7031, "step": 25030 }, { "epoch": 0.67, "learning_rate": 0.0005112477651841829, "loss": 2.1507, "step": 25031 }, { "epoch": 0.67, "learning_rate": 0.0005111718320730598, "loss": 3.005, "step": 25032 }, { "epoch": 0.67, "learning_rate": 0.0005110959026652112, "loss": 2.3841, "step": 25033 }, { "epoch": 0.67, "learning_rate": 0.000511019976961213, "loss": 2.0662, "step": 25034 }, { "epoch": 0.67, "learning_rate": 0.0005109440549616398, "loss": 2.4858, "step": 25035 }, { "epoch": 0.67, "learning_rate": 0.0005108681366670665, "loss": 2.4279, "step": 25036 }, { "epoch": 0.67, "learning_rate": 0.0005107922220780694, "loss": 2.4268, "step": 25037 }, { "epoch": 0.67, "learning_rate": 0.0005107163111952226, "loss": 2.8432, "step": 25038 }, { "epoch": 0.67, "learning_rate": 0.0005106404040191017, "loss": 3.1315, "step": 25039 }, { "epoch": 0.67, "learning_rate": 0.0005105645005502819, "loss": 2.7585, "step": 25040 }, { "epoch": 0.67, "learning_rate": 0.0005104886007893376, "loss": 2.754, "step": 25041 }, { "epoch": 0.67, "learning_rate": 0.0005104127047368441, "loss": 2.7372, "step": 25042 }, { "epoch": 0.67, "learning_rate": 0.0005103368123933764, "loss": 2.5436, "step": 25043 }, { "epoch": 0.67, "learning_rate": 0.0005102609237595095, "loss": 2.3359, "step": 25044 }, { "epoch": 0.67, "learning_rate": 0.0005101850388358187, "loss": 3.0284, "step": 25045 }, { "epoch": 0.67, "learning_rate": 0.000510109157622878, "loss": 2.4696, "step": 25046 }, { "epoch": 0.67, "learning_rate": 0.0005100332801212628, "loss": 2.4044, "step": 25047 }, { "epoch": 0.67, "learning_rate": 0.0005099574063315484, "loss": 2.4928, "step": 25048 }, { "epoch": 0.67, "learning_rate": 0.0005098815362543081, "loss": 2.2736, "step": 25049 }, { "epoch": 0.67, "learning_rate": 0.0005098056698901181, "loss": 2.3409, "step": 25050 }, { "epoch": 0.67, "learning_rate": 0.0005097298072395531, "loss": 2.3874, "step": 25051 }, { "epoch": 0.67, "learning_rate": 0.0005096539483031871, "loss": 2.4003, "step": 25052 }, { "epoch": 0.67, "learning_rate": 0.0005095780930815954, "loss": 2.434, "step": 25053 }, { "epoch": 0.67, "learning_rate": 0.0005095022415753521, "loss": 2.3124, "step": 25054 }, { "epoch": 0.67, "learning_rate": 0.000509426393785032, "loss": 2.5675, "step": 25055 }, { "epoch": 0.67, "learning_rate": 0.0005093505497112099, "loss": 2.5423, "step": 25056 }, { "epoch": 0.67, "learning_rate": 0.0005092747093544603, "loss": 2.6543, "step": 25057 }, { "epoch": 0.67, "learning_rate": 0.0005091988727153578, "loss": 2.4764, "step": 25058 }, { "epoch": 0.67, "learning_rate": 0.0005091230397944773, "loss": 2.6264, "step": 25059 }, { "epoch": 0.67, "learning_rate": 0.0005090472105923925, "loss": 2.4841, "step": 25060 }, { "epoch": 0.67, "learning_rate": 0.0005089713851096786, "loss": 2.5683, "step": 25061 }, { "epoch": 0.67, "learning_rate": 0.000508895563346909, "loss": 2.3473, "step": 25062 }, { "epoch": 0.67, "learning_rate": 0.0005088197453046591, "loss": 2.6201, "step": 25063 }, { "epoch": 0.67, "learning_rate": 0.0005087439309835035, "loss": 2.28, "step": 25064 }, { "epoch": 0.67, "learning_rate": 0.0005086681203840156, "loss": 2.5911, "step": 25065 }, { "epoch": 0.67, "learning_rate": 0.0005085923135067701, "loss": 2.3509, "step": 25066 }, { "epoch": 0.67, "learning_rate": 0.000508516510352342, "loss": 2.6091, "step": 25067 }, { "epoch": 0.67, "learning_rate": 0.0005084407109213043, "loss": 2.2064, "step": 25068 }, { "epoch": 0.67, "learning_rate": 0.000508364915214232, "loss": 2.75, "step": 25069 }, { "epoch": 0.67, "learning_rate": 0.000508289123231699, "loss": 1.9833, "step": 25070 }, { "epoch": 0.67, "learning_rate": 0.0005082133349742801, "loss": 2.1199, "step": 25071 }, { "epoch": 0.67, "learning_rate": 0.0005081375504425492, "loss": 2.2682, "step": 25072 }, { "epoch": 0.67, "learning_rate": 0.00050806176963708, "loss": 2.3992, "step": 25073 }, { "epoch": 0.67, "learning_rate": 0.0005079859925584466, "loss": 2.4746, "step": 25074 }, { "epoch": 0.67, "learning_rate": 0.0005079102192072235, "loss": 2.4587, "step": 25075 }, { "epoch": 0.67, "learning_rate": 0.0005078344495839848, "loss": 2.2072, "step": 25076 }, { "epoch": 0.67, "learning_rate": 0.0005077586836893046, "loss": 2.5584, "step": 25077 }, { "epoch": 0.67, "learning_rate": 0.0005076829215237561, "loss": 2.6379, "step": 25078 }, { "epoch": 0.67, "learning_rate": 0.0005076071630879139, "loss": 2.5546, "step": 25079 }, { "epoch": 0.67, "learning_rate": 0.0005075314083823521, "loss": 2.4844, "step": 25080 }, { "epoch": 0.67, "learning_rate": 0.000507455657407644, "loss": 2.3558, "step": 25081 }, { "epoch": 0.67, "learning_rate": 0.0005073799101643637, "loss": 2.5573, "step": 25082 }, { "epoch": 0.67, "learning_rate": 0.0005073041666530852, "loss": 2.2906, "step": 25083 }, { "epoch": 0.67, "learning_rate": 0.0005072284268743823, "loss": 2.37, "step": 25084 }, { "epoch": 0.67, "learning_rate": 0.0005071526908288287, "loss": 2.3199, "step": 25085 }, { "epoch": 0.67, "learning_rate": 0.0005070769585169984, "loss": 2.3451, "step": 25086 }, { "epoch": 0.67, "learning_rate": 0.0005070012299394647, "loss": 2.3816, "step": 25087 }, { "epoch": 0.67, "learning_rate": 0.0005069255050968016, "loss": 2.5708, "step": 25088 }, { "epoch": 0.67, "learning_rate": 0.0005068497839895826, "loss": 2.8032, "step": 25089 }, { "epoch": 0.67, "learning_rate": 0.0005067740666183816, "loss": 2.6996, "step": 25090 }, { "epoch": 0.67, "learning_rate": 0.0005066983529837723, "loss": 2.2188, "step": 25091 }, { "epoch": 0.67, "learning_rate": 0.0005066226430863279, "loss": 2.4116, "step": 25092 }, { "epoch": 0.67, "learning_rate": 0.000506546936926622, "loss": 2.7579, "step": 25093 }, { "epoch": 0.67, "learning_rate": 0.0005064712345052287, "loss": 2.2794, "step": 25094 }, { "epoch": 0.67, "learning_rate": 0.0005063955358227208, "loss": 2.4855, "step": 25095 }, { "epoch": 0.67, "learning_rate": 0.0005063198408796719, "loss": 2.3103, "step": 25096 }, { "epoch": 0.67, "learning_rate": 0.0005062441496766558, "loss": 2.3729, "step": 25097 }, { "epoch": 0.67, "learning_rate": 0.0005061684622142456, "loss": 2.539, "step": 25098 }, { "epoch": 0.67, "learning_rate": 0.0005060927784930154, "loss": 2.445, "step": 25099 }, { "epoch": 0.67, "learning_rate": 0.0005060170985135375, "loss": 2.3789, "step": 25100 }, { "epoch": 0.67, "learning_rate": 0.0005059414222763857, "loss": 2.7177, "step": 25101 }, { "epoch": 0.67, "learning_rate": 0.0005058657497821334, "loss": 2.4329, "step": 25102 }, { "epoch": 0.67, "learning_rate": 0.0005057900810313538, "loss": 2.7372, "step": 25103 }, { "epoch": 0.67, "learning_rate": 0.0005057144160246208, "loss": 2.8387, "step": 25104 }, { "epoch": 0.67, "learning_rate": 0.0005056387547625063, "loss": 2.7224, "step": 25105 }, { "epoch": 0.67, "learning_rate": 0.0005055630972455845, "loss": 2.0142, "step": 25106 }, { "epoch": 0.67, "learning_rate": 0.0005054874434744285, "loss": 2.6645, "step": 25107 }, { "epoch": 0.67, "learning_rate": 0.0005054117934496109, "loss": 2.1422, "step": 25108 }, { "epoch": 0.67, "learning_rate": 0.0005053361471717046, "loss": 2.7935, "step": 25109 }, { "epoch": 0.67, "learning_rate": 0.0005052605046412842, "loss": 2.5743, "step": 25110 }, { "epoch": 0.67, "learning_rate": 0.0005051848658589212, "loss": 2.4728, "step": 25111 }, { "epoch": 0.67, "learning_rate": 0.0005051092308251897, "loss": 2.6135, "step": 25112 }, { "epoch": 0.67, "learning_rate": 0.0005050335995406616, "loss": 2.3432, "step": 25113 }, { "epoch": 0.67, "learning_rate": 0.0005049579720059108, "loss": 2.8249, "step": 25114 }, { "epoch": 0.67, "learning_rate": 0.0005048823482215097, "loss": 1.7355, "step": 25115 }, { "epoch": 0.67, "learning_rate": 0.0005048067281880313, "loss": 2.5213, "step": 25116 }, { "epoch": 0.67, "learning_rate": 0.0005047311119060487, "loss": 2.5783, "step": 25117 }, { "epoch": 0.68, "learning_rate": 0.0005046554993761352, "loss": 2.973, "step": 25118 }, { "epoch": 0.68, "learning_rate": 0.0005045798905988625, "loss": 2.5967, "step": 25119 }, { "epoch": 0.68, "learning_rate": 0.000504504285574804, "loss": 2.1019, "step": 25120 }, { "epoch": 0.68, "learning_rate": 0.0005044286843045329, "loss": 2.8114, "step": 25121 }, { "epoch": 0.68, "learning_rate": 0.0005043530867886206, "loss": 2.6687, "step": 25122 }, { "epoch": 0.68, "learning_rate": 0.0005042774930276415, "loss": 2.2527, "step": 25123 }, { "epoch": 0.68, "learning_rate": 0.0005042019030221672, "loss": 2.5072, "step": 25124 }, { "epoch": 0.68, "learning_rate": 0.0005041263167727706, "loss": 2.4865, "step": 25125 }, { "epoch": 0.68, "learning_rate": 0.0005040507342800247, "loss": 2.0684, "step": 25126 }, { "epoch": 0.68, "learning_rate": 0.0005039751555445014, "loss": 2.4489, "step": 25127 }, { "epoch": 0.68, "learning_rate": 0.0005038995805667736, "loss": 2.9541, "step": 25128 }, { "epoch": 0.68, "learning_rate": 0.0005038240093474141, "loss": 2.5384, "step": 25129 }, { "epoch": 0.68, "learning_rate": 0.000503748441886995, "loss": 2.6788, "step": 25130 }, { "epoch": 0.68, "learning_rate": 0.0005036728781860894, "loss": 2.9708, "step": 25131 }, { "epoch": 0.68, "learning_rate": 0.0005035973182452688, "loss": 2.5417, "step": 25132 }, { "epoch": 0.68, "learning_rate": 0.0005035217620651065, "loss": 2.4685, "step": 25133 }, { "epoch": 0.68, "learning_rate": 0.0005034462096461747, "loss": 2.552, "step": 25134 }, { "epoch": 0.68, "learning_rate": 0.000503370660989045, "loss": 2.4752, "step": 25135 }, { "epoch": 0.68, "learning_rate": 0.0005032951160942908, "loss": 2.4561, "step": 25136 }, { "epoch": 0.68, "learning_rate": 0.0005032195749624843, "loss": 2.219, "step": 25137 }, { "epoch": 0.68, "learning_rate": 0.0005031440375941971, "loss": 2.6839, "step": 25138 }, { "epoch": 0.68, "learning_rate": 0.0005030685039900023, "loss": 2.2514, "step": 25139 }, { "epoch": 0.68, "learning_rate": 0.0005029929741504711, "loss": 2.1889, "step": 25140 }, { "epoch": 0.68, "learning_rate": 0.0005029174480761765, "loss": 2.4951, "step": 25141 }, { "epoch": 0.68, "learning_rate": 0.0005028419257676902, "loss": 2.3516, "step": 25142 }, { "epoch": 0.68, "learning_rate": 0.0005027664072255848, "loss": 2.6755, "step": 25143 }, { "epoch": 0.68, "learning_rate": 0.0005026908924504321, "loss": 2.7011, "step": 25144 }, { "epoch": 0.68, "learning_rate": 0.0005026153814428047, "loss": 2.8834, "step": 25145 }, { "epoch": 0.68, "learning_rate": 0.0005025398742032739, "loss": 2.9569, "step": 25146 }, { "epoch": 0.68, "learning_rate": 0.0005024643707324123, "loss": 2.2724, "step": 25147 }, { "epoch": 0.68, "learning_rate": 0.0005023888710307911, "loss": 2.4537, "step": 25148 }, { "epoch": 0.68, "learning_rate": 0.0005023133750989832, "loss": 2.5922, "step": 25149 }, { "epoch": 0.68, "learning_rate": 0.0005022378829375604, "loss": 2.8094, "step": 25150 }, { "epoch": 0.68, "learning_rate": 0.0005021623945470943, "loss": 2.3161, "step": 25151 }, { "epoch": 0.68, "learning_rate": 0.0005020869099281568, "loss": 2.4704, "step": 25152 }, { "epoch": 0.68, "learning_rate": 0.0005020114290813202, "loss": 2.8605, "step": 25153 }, { "epoch": 0.68, "learning_rate": 0.0005019359520071556, "loss": 2.47, "step": 25154 }, { "epoch": 0.68, "learning_rate": 0.000501860478706235, "loss": 2.2451, "step": 25155 }, { "epoch": 0.68, "learning_rate": 0.0005017850091791306, "loss": 2.2414, "step": 25156 }, { "epoch": 0.68, "learning_rate": 0.0005017095434264138, "loss": 2.3062, "step": 25157 }, { "epoch": 0.68, "learning_rate": 0.0005016340814486569, "loss": 2.0725, "step": 25158 }, { "epoch": 0.68, "learning_rate": 0.0005015586232464306, "loss": 2.163, "step": 25159 }, { "epoch": 0.68, "learning_rate": 0.0005014831688203071, "loss": 2.6453, "step": 25160 }, { "epoch": 0.68, "learning_rate": 0.0005014077181708579, "loss": 2.5307, "step": 25161 }, { "epoch": 0.68, "learning_rate": 0.0005013322712986548, "loss": 2.8671, "step": 25162 }, { "epoch": 0.68, "learning_rate": 0.0005012568282042693, "loss": 2.473, "step": 25163 }, { "epoch": 0.68, "learning_rate": 0.0005011813888882731, "loss": 2.1578, "step": 25164 }, { "epoch": 0.68, "learning_rate": 0.0005011059533512373, "loss": 2.4675, "step": 25165 }, { "epoch": 0.68, "learning_rate": 0.0005010305215937339, "loss": 2.417, "step": 25166 }, { "epoch": 0.68, "learning_rate": 0.0005009550936163337, "loss": 2.3185, "step": 25167 }, { "epoch": 0.68, "learning_rate": 0.0005008796694196085, "loss": 2.5181, "step": 25168 }, { "epoch": 0.68, "learning_rate": 0.0005008042490041298, "loss": 2.4978, "step": 25169 }, { "epoch": 0.68, "learning_rate": 0.0005007288323704686, "loss": 2.8139, "step": 25170 }, { "epoch": 0.68, "learning_rate": 0.0005006534195191967, "loss": 2.5102, "step": 25171 }, { "epoch": 0.68, "learning_rate": 0.0005005780104508856, "loss": 2.6094, "step": 25172 }, { "epoch": 0.68, "learning_rate": 0.0005005026051661057, "loss": 2.4968, "step": 25173 }, { "epoch": 0.68, "learning_rate": 0.0005004272036654289, "loss": 2.3972, "step": 25174 }, { "epoch": 0.68, "learning_rate": 0.0005003518059494263, "loss": 2.8088, "step": 25175 }, { "epoch": 0.68, "learning_rate": 0.0005002764120186689, "loss": 2.6361, "step": 25176 }, { "epoch": 0.68, "learning_rate": 0.0005002010218737287, "loss": 2.7425, "step": 25177 }, { "epoch": 0.68, "learning_rate": 0.0005001256355151756, "loss": 2.6537, "step": 25178 }, { "epoch": 0.68, "learning_rate": 0.0005000502529435814, "loss": 2.6879, "step": 25179 }, { "epoch": 0.68, "learning_rate": 0.0004999748741595175, "loss": 2.5005, "step": 25180 }, { "epoch": 0.68, "learning_rate": 0.0004998994991635537, "loss": 2.7877, "step": 25181 }, { "epoch": 0.68, "learning_rate": 0.0004998241279562627, "loss": 2.8392, "step": 25182 }, { "epoch": 0.68, "learning_rate": 0.0004997487605382144, "loss": 2.5275, "step": 25183 }, { "epoch": 0.68, "learning_rate": 0.0004996733969099799, "loss": 2.1364, "step": 25184 }, { "epoch": 0.68, "learning_rate": 0.0004995980370721308, "loss": 2.5771, "step": 25185 }, { "epoch": 0.68, "learning_rate": 0.0004995226810252371, "loss": 2.4674, "step": 25186 }, { "epoch": 0.68, "learning_rate": 0.0004994473287698701, "loss": 2.721, "step": 25187 }, { "epoch": 0.68, "learning_rate": 0.0004993719803066006, "loss": 2.8431, "step": 25188 }, { "epoch": 0.68, "learning_rate": 0.0004992966356359994, "loss": 2.2419, "step": 25189 }, { "epoch": 0.68, "learning_rate": 0.000499221294758638, "loss": 2.317, "step": 25190 }, { "epoch": 0.68, "learning_rate": 0.0004991459576750859, "loss": 2.4083, "step": 25191 }, { "epoch": 0.68, "learning_rate": 0.0004990706243859146, "loss": 2.9082, "step": 25192 }, { "epoch": 0.68, "learning_rate": 0.0004989952948916951, "loss": 2.6648, "step": 25193 }, { "epoch": 0.68, "learning_rate": 0.0004989199691929969, "loss": 2.5159, "step": 25194 }, { "epoch": 0.68, "learning_rate": 0.0004988446472903917, "loss": 2.7462, "step": 25195 }, { "epoch": 0.68, "learning_rate": 0.0004987693291844503, "loss": 2.6237, "step": 25196 }, { "epoch": 0.68, "learning_rate": 0.0004986940148757425, "loss": 2.5979, "step": 25197 }, { "epoch": 0.68, "learning_rate": 0.0004986187043648393, "loss": 2.4796, "step": 25198 }, { "epoch": 0.68, "learning_rate": 0.0004985433976523114, "loss": 2.4457, "step": 25199 }, { "epoch": 0.68, "learning_rate": 0.0004984680947387286, "loss": 2.6956, "step": 25200 }, { "epoch": 0.68, "learning_rate": 0.0004983927956246621, "loss": 3.0003, "step": 25201 }, { "epoch": 0.68, "learning_rate": 0.0004983175003106821, "loss": 2.1171, "step": 25202 }, { "epoch": 0.68, "learning_rate": 0.0004982422087973587, "loss": 2.8363, "step": 25203 }, { "epoch": 0.68, "learning_rate": 0.0004981669210852633, "loss": 2.6017, "step": 25204 }, { "epoch": 0.68, "learning_rate": 0.0004980916371749651, "loss": 2.6642, "step": 25205 }, { "epoch": 0.68, "learning_rate": 0.0004980163570670349, "loss": 2.5126, "step": 25206 }, { "epoch": 0.68, "learning_rate": 0.000497941080762043, "loss": 2.0588, "step": 25207 }, { "epoch": 0.68, "learning_rate": 0.0004978658082605598, "loss": 2.0964, "step": 25208 }, { "epoch": 0.68, "learning_rate": 0.0004977905395631559, "loss": 2.7034, "step": 25209 }, { "epoch": 0.68, "learning_rate": 0.0004977152746704006, "loss": 2.3705, "step": 25210 }, { "epoch": 0.68, "learning_rate": 0.0004976400135828646, "loss": 2.3952, "step": 25211 }, { "epoch": 0.68, "learning_rate": 0.0004975647563011184, "loss": 2.3404, "step": 25212 }, { "epoch": 0.68, "learning_rate": 0.0004974895028257315, "loss": 2.3607, "step": 25213 }, { "epoch": 0.68, "learning_rate": 0.0004974142531572742, "loss": 2.9639, "step": 25214 }, { "epoch": 0.68, "learning_rate": 0.0004973390072963166, "loss": 2.787, "step": 25215 }, { "epoch": 0.68, "learning_rate": 0.000497263765243429, "loss": 2.6766, "step": 25216 }, { "epoch": 0.68, "learning_rate": 0.0004971885269991815, "loss": 2.9952, "step": 25217 }, { "epoch": 0.68, "learning_rate": 0.0004971132925641434, "loss": 2.5362, "step": 25218 }, { "epoch": 0.68, "learning_rate": 0.0004970380619388851, "loss": 2.6473, "step": 25219 }, { "epoch": 0.68, "learning_rate": 0.0004969628351239767, "loss": 2.4929, "step": 25220 }, { "epoch": 0.68, "learning_rate": 0.0004968876121199877, "loss": 2.5374, "step": 25221 }, { "epoch": 0.68, "learning_rate": 0.0004968123929274883, "loss": 2.7482, "step": 25222 }, { "epoch": 0.68, "learning_rate": 0.0004967371775470486, "loss": 3.0598, "step": 25223 }, { "epoch": 0.68, "learning_rate": 0.0004966619659792377, "loss": 2.8161, "step": 25224 }, { "epoch": 0.68, "learning_rate": 0.0004965867582246261, "loss": 2.714, "step": 25225 }, { "epoch": 0.68, "learning_rate": 0.0004965115542837829, "loss": 2.3087, "step": 25226 }, { "epoch": 0.68, "learning_rate": 0.0004964363541572782, "loss": 1.9652, "step": 25227 }, { "epoch": 0.68, "learning_rate": 0.0004963611578456816, "loss": 2.3797, "step": 25228 }, { "epoch": 0.68, "learning_rate": 0.0004962859653495627, "loss": 2.8115, "step": 25229 }, { "epoch": 0.68, "learning_rate": 0.0004962107766694915, "loss": 2.103, "step": 25230 }, { "epoch": 0.68, "learning_rate": 0.0004961355918060376, "loss": 2.2529, "step": 25231 }, { "epoch": 0.68, "learning_rate": 0.00049606041075977, "loss": 2.4245, "step": 25232 }, { "epoch": 0.68, "learning_rate": 0.0004959852335312587, "loss": 2.312, "step": 25233 }, { "epoch": 0.68, "learning_rate": 0.0004959100601210732, "loss": 2.58, "step": 25234 }, { "epoch": 0.68, "learning_rate": 0.0004958348905297828, "loss": 2.8326, "step": 25235 }, { "epoch": 0.68, "learning_rate": 0.0004957597247579576, "loss": 2.662, "step": 25236 }, { "epoch": 0.68, "learning_rate": 0.0004956845628061663, "loss": 2.3899, "step": 25237 }, { "epoch": 0.68, "learning_rate": 0.0004956094046749785, "loss": 2.6389, "step": 25238 }, { "epoch": 0.68, "learning_rate": 0.0004955342503649641, "loss": 2.4546, "step": 25239 }, { "epoch": 0.68, "learning_rate": 0.0004954590998766915, "loss": 2.1737, "step": 25240 }, { "epoch": 0.68, "learning_rate": 0.0004953839532107302, "loss": 2.2268, "step": 25241 }, { "epoch": 0.68, "learning_rate": 0.0004953088103676508, "loss": 2.2906, "step": 25242 }, { "epoch": 0.68, "learning_rate": 0.0004952336713480211, "loss": 2.1088, "step": 25243 }, { "epoch": 0.68, "learning_rate": 0.0004951585361524112, "loss": 2.4668, "step": 25244 }, { "epoch": 0.68, "learning_rate": 0.0004950834047813897, "loss": 2.7488, "step": 25245 }, { "epoch": 0.68, "learning_rate": 0.000495008277235526, "loss": 2.9123, "step": 25246 }, { "epoch": 0.68, "learning_rate": 0.0004949331535153893, "loss": 2.5583, "step": 25247 }, { "epoch": 0.68, "learning_rate": 0.0004948580336215488, "loss": 2.7198, "step": 25248 }, { "epoch": 0.68, "learning_rate": 0.0004947829175545735, "loss": 2.5361, "step": 25249 }, { "epoch": 0.68, "learning_rate": 0.0004947078053150329, "loss": 2.1266, "step": 25250 }, { "epoch": 0.68, "learning_rate": 0.0004946326969034953, "loss": 2.3691, "step": 25251 }, { "epoch": 0.68, "learning_rate": 0.0004945575923205303, "loss": 2.3805, "step": 25252 }, { "epoch": 0.68, "learning_rate": 0.0004944824915667063, "loss": 2.3591, "step": 25253 }, { "epoch": 0.68, "learning_rate": 0.000494407394642592, "loss": 2.5555, "step": 25254 }, { "epoch": 0.68, "learning_rate": 0.0004943323015487577, "loss": 2.5474, "step": 25255 }, { "epoch": 0.68, "learning_rate": 0.0004942572122857712, "loss": 2.5184, "step": 25256 }, { "epoch": 0.68, "learning_rate": 0.0004941821268542018, "loss": 2.4683, "step": 25257 }, { "epoch": 0.68, "learning_rate": 0.0004941070452546183, "loss": 2.448, "step": 25258 }, { "epoch": 0.68, "learning_rate": 0.0004940319674875891, "loss": 2.5226, "step": 25259 }, { "epoch": 0.68, "learning_rate": 0.0004939568935536832, "loss": 2.0951, "step": 25260 }, { "epoch": 0.68, "learning_rate": 0.0004938818234534694, "loss": 2.665, "step": 25261 }, { "epoch": 0.68, "learning_rate": 0.0004938067571875165, "loss": 2.4771, "step": 25262 }, { "epoch": 0.68, "learning_rate": 0.0004937316947563934, "loss": 2.121, "step": 25263 }, { "epoch": 0.68, "learning_rate": 0.0004936566361606683, "loss": 2.5993, "step": 25264 }, { "epoch": 0.68, "learning_rate": 0.0004935815814009098, "loss": 2.0646, "step": 25265 }, { "epoch": 0.68, "learning_rate": 0.0004935065304776872, "loss": 2.4299, "step": 25266 }, { "epoch": 0.68, "learning_rate": 0.0004934314833915677, "loss": 2.7201, "step": 25267 }, { "epoch": 0.68, "learning_rate": 0.0004933564401431211, "loss": 2.5148, "step": 25268 }, { "epoch": 0.68, "learning_rate": 0.000493281400732916, "loss": 2.3837, "step": 25269 }, { "epoch": 0.68, "learning_rate": 0.0004932063651615199, "loss": 2.7659, "step": 25270 }, { "epoch": 0.68, "learning_rate": 0.0004931313334295023, "loss": 3.056, "step": 25271 }, { "epoch": 0.68, "learning_rate": 0.0004930563055374305, "loss": 2.3248, "step": 25272 }, { "epoch": 0.68, "learning_rate": 0.0004929812814858738, "loss": 2.5239, "step": 25273 }, { "epoch": 0.68, "learning_rate": 0.0004929062612754, "loss": 3.1125, "step": 25274 }, { "epoch": 0.68, "learning_rate": 0.0004928312449065779, "loss": 2.896, "step": 25275 }, { "epoch": 0.68, "learning_rate": 0.0004927562323799755, "loss": 2.6519, "step": 25276 }, { "epoch": 0.68, "learning_rate": 0.0004926812236961616, "loss": 2.76, "step": 25277 }, { "epoch": 0.68, "learning_rate": 0.0004926062188557036, "loss": 2.2607, "step": 25278 }, { "epoch": 0.68, "learning_rate": 0.0004925312178591706, "loss": 2.7158, "step": 25279 }, { "epoch": 0.68, "learning_rate": 0.0004924562207071297, "loss": 2.3571, "step": 25280 }, { "epoch": 0.68, "learning_rate": 0.00049238122740015, "loss": 2.9362, "step": 25281 }, { "epoch": 0.68, "learning_rate": 0.0004923062379387998, "loss": 2.8745, "step": 25282 }, { "epoch": 0.68, "learning_rate": 0.0004922312523236464, "loss": 2.6648, "step": 25283 }, { "epoch": 0.68, "learning_rate": 0.0004921562705552582, "loss": 2.451, "step": 25284 }, { "epoch": 0.68, "learning_rate": 0.0004920812926342038, "loss": 2.5427, "step": 25285 }, { "epoch": 0.68, "learning_rate": 0.0004920063185610502, "loss": 2.6892, "step": 25286 }, { "epoch": 0.68, "learning_rate": 0.000491931348336366, "loss": 2.4567, "step": 25287 }, { "epoch": 0.68, "learning_rate": 0.0004918563819607191, "loss": 2.4309, "step": 25288 }, { "epoch": 0.68, "learning_rate": 0.0004917814194346773, "loss": 2.5085, "step": 25289 }, { "epoch": 0.68, "learning_rate": 0.000491706460758809, "loss": 2.9722, "step": 25290 }, { "epoch": 0.68, "learning_rate": 0.0004916315059336812, "loss": 2.3374, "step": 25291 }, { "epoch": 0.68, "learning_rate": 0.0004915565549598624, "loss": 2.3483, "step": 25292 }, { "epoch": 0.68, "learning_rate": 0.0004914816078379202, "loss": 2.5189, "step": 25293 }, { "epoch": 0.68, "learning_rate": 0.0004914066645684224, "loss": 2.8152, "step": 25294 }, { "epoch": 0.68, "learning_rate": 0.0004913317251519371, "loss": 2.4756, "step": 25295 }, { "epoch": 0.68, "learning_rate": 0.0004912567895890314, "loss": 2.0028, "step": 25296 }, { "epoch": 0.68, "learning_rate": 0.0004911818578802734, "loss": 2.2777, "step": 25297 }, { "epoch": 0.68, "learning_rate": 0.000491106930026231, "loss": 2.5486, "step": 25298 }, { "epoch": 0.68, "learning_rate": 0.000491032006027471, "loss": 2.675, "step": 25299 }, { "epoch": 0.68, "learning_rate": 0.0004909570858845617, "loss": 1.9541, "step": 25300 }, { "epoch": 0.68, "learning_rate": 0.0004908821695980704, "loss": 2.0833, "step": 25301 }, { "epoch": 0.68, "learning_rate": 0.0004908072571685648, "loss": 2.7367, "step": 25302 }, { "epoch": 0.68, "learning_rate": 0.0004907323485966127, "loss": 2.0375, "step": 25303 }, { "epoch": 0.68, "learning_rate": 0.000490657443882781, "loss": 2.4333, "step": 25304 }, { "epoch": 0.68, "learning_rate": 0.0004905825430276374, "loss": 2.6733, "step": 25305 }, { "epoch": 0.68, "learning_rate": 0.0004905076460317493, "loss": 2.8356, "step": 25306 }, { "epoch": 0.68, "learning_rate": 0.0004904327528956843, "loss": 2.2367, "step": 25307 }, { "epoch": 0.68, "learning_rate": 0.0004903578636200097, "loss": 2.7381, "step": 25308 }, { "epoch": 0.68, "learning_rate": 0.0004902829782052931, "loss": 2.6093, "step": 25309 }, { "epoch": 0.68, "learning_rate": 0.0004902080966521012, "loss": 2.6437, "step": 25310 }, { "epoch": 0.68, "learning_rate": 0.0004901332189610016, "loss": 2.6839, "step": 25311 }, { "epoch": 0.68, "learning_rate": 0.0004900583451325619, "loss": 2.5213, "step": 25312 }, { "epoch": 0.68, "learning_rate": 0.0004899834751673487, "loss": 2.2414, "step": 25313 }, { "epoch": 0.68, "learning_rate": 0.0004899086090659295, "loss": 2.5773, "step": 25314 }, { "epoch": 0.68, "learning_rate": 0.0004898337468288714, "loss": 2.097, "step": 25315 }, { "epoch": 0.68, "learning_rate": 0.0004897588884567417, "loss": 2.7576, "step": 25316 }, { "epoch": 0.68, "learning_rate": 0.0004896840339501078, "loss": 2.647, "step": 25317 }, { "epoch": 0.68, "learning_rate": 0.0004896091833095361, "loss": 2.5651, "step": 25318 }, { "epoch": 0.68, "learning_rate": 0.0004895343365355939, "loss": 2.6242, "step": 25319 }, { "epoch": 0.68, "learning_rate": 0.0004894594936288483, "loss": 2.8316, "step": 25320 }, { "epoch": 0.68, "learning_rate": 0.0004893846545898664, "loss": 2.2917, "step": 25321 }, { "epoch": 0.68, "learning_rate": 0.0004893098194192154, "loss": 2.7039, "step": 25322 }, { "epoch": 0.68, "learning_rate": 0.0004892349881174615, "loss": 2.4186, "step": 25323 }, { "epoch": 0.68, "learning_rate": 0.000489160160685172, "loss": 2.4257, "step": 25324 }, { "epoch": 0.68, "learning_rate": 0.0004890853371229141, "loss": 2.4758, "step": 25325 }, { "epoch": 0.68, "learning_rate": 0.0004890105174312541, "loss": 2.5816, "step": 25326 }, { "epoch": 0.68, "learning_rate": 0.0004889357016107587, "loss": 2.6393, "step": 25327 }, { "epoch": 0.68, "learning_rate": 0.0004888608896619957, "loss": 2.3288, "step": 25328 }, { "epoch": 0.68, "learning_rate": 0.0004887860815855308, "loss": 3.0478, "step": 25329 }, { "epoch": 0.68, "learning_rate": 0.0004887112773819316, "loss": 2.4019, "step": 25330 }, { "epoch": 0.68, "learning_rate": 0.0004886364770517641, "loss": 2.6269, "step": 25331 }, { "epoch": 0.68, "learning_rate": 0.0004885616805955952, "loss": 2.3947, "step": 25332 }, { "epoch": 0.68, "learning_rate": 0.0004884868880139914, "loss": 2.4385, "step": 25333 }, { "epoch": 0.68, "learning_rate": 0.0004884120993075195, "loss": 2.9522, "step": 25334 }, { "epoch": 0.68, "learning_rate": 0.0004883373144767462, "loss": 2.6642, "step": 25335 }, { "epoch": 0.68, "learning_rate": 0.00048826253352223827, "loss": 2.3164, "step": 25336 }, { "epoch": 0.68, "learning_rate": 0.00048818775644456146, "loss": 3.2854, "step": 25337 }, { "epoch": 0.68, "learning_rate": 0.0004881129832442832, "loss": 2.317, "step": 25338 }, { "epoch": 0.68, "learning_rate": 0.000488038213921969, "loss": 2.7092, "step": 25339 }, { "epoch": 0.68, "learning_rate": 0.0004879634484781853, "loss": 2.3332, "step": 25340 }, { "epoch": 0.68, "learning_rate": 0.00048788868691349984, "loss": 2.0061, "step": 25341 }, { "epoch": 0.68, "learning_rate": 0.0004878139292284778, "loss": 2.7034, "step": 25342 }, { "epoch": 0.68, "learning_rate": 0.0004877391754236857, "loss": 2.4042, "step": 25343 }, { "epoch": 0.68, "learning_rate": 0.0004876644254996906, "loss": 2.2694, "step": 25344 }, { "epoch": 0.68, "learning_rate": 0.0004875896794570577, "loss": 2.2763, "step": 25345 }, { "epoch": 0.68, "learning_rate": 0.00048751493729635374, "loss": 2.0906, "step": 25346 }, { "epoch": 0.68, "learning_rate": 0.00048744019901814507, "loss": 2.2697, "step": 25347 }, { "epoch": 0.68, "learning_rate": 0.0004873654646229978, "loss": 2.3635, "step": 25348 }, { "epoch": 0.68, "learning_rate": 0.0004872907341114785, "loss": 2.521, "step": 25349 }, { "epoch": 0.68, "learning_rate": 0.0004872160074841526, "loss": 2.3991, "step": 25350 }, { "epoch": 0.68, "learning_rate": 0.0004871412847415865, "loss": 2.0597, "step": 25351 }, { "epoch": 0.68, "learning_rate": 0.0004870665658843464, "loss": 2.5649, "step": 25352 }, { "epoch": 0.68, "learning_rate": 0.00048699185091299825, "loss": 2.5174, "step": 25353 }, { "epoch": 0.68, "learning_rate": 0.00048691713982810804, "loss": 2.6219, "step": 25354 }, { "epoch": 0.68, "learning_rate": 0.0004868424326302423, "loss": 2.3244, "step": 25355 }, { "epoch": 0.68, "learning_rate": 0.00048676772931996616, "loss": 2.7887, "step": 25356 }, { "epoch": 0.68, "learning_rate": 0.00048669302989784636, "loss": 2.2076, "step": 25357 }, { "epoch": 0.68, "learning_rate": 0.00048661833436444804, "loss": 2.1318, "step": 25358 }, { "epoch": 0.68, "learning_rate": 0.0004865436427203374, "loss": 1.9164, "step": 25359 }, { "epoch": 0.68, "learning_rate": 0.0004864689549660802, "loss": 2.8544, "step": 25360 }, { "epoch": 0.68, "learning_rate": 0.00048639427110224256, "loss": 3.0749, "step": 25361 }, { "epoch": 0.68, "learning_rate": 0.00048631959112938993, "loss": 2.3487, "step": 25362 }, { "epoch": 0.68, "learning_rate": 0.0004862449150480888, "loss": 2.5388, "step": 25363 }, { "epoch": 0.68, "learning_rate": 0.0004861702428589039, "loss": 2.3954, "step": 25364 }, { "epoch": 0.68, "learning_rate": 0.00048609557456240126, "loss": 2.2158, "step": 25365 }, { "epoch": 0.68, "learning_rate": 0.0004860209101591468, "loss": 2.5698, "step": 25366 }, { "epoch": 0.68, "learning_rate": 0.00048594624964970603, "loss": 2.5095, "step": 25367 }, { "epoch": 0.68, "learning_rate": 0.0004858715930346449, "loss": 2.8837, "step": 25368 }, { "epoch": 0.68, "learning_rate": 0.00048579694031452826, "loss": 2.316, "step": 25369 }, { "epoch": 0.68, "learning_rate": 0.0004857222914899222, "loss": 2.5353, "step": 25370 }, { "epoch": 0.68, "learning_rate": 0.0004856476465613924, "loss": 3.031, "step": 25371 }, { "epoch": 0.68, "learning_rate": 0.00048557300552950366, "loss": 2.539, "step": 25372 }, { "epoch": 0.68, "learning_rate": 0.00048549836839482187, "loss": 2.5608, "step": 25373 }, { "epoch": 0.68, "learning_rate": 0.0004854237351579125, "loss": 2.574, "step": 25374 }, { "epoch": 0.68, "learning_rate": 0.0004853491058193409, "loss": 2.8928, "step": 25375 }, { "epoch": 0.68, "learning_rate": 0.00048527448037967284, "loss": 2.4068, "step": 25376 }, { "epoch": 0.68, "learning_rate": 0.0004851998588394729, "loss": 2.7707, "step": 25377 }, { "epoch": 0.68, "learning_rate": 0.00048512524119930677, "loss": 2.0952, "step": 25378 }, { "epoch": 0.68, "learning_rate": 0.0004850506274597398, "loss": 2.3295, "step": 25379 }, { "epoch": 0.68, "learning_rate": 0.00048497601762133725, "loss": 2.1699, "step": 25380 }, { "epoch": 0.68, "learning_rate": 0.00048490141168466426, "loss": 2.5258, "step": 25381 }, { "epoch": 0.68, "learning_rate": 0.0004848268096502865, "loss": 2.9098, "step": 25382 }, { "epoch": 0.68, "learning_rate": 0.00048475221151876834, "loss": 2.1105, "step": 25383 }, { "epoch": 0.68, "learning_rate": 0.0004846776172906757, "loss": 2.16, "step": 25384 }, { "epoch": 0.68, "learning_rate": 0.00048460302696657286, "loss": 2.4475, "step": 25385 }, { "epoch": 0.68, "learning_rate": 0.00048452844054702504, "loss": 2.6703, "step": 25386 }, { "epoch": 0.68, "learning_rate": 0.00048445385803259824, "loss": 2.7723, "step": 25387 }, { "epoch": 0.68, "learning_rate": 0.0004843792794238566, "loss": 2.521, "step": 25388 }, { "epoch": 0.68, "learning_rate": 0.0004843047047213652, "loss": 2.0956, "step": 25389 }, { "epoch": 0.68, "learning_rate": 0.0004842301339256897, "loss": 2.3456, "step": 25390 }, { "epoch": 0.68, "learning_rate": 0.00048415556703739404, "loss": 2.4175, "step": 25391 }, { "epoch": 0.68, "learning_rate": 0.0004840810040570436, "loss": 2.8731, "step": 25392 }, { "epoch": 0.68, "learning_rate": 0.0004840064449852032, "loss": 2.5642, "step": 25393 }, { "epoch": 0.68, "learning_rate": 0.00048393188982243774, "loss": 2.523, "step": 25394 }, { "epoch": 0.68, "learning_rate": 0.00048385733856931237, "loss": 2.4023, "step": 25395 }, { "epoch": 0.68, "learning_rate": 0.00048378279122639114, "loss": 2.6243, "step": 25396 }, { "epoch": 0.68, "learning_rate": 0.0004837082477942393, "loss": 2.6969, "step": 25397 }, { "epoch": 0.68, "learning_rate": 0.0004836337082734218, "loss": 2.2709, "step": 25398 }, { "epoch": 0.68, "learning_rate": 0.0004835591726645021, "loss": 2.2015, "step": 25399 }, { "epoch": 0.68, "learning_rate": 0.00048348464096804666, "loss": 2.0893, "step": 25400 }, { "epoch": 0.68, "learning_rate": 0.00048341011318461894, "loss": 2.6917, "step": 25401 }, { "epoch": 0.68, "learning_rate": 0.0004833355893147837, "loss": 2.5569, "step": 25402 }, { "epoch": 0.68, "learning_rate": 0.0004832610693591062, "loss": 2.9275, "step": 25403 }, { "epoch": 0.68, "learning_rate": 0.00048318655331814985, "loss": 2.5067, "step": 25404 }, { "epoch": 0.68, "learning_rate": 0.00048311204119248, "loss": 2.0584, "step": 25405 }, { "epoch": 0.68, "learning_rate": 0.00048303753298266084, "loss": 2.1331, "step": 25406 }, { "epoch": 0.68, "learning_rate": 0.0004829630286892568, "loss": 3.1678, "step": 25407 }, { "epoch": 0.68, "learning_rate": 0.00048288852831283294, "loss": 2.1302, "step": 25408 }, { "epoch": 0.68, "learning_rate": 0.00048281403185395266, "loss": 2.3564, "step": 25409 }, { "epoch": 0.68, "learning_rate": 0.0004827395393131809, "loss": 2.8168, "step": 25410 }, { "epoch": 0.68, "learning_rate": 0.00048266505069108226, "loss": 2.5937, "step": 25411 }, { "epoch": 0.68, "learning_rate": 0.0004825905659882199, "loss": 2.7164, "step": 25412 }, { "epoch": 0.68, "learning_rate": 0.00048251608520515933, "loss": 2.2276, "step": 25413 }, { "epoch": 0.68, "learning_rate": 0.00048244160834246474, "loss": 2.4604, "step": 25414 }, { "epoch": 0.68, "learning_rate": 0.00048236713540069964, "loss": 2.381, "step": 25415 }, { "epoch": 0.68, "learning_rate": 0.0004822926663804286, "loss": 2.7367, "step": 25416 }, { "epoch": 0.68, "learning_rate": 0.00048221820128221607, "loss": 2.8478, "step": 25417 }, { "epoch": 0.68, "learning_rate": 0.00048214374010662554, "loss": 2.4854, "step": 25418 }, { "epoch": 0.68, "learning_rate": 0.00048206928285422134, "loss": 2.326, "step": 25419 }, { "epoch": 0.68, "learning_rate": 0.00048199482952556783, "loss": 2.5636, "step": 25420 }, { "epoch": 0.68, "learning_rate": 0.00048192038012122876, "loss": 2.4735, "step": 25421 }, { "epoch": 0.68, "learning_rate": 0.0004818459346417687, "loss": 2.5183, "step": 25422 }, { "epoch": 0.68, "learning_rate": 0.0004817714930877508, "loss": 2.2969, "step": 25423 }, { "epoch": 0.68, "learning_rate": 0.0004816970554597394, "loss": 2.8177, "step": 25424 }, { "epoch": 0.68, "learning_rate": 0.0004816226217582985, "loss": 2.2865, "step": 25425 }, { "epoch": 0.68, "learning_rate": 0.0004815481919839919, "loss": 2.4412, "step": 25426 }, { "epoch": 0.68, "learning_rate": 0.0004814737661373839, "loss": 2.6815, "step": 25427 }, { "epoch": 0.68, "learning_rate": 0.00048139934421903764, "loss": 2.6143, "step": 25428 }, { "epoch": 0.68, "learning_rate": 0.00048132492622951717, "loss": 2.6787, "step": 25429 }, { "epoch": 0.68, "learning_rate": 0.00048125051216938667, "loss": 2.0738, "step": 25430 }, { "epoch": 0.68, "learning_rate": 0.00048117610203920926, "loss": 3.0029, "step": 25431 }, { "epoch": 0.68, "learning_rate": 0.0004811016958395488, "loss": 2.7291, "step": 25432 }, { "epoch": 0.68, "learning_rate": 0.0004810272935709692, "loss": 2.5166, "step": 25433 }, { "epoch": 0.68, "learning_rate": 0.0004809528952340341, "loss": 2.7749, "step": 25434 }, { "epoch": 0.68, "learning_rate": 0.0004808785008293074, "loss": 1.84, "step": 25435 }, { "epoch": 0.68, "learning_rate": 0.00048080411035735193, "loss": 2.5038, "step": 25436 }, { "epoch": 0.68, "learning_rate": 0.0004807297238187317, "loss": 2.4834, "step": 25437 }, { "epoch": 0.68, "learning_rate": 0.00048065534121401036, "loss": 2.6049, "step": 25438 }, { "epoch": 0.68, "learning_rate": 0.0004805809625437512, "loss": 2.3, "step": 25439 }, { "epoch": 0.68, "learning_rate": 0.00048050658780851785, "loss": 2.6952, "step": 25440 }, { "epoch": 0.68, "learning_rate": 0.00048043221700887407, "loss": 2.346, "step": 25441 }, { "epoch": 0.68, "learning_rate": 0.0004803578501453826, "loss": 2.4787, "step": 25442 }, { "epoch": 0.68, "learning_rate": 0.0004802834872186075, "loss": 2.7982, "step": 25443 }, { "epoch": 0.68, "learning_rate": 0.00048020912822911135, "loss": 1.9361, "step": 25444 }, { "epoch": 0.68, "learning_rate": 0.0004801347731774579, "loss": 2.597, "step": 25445 }, { "epoch": 0.68, "learning_rate": 0.00048006042206421055, "loss": 2.7145, "step": 25446 }, { "epoch": 0.68, "learning_rate": 0.00047998607488993253, "loss": 2.4013, "step": 25447 }, { "epoch": 0.68, "learning_rate": 0.00047991173165518687, "loss": 2.4089, "step": 25448 }, { "epoch": 0.68, "learning_rate": 0.00047983739236053745, "loss": 2.8245, "step": 25449 }, { "epoch": 0.68, "learning_rate": 0.00047976305700654653, "loss": 2.9051, "step": 25450 }, { "epoch": 0.68, "learning_rate": 0.00047968872559377775, "loss": 2.4536, "step": 25451 }, { "epoch": 0.68, "learning_rate": 0.00047961439812279407, "loss": 2.3427, "step": 25452 }, { "epoch": 0.68, "learning_rate": 0.00047954007459415874, "loss": 1.9177, "step": 25453 }, { "epoch": 0.68, "learning_rate": 0.00047946575500843505, "loss": 2.3868, "step": 25454 }, { "epoch": 0.68, "learning_rate": 0.00047939143936618543, "loss": 2.7352, "step": 25455 }, { "epoch": 0.68, "learning_rate": 0.0004793171276679732, "loss": 2.7301, "step": 25456 }, { "epoch": 0.68, "learning_rate": 0.00047924281991436167, "loss": 2.098, "step": 25457 }, { "epoch": 0.68, "learning_rate": 0.00047916851610591303, "loss": 2.704, "step": 25458 }, { "epoch": 0.68, "learning_rate": 0.0004790942162431903, "loss": 2.5395, "step": 25459 }, { "epoch": 0.68, "learning_rate": 0.00047901992032675736, "loss": 2.6616, "step": 25460 }, { "epoch": 0.68, "learning_rate": 0.0004789456283571759, "loss": 2.3057, "step": 25461 }, { "epoch": 0.68, "learning_rate": 0.00047887134033500965, "loss": 2.3616, "step": 25462 }, { "epoch": 0.68, "learning_rate": 0.0004787970562608206, "loss": 2.5847, "step": 25463 }, { "epoch": 0.68, "learning_rate": 0.0004787227761351719, "loss": 2.4062, "step": 25464 }, { "epoch": 0.68, "learning_rate": 0.00047864849995862623, "loss": 2.9332, "step": 25465 }, { "epoch": 0.68, "learning_rate": 0.0004785742277317463, "loss": 2.2855, "step": 25466 }, { "epoch": 0.68, "learning_rate": 0.0004784999594550947, "loss": 1.9905, "step": 25467 }, { "epoch": 0.68, "learning_rate": 0.0004784256951292347, "loss": 2.1839, "step": 25468 }, { "epoch": 0.68, "learning_rate": 0.000478351434754728, "loss": 2.4834, "step": 25469 }, { "epoch": 0.68, "learning_rate": 0.0004782771783321379, "loss": 2.6967, "step": 25470 }, { "epoch": 0.68, "learning_rate": 0.0004782029258620262, "loss": 2.4929, "step": 25471 }, { "epoch": 0.68, "learning_rate": 0.0004781286773449556, "loss": 2.2117, "step": 25472 }, { "epoch": 0.68, "learning_rate": 0.0004780544327814894, "loss": 2.4054, "step": 25473 }, { "epoch": 0.68, "learning_rate": 0.00047798019217218927, "loss": 2.7457, "step": 25474 }, { "epoch": 0.68, "learning_rate": 0.0004779059555176178, "loss": 2.8216, "step": 25475 }, { "epoch": 0.68, "learning_rate": 0.00047783172281833797, "loss": 2.5684, "step": 25476 }, { "epoch": 0.68, "learning_rate": 0.00047775749407491107, "loss": 2.3689, "step": 25477 }, { "epoch": 0.68, "learning_rate": 0.0004776832692879002, "loss": 2.4606, "step": 25478 }, { "epoch": 0.68, "learning_rate": 0.0004776090484578675, "loss": 2.2351, "step": 25479 }, { "epoch": 0.68, "learning_rate": 0.00047753483158537516, "loss": 2.7035, "step": 25480 }, { "epoch": 0.68, "learning_rate": 0.000477460618670986, "loss": 2.5622, "step": 25481 }, { "epoch": 0.68, "learning_rate": 0.0004773864097152613, "loss": 2.5125, "step": 25482 }, { "epoch": 0.68, "learning_rate": 0.0004773122047187638, "loss": 2.4234, "step": 25483 }, { "epoch": 0.68, "learning_rate": 0.00047723800368205585, "loss": 2.2778, "step": 25484 }, { "epoch": 0.68, "learning_rate": 0.0004771638066056987, "loss": 2.4903, "step": 25485 }, { "epoch": 0.68, "learning_rate": 0.0004770896134902558, "loss": 2.4245, "step": 25486 }, { "epoch": 0.68, "learning_rate": 0.00047701542433628807, "loss": 2.5249, "step": 25487 }, { "epoch": 0.68, "learning_rate": 0.00047694123914435806, "loss": 2.7173, "step": 25488 }, { "epoch": 0.68, "learning_rate": 0.00047686705791502804, "loss": 2.5015, "step": 25489 }, { "epoch": 0.69, "learning_rate": 0.0004767928806488593, "loss": 2.3325, "step": 25490 }, { "epoch": 0.69, "learning_rate": 0.0004767187073464141, "loss": 2.4875, "step": 25491 }, { "epoch": 0.69, "learning_rate": 0.00047664453800825446, "loss": 2.285, "step": 25492 }, { "epoch": 0.69, "learning_rate": 0.00047657037263494216, "loss": 2.4971, "step": 25493 }, { "epoch": 0.69, "learning_rate": 0.00047649621122703925, "loss": 2.5819, "step": 25494 }, { "epoch": 0.69, "learning_rate": 0.0004764220537851078, "loss": 2.6525, "step": 25495 }, { "epoch": 0.69, "learning_rate": 0.00047634790030970885, "loss": 2.4562, "step": 25496 }, { "epoch": 0.69, "learning_rate": 0.00047627375080140503, "loss": 2.4912, "step": 25497 }, { "epoch": 0.69, "learning_rate": 0.0004761996052607569, "loss": 2.3489, "step": 25498 }, { "epoch": 0.69, "learning_rate": 0.0004761254636883272, "loss": 2.557, "step": 25499 }, { "epoch": 0.69, "learning_rate": 0.0004760513260846777, "loss": 2.4057, "step": 25500 }, { "epoch": 0.69, "learning_rate": 0.00047597719245036943, "loss": 2.6373, "step": 25501 }, { "epoch": 0.69, "learning_rate": 0.00047590306278596416, "loss": 2.5794, "step": 25502 }, { "epoch": 0.69, "learning_rate": 0.0004758289370920239, "loss": 2.5884, "step": 25503 }, { "epoch": 0.69, "learning_rate": 0.0004757548153691097, "loss": 2.5793, "step": 25504 }, { "epoch": 0.69, "learning_rate": 0.00047568069761778323, "loss": 2.4775, "step": 25505 }, { "epoch": 0.69, "learning_rate": 0.000475606583838606, "loss": 2.6368, "step": 25506 }, { "epoch": 0.69, "learning_rate": 0.0004755324740321395, "loss": 2.7018, "step": 25507 }, { "epoch": 0.69, "learning_rate": 0.0004754583681989456, "loss": 2.7436, "step": 25508 }, { "epoch": 0.69, "learning_rate": 0.00047538426633958507, "loss": 2.189, "step": 25509 }, { "epoch": 0.69, "learning_rate": 0.0004753101684546195, "loss": 2.4872, "step": 25510 }, { "epoch": 0.69, "learning_rate": 0.00047523607454461026, "loss": 2.6407, "step": 25511 }, { "epoch": 0.69, "learning_rate": 0.00047516198461011863, "loss": 2.7156, "step": 25512 }, { "epoch": 0.69, "learning_rate": 0.00047508789865170645, "loss": 2.3227, "step": 25513 }, { "epoch": 0.69, "learning_rate": 0.00047501381666993403, "loss": 2.5695, "step": 25514 }, { "epoch": 0.69, "learning_rate": 0.0004749397386653632, "loss": 2.5541, "step": 25515 }, { "epoch": 0.69, "learning_rate": 0.0004748656646385554, "loss": 2.5441, "step": 25516 }, { "epoch": 0.69, "learning_rate": 0.00047479159459007093, "loss": 2.716, "step": 25517 }, { "epoch": 0.69, "learning_rate": 0.00047471752852047125, "loss": 2.118, "step": 25518 }, { "epoch": 0.69, "learning_rate": 0.0004746434664303183, "loss": 2.1741, "step": 25519 }, { "epoch": 0.69, "learning_rate": 0.00047456940832017215, "loss": 2.4777, "step": 25520 }, { "epoch": 0.69, "learning_rate": 0.0004744953541905946, "loss": 2.3324, "step": 25521 }, { "epoch": 0.69, "learning_rate": 0.0004744213040421459, "loss": 2.3298, "step": 25522 }, { "epoch": 0.69, "learning_rate": 0.00047434725787538746, "loss": 2.7526, "step": 25523 }, { "epoch": 0.69, "learning_rate": 0.00047427321569088024, "loss": 2.3315, "step": 25524 }, { "epoch": 0.69, "learning_rate": 0.00047419917748918515, "loss": 2.79, "step": 25525 }, { "epoch": 0.69, "learning_rate": 0.0004741251432708631, "loss": 2.2154, "step": 25526 }, { "epoch": 0.69, "learning_rate": 0.0004740511130364753, "loss": 2.4704, "step": 25527 }, { "epoch": 0.69, "learning_rate": 0.0004739770867865818, "loss": 2.1715, "step": 25528 }, { "epoch": 0.69, "learning_rate": 0.0004739030645217439, "loss": 2.3918, "step": 25529 }, { "epoch": 0.69, "learning_rate": 0.00047382904624252277, "loss": 2.1001, "step": 25530 }, { "epoch": 0.69, "learning_rate": 0.0004737550319494779, "loss": 2.3359, "step": 25531 }, { "epoch": 0.69, "learning_rate": 0.0004736810216431715, "loss": 2.4827, "step": 25532 }, { "epoch": 0.69, "learning_rate": 0.0004736070153241633, "loss": 2.0479, "step": 25533 }, { "epoch": 0.69, "learning_rate": 0.0004735330129930142, "loss": 2.5043, "step": 25534 }, { "epoch": 0.69, "learning_rate": 0.0004734590146502853, "loss": 2.6407, "step": 25535 }, { "epoch": 0.69, "learning_rate": 0.0004733850202965364, "loss": 2.4457, "step": 25536 }, { "epoch": 0.69, "learning_rate": 0.00047331102993232834, "loss": 2.6707, "step": 25537 }, { "epoch": 0.69, "learning_rate": 0.00047323704355822186, "loss": 2.7234, "step": 25538 }, { "epoch": 0.69, "learning_rate": 0.00047316306117477724, "loss": 2.7514, "step": 25539 }, { "epoch": 0.69, "learning_rate": 0.0004730890827825556, "loss": 2.3346, "step": 25540 }, { "epoch": 0.69, "learning_rate": 0.00047301510838211635, "loss": 2.398, "step": 25541 }, { "epoch": 0.69, "learning_rate": 0.0004729411379740205, "loss": 2.2142, "step": 25542 }, { "epoch": 0.69, "learning_rate": 0.00047286717155882875, "loss": 2.2629, "step": 25543 }, { "epoch": 0.69, "learning_rate": 0.0004727932091371003, "loss": 2.4459, "step": 25544 }, { "epoch": 0.69, "learning_rate": 0.0004727192507093966, "loss": 2.7261, "step": 25545 }, { "epoch": 0.69, "learning_rate": 0.0004726452962762779, "loss": 2.7397, "step": 25546 }, { "epoch": 0.69, "learning_rate": 0.000472571345838304, "loss": 2.5074, "step": 25547 }, { "epoch": 0.69, "learning_rate": 0.0004724973993960354, "loss": 2.5579, "step": 25548 }, { "epoch": 0.69, "learning_rate": 0.000472423456950032, "loss": 2.4001, "step": 25549 }, { "epoch": 0.69, "learning_rate": 0.00047234951850085407, "loss": 2.8202, "step": 25550 }, { "epoch": 0.69, "learning_rate": 0.0004722755840490619, "loss": 2.6449, "step": 25551 }, { "epoch": 0.69, "learning_rate": 0.0004722016535952155, "loss": 2.7603, "step": 25552 }, { "epoch": 0.69, "learning_rate": 0.0004721277271398751, "loss": 2.8446, "step": 25553 }, { "epoch": 0.69, "learning_rate": 0.00047205380468360095, "loss": 2.8631, "step": 25554 }, { "epoch": 0.69, "learning_rate": 0.0004719798862269524, "loss": 2.2736, "step": 25555 }, { "epoch": 0.69, "learning_rate": 0.0004719059717704903, "loss": 2.5275, "step": 25556 }, { "epoch": 0.69, "learning_rate": 0.0004718320613147733, "loss": 2.2069, "step": 25557 }, { "epoch": 0.69, "learning_rate": 0.00047175815486036267, "loss": 2.7067, "step": 25558 }, { "epoch": 0.69, "learning_rate": 0.0004716842524078181, "loss": 2.3987, "step": 25559 }, { "epoch": 0.69, "learning_rate": 0.0004716103539576988, "loss": 2.3279, "step": 25560 }, { "epoch": 0.69, "learning_rate": 0.000471536459510565, "loss": 2.8589, "step": 25561 }, { "epoch": 0.69, "learning_rate": 0.00047146256906697694, "loss": 2.5296, "step": 25562 }, { "epoch": 0.69, "learning_rate": 0.0004713886826274936, "loss": 2.5024, "step": 25563 }, { "epoch": 0.69, "learning_rate": 0.00047131480019267505, "loss": 2.7029, "step": 25564 }, { "epoch": 0.69, "learning_rate": 0.00047124092176308095, "loss": 2.5804, "step": 25565 }, { "epoch": 0.69, "learning_rate": 0.00047116704733927116, "loss": 2.335, "step": 25566 }, { "epoch": 0.69, "learning_rate": 0.0004710931769218058, "loss": 2.4637, "step": 25567 }, { "epoch": 0.69, "learning_rate": 0.0004710193105112434, "loss": 1.9712, "step": 25568 }, { "epoch": 0.69, "learning_rate": 0.0004709454481081442, "loss": 2.3745, "step": 25569 }, { "epoch": 0.69, "learning_rate": 0.00047087158971306764, "loss": 2.3869, "step": 25570 }, { "epoch": 0.69, "learning_rate": 0.00047079773532657346, "loss": 2.354, "step": 25571 }, { "epoch": 0.69, "learning_rate": 0.00047072388494922093, "loss": 2.666, "step": 25572 }, { "epoch": 0.69, "learning_rate": 0.00047065003858157, "loss": 2.2512, "step": 25573 }, { "epoch": 0.69, "learning_rate": 0.0004705761962241794, "loss": 2.4584, "step": 25574 }, { "epoch": 0.69, "learning_rate": 0.0004705023578776092, "loss": 2.8122, "step": 25575 }, { "epoch": 0.69, "learning_rate": 0.0004704285235424182, "loss": 2.3749, "step": 25576 }, { "epoch": 0.69, "learning_rate": 0.0004703546932191659, "loss": 2.652, "step": 25577 }, { "epoch": 0.69, "learning_rate": 0.00047028086690841176, "loss": 2.2536, "step": 25578 }, { "epoch": 0.69, "learning_rate": 0.0004702070446107152, "loss": 2.8589, "step": 25579 }, { "epoch": 0.69, "learning_rate": 0.00047013322632663524, "loss": 2.6584, "step": 25580 }, { "epoch": 0.69, "learning_rate": 0.00047005941205673167, "loss": 2.4174, "step": 25581 }, { "epoch": 0.69, "learning_rate": 0.0004699856018015628, "loss": 2.3817, "step": 25582 }, { "epoch": 0.69, "learning_rate": 0.0004699117955616883, "loss": 2.3258, "step": 25583 }, { "epoch": 0.69, "learning_rate": 0.0004698379933376672, "loss": 2.1542, "step": 25584 }, { "epoch": 0.69, "learning_rate": 0.00046976419513005877, "loss": 2.3602, "step": 25585 }, { "epoch": 0.69, "learning_rate": 0.00046969040093942227, "loss": 2.8263, "step": 25586 }, { "epoch": 0.69, "learning_rate": 0.0004696166107663162, "loss": 2.4078, "step": 25587 }, { "epoch": 0.69, "learning_rate": 0.0004695428246112998, "loss": 2.4998, "step": 25588 }, { "epoch": 0.69, "learning_rate": 0.0004694690424749326, "loss": 2.7735, "step": 25589 }, { "epoch": 0.69, "learning_rate": 0.0004693952643577727, "loss": 2.4939, "step": 25590 }, { "epoch": 0.69, "learning_rate": 0.0004693214902603793, "loss": 2.1105, "step": 25591 }, { "epoch": 0.69, "learning_rate": 0.00046924772018331153, "loss": 2.5668, "step": 25592 }, { "epoch": 0.69, "learning_rate": 0.00046917395412712803, "loss": 2.8695, "step": 25593 }, { "epoch": 0.69, "learning_rate": 0.0004691001920923882, "loss": 2.9822, "step": 25594 }, { "epoch": 0.69, "learning_rate": 0.00046902643407964993, "loss": 2.474, "step": 25595 }, { "epoch": 0.69, "learning_rate": 0.00046895268008947255, "loss": 2.0684, "step": 25596 }, { "epoch": 0.69, "learning_rate": 0.0004688789301224148, "loss": 2.5726, "step": 25597 }, { "epoch": 0.69, "learning_rate": 0.0004688051841790352, "loss": 2.231, "step": 25598 }, { "epoch": 0.69, "learning_rate": 0.00046873144225989294, "loss": 2.5883, "step": 25599 }, { "epoch": 0.69, "learning_rate": 0.000468657704365546, "loss": 2.5882, "step": 25600 }, { "epoch": 0.69, "learning_rate": 0.0004685839704965532, "loss": 2.6951, "step": 25601 }, { "epoch": 0.69, "learning_rate": 0.0004685102406534737, "loss": 2.3314, "step": 25602 }, { "epoch": 0.69, "learning_rate": 0.0004684365148368651, "loss": 2.8455, "step": 25603 }, { "epoch": 0.69, "learning_rate": 0.00046836279304728615, "loss": 2.1421, "step": 25604 }, { "epoch": 0.69, "learning_rate": 0.00046828907528529627, "loss": 2.6835, "step": 25605 }, { "epoch": 0.69, "learning_rate": 0.00046821536155145307, "loss": 2.4804, "step": 25606 }, { "epoch": 0.69, "learning_rate": 0.0004681416518463152, "loss": 2.662, "step": 25607 }, { "epoch": 0.69, "learning_rate": 0.00046806794617044133, "loss": 2.3243, "step": 25608 }, { "epoch": 0.69, "learning_rate": 0.00046799424452438935, "loss": 2.2796, "step": 25609 }, { "epoch": 0.69, "learning_rate": 0.0004679205469087178, "loss": 2.0573, "step": 25610 }, { "epoch": 0.69, "learning_rate": 0.00046784685332398505, "loss": 2.5744, "step": 25611 }, { "epoch": 0.69, "learning_rate": 0.0004677731637707494, "loss": 2.5453, "step": 25612 }, { "epoch": 0.69, "learning_rate": 0.00046769947824956947, "loss": 2.359, "step": 25613 }, { "epoch": 0.69, "learning_rate": 0.0004676257967610028, "loss": 2.8392, "step": 25614 }, { "epoch": 0.69, "learning_rate": 0.0004675521193056079, "loss": 2.3448, "step": 25615 }, { "epoch": 0.69, "learning_rate": 0.0004674784458839434, "loss": 2.9089, "step": 25616 }, { "epoch": 0.69, "learning_rate": 0.0004674047764965661, "loss": 2.9472, "step": 25617 }, { "epoch": 0.69, "learning_rate": 0.0004673311111440358, "loss": 2.5488, "step": 25618 }, { "epoch": 0.69, "learning_rate": 0.00046725744982690945, "loss": 2.5673, "step": 25619 }, { "epoch": 0.69, "learning_rate": 0.00046718379254574537, "loss": 2.4567, "step": 25620 }, { "epoch": 0.69, "learning_rate": 0.00046711013930110203, "loss": 2.2237, "step": 25621 }, { "epoch": 0.69, "learning_rate": 0.00046703649009353655, "loss": 2.7589, "step": 25622 }, { "epoch": 0.69, "learning_rate": 0.0004669628449236074, "loss": 2.7622, "step": 25623 }, { "epoch": 0.69, "learning_rate": 0.0004668892037918724, "loss": 2.2917, "step": 25624 }, { "epoch": 0.69, "learning_rate": 0.00046681556669888946, "loss": 2.976, "step": 25625 }, { "epoch": 0.69, "learning_rate": 0.00046674193364521687, "loss": 2.7206, "step": 25626 }, { "epoch": 0.69, "learning_rate": 0.00046666830463141173, "loss": 2.3989, "step": 25627 }, { "epoch": 0.69, "learning_rate": 0.00046659467965803214, "loss": 2.6124, "step": 25628 }, { "epoch": 0.69, "learning_rate": 0.00046652105872563624, "loss": 2.1595, "step": 25629 }, { "epoch": 0.69, "learning_rate": 0.0004664474418347806, "loss": 2.6862, "step": 25630 }, { "epoch": 0.69, "learning_rate": 0.0004663738289860242, "loss": 2.7362, "step": 25631 }, { "epoch": 0.69, "learning_rate": 0.0004663002201799247, "loss": 2.465, "step": 25632 }, { "epoch": 0.69, "learning_rate": 0.0004662266154170389, "loss": 2.3898, "step": 25633 }, { "epoch": 0.69, "learning_rate": 0.00046615301469792514, "loss": 2.7693, "step": 25634 }, { "epoch": 0.69, "learning_rate": 0.00046607941802314035, "loss": 2.4083, "step": 25635 }, { "epoch": 0.69, "learning_rate": 0.00046600582539324255, "loss": 2.3099, "step": 25636 }, { "epoch": 0.69, "learning_rate": 0.00046593223680878906, "loss": 2.2728, "step": 25637 }, { "epoch": 0.69, "learning_rate": 0.0004658586522703374, "loss": 2.35, "step": 25638 }, { "epoch": 0.69, "learning_rate": 0.0004657850717784452, "loss": 2.4244, "step": 25639 }, { "epoch": 0.69, "learning_rate": 0.0004657114953336701, "loss": 2.3478, "step": 25640 }, { "epoch": 0.69, "learning_rate": 0.00046563792293656883, "loss": 2.3504, "step": 25641 }, { "epoch": 0.69, "learning_rate": 0.00046556435458769906, "loss": 2.6635, "step": 25642 }, { "epoch": 0.69, "learning_rate": 0.0004654907902876183, "loss": 2.4817, "step": 25643 }, { "epoch": 0.69, "learning_rate": 0.0004654172300368837, "loss": 2.5539, "step": 25644 }, { "epoch": 0.69, "learning_rate": 0.00046534367383605293, "loss": 2.1982, "step": 25645 }, { "epoch": 0.69, "learning_rate": 0.00046527012168568263, "loss": 2.7481, "step": 25646 }, { "epoch": 0.69, "learning_rate": 0.00046519657358633015, "loss": 2.4392, "step": 25647 }, { "epoch": 0.69, "learning_rate": 0.00046512302953855336, "loss": 2.3854, "step": 25648 }, { "epoch": 0.69, "learning_rate": 0.00046504948954290837, "loss": 2.4128, "step": 25649 }, { "epoch": 0.69, "learning_rate": 0.0004649759535999528, "loss": 2.1166, "step": 25650 }, { "epoch": 0.69, "learning_rate": 0.00046490242171024377, "loss": 2.8472, "step": 25651 }, { "epoch": 0.69, "learning_rate": 0.00046482889387433835, "loss": 3.1778, "step": 25652 }, { "epoch": 0.69, "learning_rate": 0.0004647553700927939, "loss": 2.555, "step": 25653 }, { "epoch": 0.69, "learning_rate": 0.00046468185036616674, "loss": 2.8328, "step": 25654 }, { "epoch": 0.69, "learning_rate": 0.0004646083346950142, "loss": 2.4998, "step": 25655 }, { "epoch": 0.69, "learning_rate": 0.00046453482307989304, "loss": 2.5496, "step": 25656 }, { "epoch": 0.69, "learning_rate": 0.0004644613155213605, "loss": 2.7201, "step": 25657 }, { "epoch": 0.69, "learning_rate": 0.00046438781201997315, "loss": 2.1635, "step": 25658 }, { "epoch": 0.69, "learning_rate": 0.00046431431257628854, "loss": 2.7328, "step": 25659 }, { "epoch": 0.69, "learning_rate": 0.00046424081719086244, "loss": 2.3407, "step": 25660 }, { "epoch": 0.69, "learning_rate": 0.0004641673258642525, "loss": 2.3515, "step": 25661 }, { "epoch": 0.69, "learning_rate": 0.0004640938385970147, "loss": 2.5441, "step": 25662 }, { "epoch": 0.69, "learning_rate": 0.0004640203553897061, "loss": 2.8867, "step": 25663 }, { "epoch": 0.69, "learning_rate": 0.00046394687624288356, "loss": 2.1609, "step": 25664 }, { "epoch": 0.69, "learning_rate": 0.00046387340115710375, "loss": 2.4177, "step": 25665 }, { "epoch": 0.69, "learning_rate": 0.000463799930132923, "loss": 2.3992, "step": 25666 }, { "epoch": 0.69, "learning_rate": 0.00046372646317089863, "loss": 2.6407, "step": 25667 }, { "epoch": 0.69, "learning_rate": 0.0004636530002715863, "loss": 2.5008, "step": 25668 }, { "epoch": 0.69, "learning_rate": 0.0004635795414355429, "loss": 2.5205, "step": 25669 }, { "epoch": 0.69, "learning_rate": 0.00046350608666332504, "loss": 1.9924, "step": 25670 }, { "epoch": 0.69, "learning_rate": 0.0004634326359554891, "loss": 2.5452, "step": 25671 }, { "epoch": 0.69, "learning_rate": 0.000463359189312592, "loss": 2.0149, "step": 25672 }, { "epoch": 0.69, "learning_rate": 0.00046328574673518933, "loss": 2.4106, "step": 25673 }, { "epoch": 0.69, "learning_rate": 0.00046321230822383796, "loss": 2.536, "step": 25674 }, { "epoch": 0.69, "learning_rate": 0.00046313887377909447, "loss": 2.4831, "step": 25675 }, { "epoch": 0.69, "learning_rate": 0.0004630654434015146, "loss": 2.6268, "step": 25676 }, { "epoch": 0.69, "learning_rate": 0.0004629920170916545, "loss": 2.6735, "step": 25677 }, { "epoch": 0.69, "learning_rate": 0.0004629185948500716, "loss": 2.4524, "step": 25678 }, { "epoch": 0.69, "learning_rate": 0.0004628451766773211, "loss": 2.5062, "step": 25679 }, { "epoch": 0.69, "learning_rate": 0.0004627717625739598, "loss": 2.7515, "step": 25680 }, { "epoch": 0.69, "learning_rate": 0.00046269835254054325, "loss": 2.5364, "step": 25681 }, { "epoch": 0.69, "learning_rate": 0.0004626249465776279, "loss": 2.305, "step": 25682 }, { "epoch": 0.69, "learning_rate": 0.00046255154468576986, "loss": 2.7708, "step": 25683 }, { "epoch": 0.69, "learning_rate": 0.0004624781468655253, "loss": 1.7153, "step": 25684 }, { "epoch": 0.69, "learning_rate": 0.0004624047531174501, "loss": 2.2152, "step": 25685 }, { "epoch": 0.69, "learning_rate": 0.0004623313634421008, "loss": 2.4468, "step": 25686 }, { "epoch": 0.69, "learning_rate": 0.0004622579778400327, "loss": 2.2521, "step": 25687 }, { "epoch": 0.69, "learning_rate": 0.0004621845963118022, "loss": 2.91, "step": 25688 }, { "epoch": 0.69, "learning_rate": 0.0004621112188579645, "loss": 2.5697, "step": 25689 }, { "epoch": 0.69, "learning_rate": 0.00046203784547907623, "loss": 2.7805, "step": 25690 }, { "epoch": 0.69, "learning_rate": 0.0004619644761756936, "loss": 2.8262, "step": 25691 }, { "epoch": 0.69, "learning_rate": 0.00046189111094837145, "loss": 2.4492, "step": 25692 }, { "epoch": 0.69, "learning_rate": 0.000461817749797666, "loss": 2.8112, "step": 25693 }, { "epoch": 0.69, "learning_rate": 0.0004617443927241335, "loss": 2.3642, "step": 25694 }, { "epoch": 0.69, "learning_rate": 0.0004616710397283288, "loss": 2.8132, "step": 25695 }, { "epoch": 0.69, "learning_rate": 0.00046159769081080814, "loss": 2.5764, "step": 25696 }, { "epoch": 0.69, "learning_rate": 0.00046152434597212714, "loss": 2.2279, "step": 25697 }, { "epoch": 0.69, "learning_rate": 0.0004614510052128413, "loss": 2.41, "step": 25698 }, { "epoch": 0.69, "learning_rate": 0.00046137766853350683, "loss": 2.8201, "step": 25699 }, { "epoch": 0.69, "learning_rate": 0.00046130433593467846, "loss": 2.6115, "step": 25700 }, { "epoch": 0.69, "learning_rate": 0.0004612310074169121, "loss": 3.197, "step": 25701 }, { "epoch": 0.69, "learning_rate": 0.0004611576829807633, "loss": 2.5709, "step": 25702 }, { "epoch": 0.69, "learning_rate": 0.00046108436262678765, "loss": 2.4484, "step": 25703 }, { "epoch": 0.69, "learning_rate": 0.0004610110463555408, "loss": 1.9518, "step": 25704 }, { "epoch": 0.69, "learning_rate": 0.00046093773416757756, "loss": 2.3232, "step": 25705 }, { "epoch": 0.69, "learning_rate": 0.0004608644260634537, "loss": 2.7532, "step": 25706 }, { "epoch": 0.69, "learning_rate": 0.00046079112204372484, "loss": 2.4757, "step": 25707 }, { "epoch": 0.69, "learning_rate": 0.0004607178221089457, "loss": 2.8049, "step": 25708 }, { "epoch": 0.69, "learning_rate": 0.00046064452625967203, "loss": 2.3457, "step": 25709 }, { "epoch": 0.69, "learning_rate": 0.0004605712344964589, "loss": 2.2211, "step": 25710 }, { "epoch": 0.69, "learning_rate": 0.0004604979468198617, "loss": 2.3343, "step": 25711 }, { "epoch": 0.69, "learning_rate": 0.00046042466323043587, "loss": 2.0508, "step": 25712 }, { "epoch": 0.69, "learning_rate": 0.0004603513837287361, "loss": 2.2927, "step": 25713 }, { "epoch": 0.69, "learning_rate": 0.0004602781083153176, "loss": 2.49, "step": 25714 }, { "epoch": 0.69, "learning_rate": 0.0004602048369907358, "loss": 2.3987, "step": 25715 }, { "epoch": 0.69, "learning_rate": 0.0004601315697555456, "loss": 2.437, "step": 25716 }, { "epoch": 0.69, "learning_rate": 0.00046005830661030215, "loss": 2.4741, "step": 25717 }, { "epoch": 0.69, "learning_rate": 0.0004599850475555607, "loss": 2.3077, "step": 25718 }, { "epoch": 0.69, "learning_rate": 0.00045991179259187567, "loss": 2.5881, "step": 25719 }, { "epoch": 0.69, "learning_rate": 0.00045983854171980244, "loss": 2.0297, "step": 25720 }, { "epoch": 0.69, "learning_rate": 0.0004597652949398961, "loss": 2.7954, "step": 25721 }, { "epoch": 0.69, "learning_rate": 0.00045969205225271094, "loss": 2.1599, "step": 25722 }, { "epoch": 0.69, "learning_rate": 0.0004596188136588022, "loss": 2.459, "step": 25723 }, { "epoch": 0.69, "learning_rate": 0.00045954557915872473, "loss": 2.4606, "step": 25724 }, { "epoch": 0.69, "learning_rate": 0.00045947234875303334, "loss": 2.5006, "step": 25725 }, { "epoch": 0.69, "learning_rate": 0.00045939912244228324, "loss": 2.117, "step": 25726 }, { "epoch": 0.69, "learning_rate": 0.00045932590022702824, "loss": 2.1265, "step": 25727 }, { "epoch": 0.69, "learning_rate": 0.00045925268210782357, "loss": 2.4504, "step": 25728 }, { "epoch": 0.69, "learning_rate": 0.00045917946808522395, "loss": 2.27, "step": 25729 }, { "epoch": 0.69, "learning_rate": 0.0004591062581597839, "loss": 2.412, "step": 25730 }, { "epoch": 0.69, "learning_rate": 0.00045903305233205863, "loss": 2.2644, "step": 25731 }, { "epoch": 0.69, "learning_rate": 0.0004589598506026018, "loss": 2.5571, "step": 25732 }, { "epoch": 0.69, "learning_rate": 0.0004588866529719684, "loss": 2.5188, "step": 25733 }, { "epoch": 0.69, "learning_rate": 0.0004588134594407134, "loss": 2.4112, "step": 25734 }, { "epoch": 0.69, "learning_rate": 0.00045874027000939057, "loss": 2.4336, "step": 25735 }, { "epoch": 0.69, "learning_rate": 0.0004586670846785542, "loss": 2.5377, "step": 25736 }, { "epoch": 0.69, "learning_rate": 0.00045859390344875995, "loss": 2.3665, "step": 25737 }, { "epoch": 0.69, "learning_rate": 0.00045852072632056117, "loss": 2.1122, "step": 25738 }, { "epoch": 0.69, "learning_rate": 0.0004584475532945129, "loss": 2.1342, "step": 25739 }, { "epoch": 0.69, "learning_rate": 0.00045837438437116884, "loss": 2.4651, "step": 25740 }, { "epoch": 0.69, "learning_rate": 0.0004583012195510835, "loss": 2.4426, "step": 25741 }, { "epoch": 0.69, "learning_rate": 0.00045822805883481146, "loss": 2.3288, "step": 25742 }, { "epoch": 0.69, "learning_rate": 0.0004581549022229066, "loss": 2.9561, "step": 25743 }, { "epoch": 0.69, "learning_rate": 0.0004580817497159234, "loss": 2.2897, "step": 25744 }, { "epoch": 0.69, "learning_rate": 0.0004580086013144164, "loss": 2.3985, "step": 25745 }, { "epoch": 0.69, "learning_rate": 0.0004579354570189388, "loss": 2.163, "step": 25746 }, { "epoch": 0.69, "learning_rate": 0.0004578623168300458, "loss": 2.5522, "step": 25747 }, { "epoch": 0.69, "learning_rate": 0.0004577891807482906, "loss": 2.7987, "step": 25748 }, { "epoch": 0.69, "learning_rate": 0.0004577160487742271, "loss": 2.4139, "step": 25749 }, { "epoch": 0.69, "learning_rate": 0.00045764292090841075, "loss": 2.6477, "step": 25750 }, { "epoch": 0.69, "learning_rate": 0.0004575697971513942, "loss": 2.2531, "step": 25751 }, { "epoch": 0.69, "learning_rate": 0.00045749667750373193, "loss": 2.5173, "step": 25752 }, { "epoch": 0.69, "learning_rate": 0.00045742356196597824, "loss": 2.0829, "step": 25753 }, { "epoch": 0.69, "learning_rate": 0.0004573504505386863, "loss": 2.0814, "step": 25754 }, { "epoch": 0.69, "learning_rate": 0.0004572773432224102, "loss": 2.2064, "step": 25755 }, { "epoch": 0.69, "learning_rate": 0.000457204240017704, "loss": 2.5224, "step": 25756 }, { "epoch": 0.69, "learning_rate": 0.00045713114092512145, "loss": 2.5727, "step": 25757 }, { "epoch": 0.69, "learning_rate": 0.0004570580459452167, "loss": 2.3711, "step": 25758 }, { "epoch": 0.69, "learning_rate": 0.00045698495507854263, "loss": 2.6853, "step": 25759 }, { "epoch": 0.69, "learning_rate": 0.0004569118683256537, "loss": 2.5869, "step": 25760 }, { "epoch": 0.69, "learning_rate": 0.0004568387856871035, "loss": 2.3222, "step": 25761 }, { "epoch": 0.69, "learning_rate": 0.0004567657071634449, "loss": 2.4701, "step": 25762 }, { "epoch": 0.69, "learning_rate": 0.00045669263275523257, "loss": 2.8285, "step": 25763 }, { "epoch": 0.69, "learning_rate": 0.0004566195624630201, "loss": 2.4852, "step": 25764 }, { "epoch": 0.69, "learning_rate": 0.0004565464962873602, "loss": 2.6397, "step": 25765 }, { "epoch": 0.69, "learning_rate": 0.00045647343422880736, "loss": 2.3485, "step": 25766 }, { "epoch": 0.69, "learning_rate": 0.0004564003762879142, "loss": 2.6547, "step": 25767 }, { "epoch": 0.69, "learning_rate": 0.00045632732246523455, "loss": 2.5603, "step": 25768 }, { "epoch": 0.69, "learning_rate": 0.000456254272761322, "loss": 2.1511, "step": 25769 }, { "epoch": 0.69, "learning_rate": 0.00045618122717672985, "loss": 2.9109, "step": 25770 }, { "epoch": 0.69, "learning_rate": 0.0004561081857120115, "loss": 2.571, "step": 25771 }, { "epoch": 0.69, "learning_rate": 0.00045603514836772065, "loss": 2.7922, "step": 25772 }, { "epoch": 0.69, "learning_rate": 0.00045596211514440987, "loss": 2.3915, "step": 25773 }, { "epoch": 0.69, "learning_rate": 0.00045588908604263326, "loss": 2.6328, "step": 25774 }, { "epoch": 0.69, "learning_rate": 0.00045581606106294284, "loss": 2.3804, "step": 25775 }, { "epoch": 0.69, "learning_rate": 0.0004557430402058931, "loss": 2.3099, "step": 25776 }, { "epoch": 0.69, "learning_rate": 0.0004556700234720371, "loss": 2.5829, "step": 25777 }, { "epoch": 0.69, "learning_rate": 0.0004555970108619274, "loss": 2.3027, "step": 25778 }, { "epoch": 0.69, "learning_rate": 0.0004555240023761173, "loss": 2.3915, "step": 25779 }, { "epoch": 0.69, "learning_rate": 0.0004554509980151604, "loss": 2.6652, "step": 25780 }, { "epoch": 0.69, "learning_rate": 0.00045537799777960907, "loss": 2.345, "step": 25781 }, { "epoch": 0.69, "learning_rate": 0.00045530500167001664, "loss": 2.6191, "step": 25782 }, { "epoch": 0.69, "learning_rate": 0.0004552320096869361, "loss": 2.1784, "step": 25783 }, { "epoch": 0.69, "learning_rate": 0.0004551590218309205, "loss": 2.0055, "step": 25784 }, { "epoch": 0.69, "learning_rate": 0.00045508603810252314, "loss": 2.6419, "step": 25785 }, { "epoch": 0.69, "learning_rate": 0.00045501305850229615, "loss": 2.6253, "step": 25786 }, { "epoch": 0.69, "learning_rate": 0.00045494008303079283, "loss": 2.2042, "step": 25787 }, { "epoch": 0.69, "learning_rate": 0.00045486711168856586, "loss": 2.6947, "step": 25788 }, { "epoch": 0.69, "learning_rate": 0.0004547941444761683, "loss": 2.686, "step": 25789 }, { "epoch": 0.69, "learning_rate": 0.00045472118139415274, "loss": 1.987, "step": 25790 }, { "epoch": 0.69, "learning_rate": 0.00045464822244307247, "loss": 2.2358, "step": 25791 }, { "epoch": 0.69, "learning_rate": 0.00045457526762347934, "loss": 2.359, "step": 25792 }, { "epoch": 0.69, "learning_rate": 0.0004545023169359269, "loss": 2.2812, "step": 25793 }, { "epoch": 0.69, "learning_rate": 0.000454429370380967, "loss": 2.4435, "step": 25794 }, { "epoch": 0.69, "learning_rate": 0.00045435642795915265, "loss": 2.1127, "step": 25795 }, { "epoch": 0.69, "learning_rate": 0.0004542834896710364, "loss": 2.5926, "step": 25796 }, { "epoch": 0.69, "learning_rate": 0.0004542105555171709, "loss": 2.4075, "step": 25797 }, { "epoch": 0.69, "learning_rate": 0.0004541376254981087, "loss": 2.346, "step": 25798 }, { "epoch": 0.69, "learning_rate": 0.00045406469961440255, "loss": 2.0509, "step": 25799 }, { "epoch": 0.69, "learning_rate": 0.0004539917778666043, "loss": 2.3506, "step": 25800 }, { "epoch": 0.69, "learning_rate": 0.00045391886025526675, "loss": 2.5192, "step": 25801 }, { "epoch": 0.69, "learning_rate": 0.00045384594678094225, "loss": 2.5007, "step": 25802 }, { "epoch": 0.69, "learning_rate": 0.0004537730374441832, "loss": 2.5612, "step": 25803 }, { "epoch": 0.69, "learning_rate": 0.0004537001322455424, "loss": 2.2651, "step": 25804 }, { "epoch": 0.69, "learning_rate": 0.00045362723118557124, "loss": 2.7244, "step": 25805 }, { "epoch": 0.69, "learning_rate": 0.00045355433426482264, "loss": 2.6541, "step": 25806 }, { "epoch": 0.69, "learning_rate": 0.000453481441483849, "loss": 2.2915, "step": 25807 }, { "epoch": 0.69, "learning_rate": 0.0004534085528432019, "loss": 2.4044, "step": 25808 }, { "epoch": 0.69, "learning_rate": 0.0004533356683434339, "loss": 2.3179, "step": 25809 }, { "epoch": 0.69, "learning_rate": 0.000453262787985097, "loss": 2.6622, "step": 25810 }, { "epoch": 0.69, "learning_rate": 0.00045318991176874357, "loss": 2.182, "step": 25811 }, { "epoch": 0.69, "learning_rate": 0.000453117039694926, "loss": 2.5644, "step": 25812 }, { "epoch": 0.69, "learning_rate": 0.00045304417176419563, "loss": 2.1312, "step": 25813 }, { "epoch": 0.69, "learning_rate": 0.00045297130797710474, "loss": 2.6083, "step": 25814 }, { "epoch": 0.69, "learning_rate": 0.00045289844833420545, "loss": 2.2437, "step": 25815 }, { "epoch": 0.69, "learning_rate": 0.00045282559283604974, "loss": 2.8391, "step": 25816 }, { "epoch": 0.69, "learning_rate": 0.0004527527414831899, "loss": 2.5186, "step": 25817 }, { "epoch": 0.69, "learning_rate": 0.0004526798942761771, "loss": 2.5279, "step": 25818 }, { "epoch": 0.69, "learning_rate": 0.00045260705121556347, "loss": 2.3013, "step": 25819 }, { "epoch": 0.69, "learning_rate": 0.0004525342123019013, "loss": 2.2836, "step": 25820 }, { "epoch": 0.69, "learning_rate": 0.0004524613775357418, "loss": 2.2747, "step": 25821 }, { "epoch": 0.69, "learning_rate": 0.0004523885469176365, "loss": 2.0893, "step": 25822 }, { "epoch": 0.69, "learning_rate": 0.0004523157204481386, "loss": 2.8439, "step": 25823 }, { "epoch": 0.69, "learning_rate": 0.0004522428981277984, "loss": 2.1011, "step": 25824 }, { "epoch": 0.69, "learning_rate": 0.00045217007995716806, "loss": 2.5865, "step": 25825 }, { "epoch": 0.69, "learning_rate": 0.0004520972659367997, "loss": 2.3372, "step": 25826 }, { "epoch": 0.69, "learning_rate": 0.00045202445606724406, "loss": 2.7759, "step": 25827 }, { "epoch": 0.69, "learning_rate": 0.00045195165034905317, "loss": 2.73, "step": 25828 }, { "epoch": 0.69, "learning_rate": 0.0004518788487827786, "loss": 2.4048, "step": 25829 }, { "epoch": 0.69, "learning_rate": 0.0004518060513689719, "loss": 2.9177, "step": 25830 }, { "epoch": 0.69, "learning_rate": 0.0004517332581081849, "loss": 2.3281, "step": 25831 }, { "epoch": 0.69, "learning_rate": 0.0004516604690009684, "loss": 2.4434, "step": 25832 }, { "epoch": 0.69, "learning_rate": 0.0004515876840478741, "loss": 2.28, "step": 25833 }, { "epoch": 0.69, "learning_rate": 0.0004515149032494539, "loss": 2.6411, "step": 25834 }, { "epoch": 0.69, "learning_rate": 0.00045144212660625785, "loss": 2.182, "step": 25835 }, { "epoch": 0.69, "learning_rate": 0.00045136935411883904, "loss": 2.5696, "step": 25836 }, { "epoch": 0.69, "learning_rate": 0.0004512965857877475, "loss": 2.2943, "step": 25837 }, { "epoch": 0.69, "learning_rate": 0.0004512238216135349, "loss": 2.84, "step": 25838 }, { "epoch": 0.69, "learning_rate": 0.0004511510615967529, "loss": 2.0314, "step": 25839 }, { "epoch": 0.69, "learning_rate": 0.00045107830573795193, "loss": 2.8936, "step": 25840 }, { "epoch": 0.69, "learning_rate": 0.0004510055540376837, "loss": 2.473, "step": 25841 }, { "epoch": 0.69, "learning_rate": 0.00045093280649649917, "loss": 2.4507, "step": 25842 }, { "epoch": 0.69, "learning_rate": 0.00045086006311494955, "loss": 2.5604, "step": 25843 }, { "epoch": 0.69, "learning_rate": 0.00045078732389358623, "loss": 2.4004, "step": 25844 }, { "epoch": 0.69, "learning_rate": 0.00045071458883295956, "loss": 2.6322, "step": 25845 }, { "epoch": 0.69, "learning_rate": 0.0004506418579336211, "loss": 2.2928, "step": 25846 }, { "epoch": 0.69, "learning_rate": 0.00045056913119612195, "loss": 2.5852, "step": 25847 }, { "epoch": 0.69, "learning_rate": 0.0004504964086210122, "loss": 2.7293, "step": 25848 }, { "epoch": 0.69, "learning_rate": 0.00045042369020884367, "loss": 2.032, "step": 25849 }, { "epoch": 0.69, "learning_rate": 0.0004503509759601675, "loss": 2.2869, "step": 25850 }, { "epoch": 0.69, "learning_rate": 0.00045027826587553364, "loss": 2.3782, "step": 25851 }, { "epoch": 0.69, "learning_rate": 0.0004502055599554937, "loss": 2.3265, "step": 25852 }, { "epoch": 0.69, "learning_rate": 0.0004501328582005978, "loss": 2.8435, "step": 25853 }, { "epoch": 0.69, "learning_rate": 0.0004500601606113971, "loss": 2.7539, "step": 25854 }, { "epoch": 0.69, "learning_rate": 0.0004499874671884422, "loss": 2.8098, "step": 25855 }, { "epoch": 0.69, "learning_rate": 0.00044991477793228396, "loss": 2.1498, "step": 25856 }, { "epoch": 0.69, "learning_rate": 0.0004498420928434731, "loss": 2.9481, "step": 25857 }, { "epoch": 0.69, "learning_rate": 0.0004497694119225605, "loss": 2.6601, "step": 25858 }, { "epoch": 0.69, "learning_rate": 0.000449696735170096, "loss": 2.3843, "step": 25859 }, { "epoch": 0.69, "learning_rate": 0.0004496240625866308, "loss": 2.6916, "step": 25860 }, { "epoch": 0.69, "learning_rate": 0.00044955139417271516, "loss": 2.3986, "step": 25861 }, { "epoch": 0.7, "learning_rate": 0.00044947872992889983, "loss": 2.1589, "step": 25862 }, { "epoch": 0.7, "learning_rate": 0.00044940606985573563, "loss": 2.5633, "step": 25863 }, { "epoch": 0.7, "learning_rate": 0.00044933341395377214, "loss": 2.8684, "step": 25864 }, { "epoch": 0.7, "learning_rate": 0.00044926076222356025, "loss": 2.4886, "step": 25865 }, { "epoch": 0.7, "learning_rate": 0.0004491881146656508, "loss": 2.3411, "step": 25866 }, { "epoch": 0.7, "learning_rate": 0.00044911547128059337, "loss": 2.412, "step": 25867 }, { "epoch": 0.7, "learning_rate": 0.00044904283206893825, "loss": 2.4123, "step": 25868 }, { "epoch": 0.7, "learning_rate": 0.00044897019703123685, "loss": 2.2512, "step": 25869 }, { "epoch": 0.7, "learning_rate": 0.00044889756616803836, "loss": 2.2062, "step": 25870 }, { "epoch": 0.7, "learning_rate": 0.0004488249394798938, "loss": 2.5432, "step": 25871 }, { "epoch": 0.7, "learning_rate": 0.0004487523169673524, "loss": 2.627, "step": 25872 }, { "epoch": 0.7, "learning_rate": 0.00044867969863096515, "loss": 2.3017, "step": 25873 }, { "epoch": 0.7, "learning_rate": 0.00044860708447128176, "loss": 2.3276, "step": 25874 }, { "epoch": 0.7, "learning_rate": 0.00044853447448885256, "loss": 2.6374, "step": 25875 }, { "epoch": 0.7, "learning_rate": 0.00044846186868422757, "loss": 2.6098, "step": 25876 }, { "epoch": 0.7, "learning_rate": 0.00044838926705795734, "loss": 2.3814, "step": 25877 }, { "epoch": 0.7, "learning_rate": 0.0004483166696105909, "loss": 2.6091, "step": 25878 }, { "epoch": 0.7, "learning_rate": 0.0004482440763426792, "loss": 2.2434, "step": 25879 }, { "epoch": 0.7, "learning_rate": 0.0004481714872547713, "loss": 2.559, "step": 25880 }, { "epoch": 0.7, "learning_rate": 0.00044809890234741724, "loss": 2.5367, "step": 25881 }, { "epoch": 0.7, "learning_rate": 0.00044802632162116787, "loss": 2.3195, "step": 25882 }, { "epoch": 0.7, "learning_rate": 0.0004479537450765722, "loss": 2.4174, "step": 25883 }, { "epoch": 0.7, "learning_rate": 0.00044788117271418005, "loss": 2.4026, "step": 25884 }, { "epoch": 0.7, "learning_rate": 0.00044780860453454195, "loss": 2.4876, "step": 25885 }, { "epoch": 0.7, "learning_rate": 0.0004477360405382067, "loss": 2.5615, "step": 25886 }, { "epoch": 0.7, "learning_rate": 0.00044766348072572447, "loss": 2.7502, "step": 25887 }, { "epoch": 0.7, "learning_rate": 0.00044759092509764496, "loss": 2.6622, "step": 25888 }, { "epoch": 0.7, "learning_rate": 0.00044751837365451796, "loss": 2.6381, "step": 25889 }, { "epoch": 0.7, "learning_rate": 0.00044744582639689323, "loss": 2.5666, "step": 25890 }, { "epoch": 0.7, "learning_rate": 0.0004473732833253198, "loss": 2.0936, "step": 25891 }, { "epoch": 0.7, "learning_rate": 0.0004473007444403475, "loss": 2.52, "step": 25892 }, { "epoch": 0.7, "learning_rate": 0.00044722820974252644, "loss": 2.7097, "step": 25893 }, { "epoch": 0.7, "learning_rate": 0.00044715567923240483, "loss": 2.5064, "step": 25894 }, { "epoch": 0.7, "learning_rate": 0.0004470831529105337, "loss": 2.2168, "step": 25895 }, { "epoch": 0.7, "learning_rate": 0.0004470106307774614, "loss": 2.5509, "step": 25896 }, { "epoch": 0.7, "learning_rate": 0.00044693811283373776, "loss": 2.4808, "step": 25897 }, { "epoch": 0.7, "learning_rate": 0.0004468655990799123, "loss": 2.7666, "step": 25898 }, { "epoch": 0.7, "learning_rate": 0.00044679308951653396, "loss": 2.3909, "step": 25899 }, { "epoch": 0.7, "learning_rate": 0.00044672058414415216, "loss": 2.3401, "step": 25900 }, { "epoch": 0.7, "learning_rate": 0.0004466480829633164, "loss": 2.3825, "step": 25901 }, { "epoch": 0.7, "learning_rate": 0.0004465755859745757, "loss": 2.3357, "step": 25902 }, { "epoch": 0.7, "learning_rate": 0.0004465030931784796, "loss": 2.8331, "step": 25903 }, { "epoch": 0.7, "learning_rate": 0.00044643060457557726, "loss": 2.5472, "step": 25904 }, { "epoch": 0.7, "learning_rate": 0.0004463581201664175, "loss": 3.0603, "step": 25905 }, { "epoch": 0.7, "learning_rate": 0.0004462856399515499, "loss": 2.2854, "step": 25906 }, { "epoch": 0.7, "learning_rate": 0.00044621316393152264, "loss": 2.0489, "step": 25907 }, { "epoch": 0.7, "learning_rate": 0.0004461406921068858, "loss": 2.5911, "step": 25908 }, { "epoch": 0.7, "learning_rate": 0.0004460682244781884, "loss": 2.7319, "step": 25909 }, { "epoch": 0.7, "learning_rate": 0.0004459957610459787, "loss": 2.2454, "step": 25910 }, { "epoch": 0.7, "learning_rate": 0.0004459233018108061, "loss": 2.5175, "step": 25911 }, { "epoch": 0.7, "learning_rate": 0.00044585084677321987, "loss": 2.2175, "step": 25912 }, { "epoch": 0.7, "learning_rate": 0.0004457783959337681, "loss": 2.1339, "step": 25913 }, { "epoch": 0.7, "learning_rate": 0.00044570594929300023, "loss": 2.4301, "step": 25914 }, { "epoch": 0.7, "learning_rate": 0.00044563350685146495, "loss": 2.3801, "step": 25915 }, { "epoch": 0.7, "learning_rate": 0.00044556106860971115, "loss": 2.4189, "step": 25916 }, { "epoch": 0.7, "learning_rate": 0.0004454886345682879, "loss": 2.6394, "step": 25917 }, { "epoch": 0.7, "learning_rate": 0.00044541620472774324, "loss": 2.8037, "step": 25918 }, { "epoch": 0.7, "learning_rate": 0.00044534377908862636, "loss": 2.2714, "step": 25919 }, { "epoch": 0.7, "learning_rate": 0.00044527135765148575, "loss": 2.4623, "step": 25920 }, { "epoch": 0.7, "learning_rate": 0.00044519894041687014, "loss": 2.6516, "step": 25921 }, { "epoch": 0.7, "learning_rate": 0.00044512652738532856, "loss": 2.6016, "step": 25922 }, { "epoch": 0.7, "learning_rate": 0.00044505411855740886, "loss": 2.502, "step": 25923 }, { "epoch": 0.7, "learning_rate": 0.0004449817139336599, "loss": 2.5979, "step": 25924 }, { "epoch": 0.7, "learning_rate": 0.0004449093135146307, "loss": 2.4849, "step": 25925 }, { "epoch": 0.7, "learning_rate": 0.00044483691730086883, "loss": 2.5897, "step": 25926 }, { "epoch": 0.7, "learning_rate": 0.0004447645252929233, "loss": 2.6591, "step": 25927 }, { "epoch": 0.7, "learning_rate": 0.0004446921374913424, "loss": 2.4898, "step": 25928 }, { "epoch": 0.7, "learning_rate": 0.00044461975389667463, "loss": 2.724, "step": 25929 }, { "epoch": 0.7, "learning_rate": 0.0004445473745094687, "loss": 2.695, "step": 25930 }, { "epoch": 0.7, "learning_rate": 0.0004444749993302721, "loss": 2.6423, "step": 25931 }, { "epoch": 0.7, "learning_rate": 0.00044440262835963363, "loss": 2.2788, "step": 25932 }, { "epoch": 0.7, "learning_rate": 0.0004443302615981015, "loss": 2.5114, "step": 25933 }, { "epoch": 0.7, "learning_rate": 0.00044425789904622406, "loss": 2.7845, "step": 25934 }, { "epoch": 0.7, "learning_rate": 0.0004441855407045493, "loss": 2.9567, "step": 25935 }, { "epoch": 0.7, "learning_rate": 0.00044411318657362596, "loss": 2.5969, "step": 25936 }, { "epoch": 0.7, "learning_rate": 0.00044404083665400143, "loss": 2.8683, "step": 25937 }, { "epoch": 0.7, "learning_rate": 0.00044396849094622393, "loss": 2.9081, "step": 25938 }, { "epoch": 0.7, "learning_rate": 0.0004438961494508422, "loss": 2.1036, "step": 25939 }, { "epoch": 0.7, "learning_rate": 0.00044382381216840353, "loss": 2.215, "step": 25940 }, { "epoch": 0.7, "learning_rate": 0.0004437514790994561, "loss": 2.7841, "step": 25941 }, { "epoch": 0.7, "learning_rate": 0.0004436791502445481, "loss": 2.3909, "step": 25942 }, { "epoch": 0.7, "learning_rate": 0.0004436068256042274, "loss": 2.9008, "step": 25943 }, { "epoch": 0.7, "learning_rate": 0.00044353450517904214, "loss": 2.1981, "step": 25944 }, { "epoch": 0.7, "learning_rate": 0.0004434621889695397, "loss": 2.4528, "step": 25945 }, { "epoch": 0.7, "learning_rate": 0.00044338987697626833, "loss": 2.3401, "step": 25946 }, { "epoch": 0.7, "learning_rate": 0.0004433175691997756, "loss": 2.5813, "step": 25947 }, { "epoch": 0.7, "learning_rate": 0.00044324526564060954, "loss": 2.5462, "step": 25948 }, { "epoch": 0.7, "learning_rate": 0.00044317296629931815, "loss": 2.4516, "step": 25949 }, { "epoch": 0.7, "learning_rate": 0.0004431006711764484, "loss": 2.5169, "step": 25950 }, { "epoch": 0.7, "learning_rate": 0.00044302838027254846, "loss": 2.7293, "step": 25951 }, { "epoch": 0.7, "learning_rate": 0.00044295609358816623, "loss": 2.4962, "step": 25952 }, { "epoch": 0.7, "learning_rate": 0.0004428838111238487, "loss": 2.5034, "step": 25953 }, { "epoch": 0.7, "learning_rate": 0.0004428115328801434, "loss": 2.5492, "step": 25954 }, { "epoch": 0.7, "learning_rate": 0.00044273925885759914, "loss": 2.6123, "step": 25955 }, { "epoch": 0.7, "learning_rate": 0.0004426669890567622, "loss": 2.456, "step": 25956 }, { "epoch": 0.7, "learning_rate": 0.0004425947234781809, "loss": 2.5663, "step": 25957 }, { "epoch": 0.7, "learning_rate": 0.00044252246212240197, "loss": 2.68, "step": 25958 }, { "epoch": 0.7, "learning_rate": 0.0004424502049899731, "loss": 2.6182, "step": 25959 }, { "epoch": 0.7, "learning_rate": 0.00044237795208144193, "loss": 2.0405, "step": 25960 }, { "epoch": 0.7, "learning_rate": 0.00044230570339735565, "loss": 2.3678, "step": 25961 }, { "epoch": 0.7, "learning_rate": 0.00044223345893826174, "loss": 2.3272, "step": 25962 }, { "epoch": 0.7, "learning_rate": 0.0004421612187047076, "loss": 2.27, "step": 25963 }, { "epoch": 0.7, "learning_rate": 0.0004420889826972401, "loss": 2.474, "step": 25964 }, { "epoch": 0.7, "learning_rate": 0.000442016750916407, "loss": 2.5679, "step": 25965 }, { "epoch": 0.7, "learning_rate": 0.00044194452336275504, "loss": 2.4262, "step": 25966 }, { "epoch": 0.7, "learning_rate": 0.0004418723000368311, "loss": 2.3403, "step": 25967 }, { "epoch": 0.7, "learning_rate": 0.0004418000809391836, "loss": 2.3455, "step": 25968 }, { "epoch": 0.7, "learning_rate": 0.00044172786607035854, "loss": 2.6385, "step": 25969 }, { "epoch": 0.7, "learning_rate": 0.00044165565543090324, "loss": 2.4983, "step": 25970 }, { "epoch": 0.7, "learning_rate": 0.0004415834490213654, "loss": 2.6068, "step": 25971 }, { "epoch": 0.7, "learning_rate": 0.00044151124684229103, "loss": 2.6111, "step": 25972 }, { "epoch": 0.7, "learning_rate": 0.0004414390488942277, "loss": 2.2185, "step": 25973 }, { "epoch": 0.7, "learning_rate": 0.00044136685517772226, "loss": 2.5563, "step": 25974 }, { "epoch": 0.7, "learning_rate": 0.00044129466569332155, "loss": 2.9532, "step": 25975 }, { "epoch": 0.7, "learning_rate": 0.000441222480441573, "loss": 2.1838, "step": 25976 }, { "epoch": 0.7, "learning_rate": 0.00044115029942302263, "loss": 2.5295, "step": 25977 }, { "epoch": 0.7, "learning_rate": 0.0004410781226382178, "loss": 2.1197, "step": 25978 }, { "epoch": 0.7, "learning_rate": 0.0004410059500877055, "loss": 2.2654, "step": 25979 }, { "epoch": 0.7, "learning_rate": 0.00044093378177203135, "loss": 2.4113, "step": 25980 }, { "epoch": 0.7, "learning_rate": 0.00044086161769174337, "loss": 2.4153, "step": 25981 }, { "epoch": 0.7, "learning_rate": 0.00044078945784738823, "loss": 2.6743, "step": 25982 }, { "epoch": 0.7, "learning_rate": 0.00044071730223951166, "loss": 2.3231, "step": 25983 }, { "epoch": 0.7, "learning_rate": 0.0004406451508686613, "loss": 2.9317, "step": 25984 }, { "epoch": 0.7, "learning_rate": 0.0004405730037353829, "loss": 2.482, "step": 25985 }, { "epoch": 0.7, "learning_rate": 0.00044050086084022335, "loss": 2.4895, "step": 25986 }, { "epoch": 0.7, "learning_rate": 0.0004404287221837293, "loss": 2.5972, "step": 25987 }, { "epoch": 0.7, "learning_rate": 0.00044035658776644726, "loss": 2.5346, "step": 25988 }, { "epoch": 0.7, "learning_rate": 0.00044028445758892355, "loss": 2.6094, "step": 25989 }, { "epoch": 0.7, "learning_rate": 0.00044021233165170517, "loss": 2.5782, "step": 25990 }, { "epoch": 0.7, "learning_rate": 0.00044014020995533767, "loss": 2.6233, "step": 25991 }, { "epoch": 0.7, "learning_rate": 0.00044006809250036815, "loss": 2.1657, "step": 25992 }, { "epoch": 0.7, "learning_rate": 0.000439995979287342, "loss": 2.4233, "step": 25993 }, { "epoch": 0.7, "learning_rate": 0.0004399238703168066, "loss": 2.3612, "step": 25994 }, { "epoch": 0.7, "learning_rate": 0.00043985176558930815, "loss": 2.5756, "step": 25995 }, { "epoch": 0.7, "learning_rate": 0.00043977966510539215, "loss": 1.971, "step": 25996 }, { "epoch": 0.7, "learning_rate": 0.00043970756886560535, "loss": 2.8378, "step": 25997 }, { "epoch": 0.7, "learning_rate": 0.0004396354768704941, "loss": 2.7625, "step": 25998 }, { "epoch": 0.7, "learning_rate": 0.00043956338912060403, "loss": 2.9869, "step": 25999 }, { "epoch": 0.7, "learning_rate": 0.0004394913056164814, "loss": 2.484, "step": 26000 }, { "epoch": 0.7, "learning_rate": 0.0004394192263586726, "loss": 2.6857, "step": 26001 }, { "epoch": 0.7, "learning_rate": 0.0004393471513477234, "loss": 2.8085, "step": 26002 }, { "epoch": 0.7, "learning_rate": 0.0004392750805841803, "loss": 2.4132, "step": 26003 }, { "epoch": 0.7, "learning_rate": 0.0004392030140685886, "loss": 2.1581, "step": 26004 }, { "epoch": 0.7, "learning_rate": 0.00043913095180149464, "loss": 2.4909, "step": 26005 }, { "epoch": 0.7, "learning_rate": 0.0004390588937834443, "loss": 2.2307, "step": 26006 }, { "epoch": 0.7, "learning_rate": 0.00043898684001498356, "loss": 1.9782, "step": 26007 }, { "epoch": 0.7, "learning_rate": 0.0004389147904966585, "loss": 2.3641, "step": 26008 }, { "epoch": 0.7, "learning_rate": 0.00043884274522901435, "loss": 2.207, "step": 26009 }, { "epoch": 0.7, "learning_rate": 0.00043877070421259725, "loss": 2.4527, "step": 26010 }, { "epoch": 0.7, "learning_rate": 0.0004386986674479533, "loss": 2.6211, "step": 26011 }, { "epoch": 0.7, "learning_rate": 0.00043862663493562747, "loss": 2.6752, "step": 26012 }, { "epoch": 0.7, "learning_rate": 0.00043855460667616586, "loss": 1.778, "step": 26013 }, { "epoch": 0.7, "learning_rate": 0.0004384825826701143, "loss": 2.2639, "step": 26014 }, { "epoch": 0.7, "learning_rate": 0.00043841056291801827, "loss": 2.2111, "step": 26015 }, { "epoch": 0.7, "learning_rate": 0.0004383385474204233, "loss": 2.5733, "step": 26016 }, { "epoch": 0.7, "learning_rate": 0.00043826653617787557, "loss": 2.9927, "step": 26017 }, { "epoch": 0.7, "learning_rate": 0.00043819452919091975, "loss": 2.3055, "step": 26018 }, { "epoch": 0.7, "learning_rate": 0.00043812252646010174, "loss": 2.4646, "step": 26019 }, { "epoch": 0.7, "learning_rate": 0.000438050527985967, "loss": 2.3921, "step": 26020 }, { "epoch": 0.7, "learning_rate": 0.00043797853376906096, "loss": 2.878, "step": 26021 }, { "epoch": 0.7, "learning_rate": 0.00043790654380992944, "loss": 2.7059, "step": 26022 }, { "epoch": 0.7, "learning_rate": 0.0004378345581091171, "loss": 2.6826, "step": 26023 }, { "epoch": 0.7, "learning_rate": 0.00043776257666716965, "loss": 2.2573, "step": 26024 }, { "epoch": 0.7, "learning_rate": 0.00043769059948463285, "loss": 2.3287, "step": 26025 }, { "epoch": 0.7, "learning_rate": 0.00043761862656205064, "loss": 2.9619, "step": 26026 }, { "epoch": 0.7, "learning_rate": 0.00043754665789997005, "loss": 2.3482, "step": 26027 }, { "epoch": 0.7, "learning_rate": 0.00043747469349893496, "loss": 2.6975, "step": 26028 }, { "epoch": 0.7, "learning_rate": 0.0004374027333594911, "loss": 2.2948, "step": 26029 }, { "epoch": 0.7, "learning_rate": 0.0004373307774821839, "loss": 2.4105, "step": 26030 }, { "epoch": 0.7, "learning_rate": 0.0004372588258675576, "loss": 2.5057, "step": 26031 }, { "epoch": 0.7, "learning_rate": 0.00043718687851615804, "loss": 1.9834, "step": 26032 }, { "epoch": 0.7, "learning_rate": 0.00043711493542853, "loss": 2.7248, "step": 26033 }, { "epoch": 0.7, "learning_rate": 0.0004370429966052185, "loss": 2.3443, "step": 26034 }, { "epoch": 0.7, "learning_rate": 0.00043697106204676906, "loss": 1.9556, "step": 26035 }, { "epoch": 0.7, "learning_rate": 0.00043689913175372586, "loss": 2.486, "step": 26036 }, { "epoch": 0.7, "learning_rate": 0.00043682720572663406, "loss": 2.4898, "step": 26037 }, { "epoch": 0.7, "learning_rate": 0.00043675528396603904, "loss": 2.2196, "step": 26038 }, { "epoch": 0.7, "learning_rate": 0.0004366833664724846, "loss": 2.3421, "step": 26039 }, { "epoch": 0.7, "learning_rate": 0.00043661145324651665, "loss": 2.4882, "step": 26040 }, { "epoch": 0.7, "learning_rate": 0.00043653954428867994, "loss": 2.9267, "step": 26041 }, { "epoch": 0.7, "learning_rate": 0.00043646763959951865, "loss": 2.1627, "step": 26042 }, { "epoch": 0.7, "learning_rate": 0.00043639573917957796, "loss": 2.5151, "step": 26043 }, { "epoch": 0.7, "learning_rate": 0.0004363238430294021, "loss": 2.5542, "step": 26044 }, { "epoch": 0.7, "learning_rate": 0.0004362519511495361, "loss": 2.6311, "step": 26045 }, { "epoch": 0.7, "learning_rate": 0.0004361800635405244, "loss": 2.2136, "step": 26046 }, { "epoch": 0.7, "learning_rate": 0.0004361081802029118, "loss": 2.3826, "step": 26047 }, { "epoch": 0.7, "learning_rate": 0.0004360363011372428, "loss": 2.6306, "step": 26048 }, { "epoch": 0.7, "learning_rate": 0.0004359644263440623, "loss": 2.4569, "step": 26049 }, { "epoch": 0.7, "learning_rate": 0.0004358925558239142, "loss": 2.4242, "step": 26050 }, { "epoch": 0.7, "learning_rate": 0.0004358206895773431, "loss": 2.7, "step": 26051 }, { "epoch": 0.7, "learning_rate": 0.00043574882760489365, "loss": 2.3415, "step": 26052 }, { "epoch": 0.7, "learning_rate": 0.00043567696990711027, "loss": 2.4234, "step": 26053 }, { "epoch": 0.7, "learning_rate": 0.0004356051164845376, "loss": 2.6801, "step": 26054 }, { "epoch": 0.7, "learning_rate": 0.00043553326733771923, "loss": 2.1827, "step": 26055 }, { "epoch": 0.7, "learning_rate": 0.0004354614224672, "loss": 2.654, "step": 26056 }, { "epoch": 0.7, "learning_rate": 0.0004353895818735244, "loss": 2.6514, "step": 26057 }, { "epoch": 0.7, "learning_rate": 0.0004353177455572361, "loss": 2.501, "step": 26058 }, { "epoch": 0.7, "learning_rate": 0.00043524591351887953, "loss": 2.5868, "step": 26059 }, { "epoch": 0.7, "learning_rate": 0.00043517408575899895, "loss": 2.1979, "step": 26060 }, { "epoch": 0.7, "learning_rate": 0.00043510226227813853, "loss": 2.74, "step": 26061 }, { "epoch": 0.7, "learning_rate": 0.00043503044307684283, "loss": 2.2646, "step": 26062 }, { "epoch": 0.7, "learning_rate": 0.00043495862815565503, "loss": 2.5962, "step": 26063 }, { "epoch": 0.7, "learning_rate": 0.0004348868175151196, "loss": 2.4885, "step": 26064 }, { "epoch": 0.7, "learning_rate": 0.0004348150111557807, "loss": 2.7165, "step": 26065 }, { "epoch": 0.7, "learning_rate": 0.0004347432090781822, "loss": 2.7147, "step": 26066 }, { "epoch": 0.7, "learning_rate": 0.00043467141128286814, "loss": 2.3972, "step": 26067 }, { "epoch": 0.7, "learning_rate": 0.00043459961777038257, "loss": 2.7693, "step": 26068 }, { "epoch": 0.7, "learning_rate": 0.00043452782854126905, "loss": 2.2547, "step": 26069 }, { "epoch": 0.7, "learning_rate": 0.00043445604359607196, "loss": 2.266, "step": 26070 }, { "epoch": 0.7, "learning_rate": 0.00043438426293533427, "loss": 2.3631, "step": 26071 }, { "epoch": 0.7, "learning_rate": 0.0004343124865596004, "loss": 2.653, "step": 26072 }, { "epoch": 0.7, "learning_rate": 0.00043424071446941393, "loss": 2.2727, "step": 26073 }, { "epoch": 0.7, "learning_rate": 0.0004341689466653187, "loss": 2.5652, "step": 26074 }, { "epoch": 0.7, "learning_rate": 0.0004340971831478584, "loss": 2.4241, "step": 26075 }, { "epoch": 0.7, "learning_rate": 0.0004340254239175769, "loss": 2.5201, "step": 26076 }, { "epoch": 0.7, "learning_rate": 0.0004339536689750174, "loss": 2.8962, "step": 26077 }, { "epoch": 0.7, "learning_rate": 0.00043388191832072367, "loss": 1.9516, "step": 26078 }, { "epoch": 0.7, "learning_rate": 0.0004338101719552392, "loss": 2.0926, "step": 26079 }, { "epoch": 0.7, "learning_rate": 0.0004337384298791077, "loss": 2.8757, "step": 26080 }, { "epoch": 0.7, "learning_rate": 0.000433666692092873, "loss": 2.1928, "step": 26081 }, { "epoch": 0.7, "learning_rate": 0.0004335949585970779, "loss": 2.4958, "step": 26082 }, { "epoch": 0.7, "learning_rate": 0.000433523229392266, "loss": 2.7222, "step": 26083 }, { "epoch": 0.7, "learning_rate": 0.0004334515044789813, "loss": 2.4565, "step": 26084 }, { "epoch": 0.7, "learning_rate": 0.0004333797838577662, "loss": 2.2691, "step": 26085 }, { "epoch": 0.7, "learning_rate": 0.0004333080675291644, "loss": 2.5221, "step": 26086 }, { "epoch": 0.7, "learning_rate": 0.00043323635549372, "loss": 2.8692, "step": 26087 }, { "epoch": 0.7, "learning_rate": 0.00043316464775197515, "loss": 2.4153, "step": 26088 }, { "epoch": 0.7, "learning_rate": 0.0004330929443044741, "loss": 2.2353, "step": 26089 }, { "epoch": 0.7, "learning_rate": 0.0004330212451517592, "loss": 2.3684, "step": 26090 }, { "epoch": 0.7, "learning_rate": 0.0004329495502943739, "loss": 2.6107, "step": 26091 }, { "epoch": 0.7, "learning_rate": 0.0004328778597328614, "loss": 2.5069, "step": 26092 }, { "epoch": 0.7, "learning_rate": 0.000432806173467765, "loss": 2.3071, "step": 26093 }, { "epoch": 0.7, "learning_rate": 0.0004327344914996275, "loss": 2.429, "step": 26094 }, { "epoch": 0.7, "learning_rate": 0.00043266281382899253, "loss": 2.3166, "step": 26095 }, { "epoch": 0.7, "learning_rate": 0.0004325911404564021, "loss": 2.2852, "step": 26096 }, { "epoch": 0.7, "learning_rate": 0.0004325194713824003, "loss": 2.6796, "step": 26097 }, { "epoch": 0.7, "learning_rate": 0.0004324478066075291, "loss": 2.7762, "step": 26098 }, { "epoch": 0.7, "learning_rate": 0.00043237614613233155, "loss": 2.5481, "step": 26099 }, { "epoch": 0.7, "learning_rate": 0.0004323044899573515, "loss": 2.49, "step": 26100 }, { "epoch": 0.7, "learning_rate": 0.00043223283808313073, "loss": 2.195, "step": 26101 }, { "epoch": 0.7, "learning_rate": 0.0004321611905102125, "loss": 2.6744, "step": 26102 }, { "epoch": 0.7, "learning_rate": 0.00043208954723913994, "loss": 2.5476, "step": 26103 }, { "epoch": 0.7, "learning_rate": 0.0004320179082704552, "loss": 1.8838, "step": 26104 }, { "epoch": 0.7, "learning_rate": 0.00043194627360470107, "loss": 2.776, "step": 26105 }, { "epoch": 0.7, "learning_rate": 0.00043187464324242043, "loss": 2.1735, "step": 26106 }, { "epoch": 0.7, "learning_rate": 0.0004318030171841559, "loss": 2.3514, "step": 26107 }, { "epoch": 0.7, "learning_rate": 0.00043173139543045057, "loss": 2.743, "step": 26108 }, { "epoch": 0.7, "learning_rate": 0.0004316597779818463, "loss": 3.3373, "step": 26109 }, { "epoch": 0.7, "learning_rate": 0.00043158816483888587, "loss": 2.4459, "step": 26110 }, { "epoch": 0.7, "learning_rate": 0.00043151655600211214, "loss": 2.579, "step": 26111 }, { "epoch": 0.7, "learning_rate": 0.00043144495147206673, "loss": 2.3103, "step": 26112 }, { "epoch": 0.7, "learning_rate": 0.00043137335124929346, "loss": 2.5108, "step": 26113 }, { "epoch": 0.7, "learning_rate": 0.0004313017553343336, "loss": 2.7483, "step": 26114 }, { "epoch": 0.7, "learning_rate": 0.00043123016372772994, "loss": 2.8068, "step": 26115 }, { "epoch": 0.7, "learning_rate": 0.0004311585764300253, "loss": 2.2509, "step": 26116 }, { "epoch": 0.7, "learning_rate": 0.00043108699344176127, "loss": 2.939, "step": 26117 }, { "epoch": 0.7, "learning_rate": 0.0004310154147634804, "loss": 2.8018, "step": 26118 }, { "epoch": 0.7, "learning_rate": 0.000430943840395725, "loss": 2.4482, "step": 26119 }, { "epoch": 0.7, "learning_rate": 0.0004308722703390373, "loss": 2.8231, "step": 26120 }, { "epoch": 0.7, "learning_rate": 0.00043080070459396, "loss": 2.5947, "step": 26121 }, { "epoch": 0.7, "learning_rate": 0.0004307291431610344, "loss": 2.0608, "step": 26122 }, { "epoch": 0.7, "learning_rate": 0.00043065758604080294, "loss": 2.2643, "step": 26123 }, { "epoch": 0.7, "learning_rate": 0.0004305860332338083, "loss": 2.3865, "step": 26124 }, { "epoch": 0.7, "learning_rate": 0.0004305144847405913, "loss": 2.4083, "step": 26125 }, { "epoch": 0.7, "learning_rate": 0.0004304429405616951, "loss": 2.3164, "step": 26126 }, { "epoch": 0.7, "learning_rate": 0.00043037140069766177, "loss": 2.4957, "step": 26127 }, { "epoch": 0.7, "learning_rate": 0.0004302998651490324, "loss": 2.298, "step": 26128 }, { "epoch": 0.7, "learning_rate": 0.00043022833391634954, "loss": 2.6889, "step": 26129 }, { "epoch": 0.7, "learning_rate": 0.00043015680700015524, "loss": 2.497, "step": 26130 }, { "epoch": 0.7, "learning_rate": 0.0004300852844009907, "loss": 2.7905, "step": 26131 }, { "epoch": 0.7, "learning_rate": 0.00043001376611939826, "loss": 2.7193, "step": 26132 }, { "epoch": 0.7, "learning_rate": 0.0004299422521559195, "loss": 2.7169, "step": 26133 }, { "epoch": 0.7, "learning_rate": 0.0004298707425110964, "loss": 2.5441, "step": 26134 }, { "epoch": 0.7, "learning_rate": 0.000429799237185471, "loss": 2.3362, "step": 26135 }, { "epoch": 0.7, "learning_rate": 0.00042972773617958417, "loss": 2.7421, "step": 26136 }, { "epoch": 0.7, "learning_rate": 0.00042965623949397814, "loss": 2.3623, "step": 26137 }, { "epoch": 0.7, "learning_rate": 0.0004295847471291944, "loss": 2.7569, "step": 26138 }, { "epoch": 0.7, "learning_rate": 0.00042951325908577477, "loss": 2.5229, "step": 26139 }, { "epoch": 0.7, "learning_rate": 0.0004294417753642609, "loss": 2.7226, "step": 26140 }, { "epoch": 0.7, "learning_rate": 0.00042937029596519386, "loss": 2.4878, "step": 26141 }, { "epoch": 0.7, "learning_rate": 0.0004292988208891154, "loss": 3.0054, "step": 26142 }, { "epoch": 0.7, "learning_rate": 0.00042922735013656743, "loss": 2.602, "step": 26143 }, { "epoch": 0.7, "learning_rate": 0.00042915588370809067, "loss": 2.5255, "step": 26144 }, { "epoch": 0.7, "learning_rate": 0.0004290844216042269, "loss": 2.634, "step": 26145 }, { "epoch": 0.7, "learning_rate": 0.0004290129638255174, "loss": 2.6249, "step": 26146 }, { "epoch": 0.7, "learning_rate": 0.0004289415103725036, "loss": 2.5127, "step": 26147 }, { "epoch": 0.7, "learning_rate": 0.00042887006124572727, "loss": 2.2592, "step": 26148 }, { "epoch": 0.7, "learning_rate": 0.0004287986164457288, "loss": 2.4442, "step": 26149 }, { "epoch": 0.7, "learning_rate": 0.00042872717597305, "loss": 2.6736, "step": 26150 }, { "epoch": 0.7, "learning_rate": 0.00042865573982823194, "loss": 2.6219, "step": 26151 }, { "epoch": 0.7, "learning_rate": 0.0004285843080118158, "loss": 2.2229, "step": 26152 }, { "epoch": 0.7, "learning_rate": 0.00042851288052434276, "loss": 2.7835, "step": 26153 }, { "epoch": 0.7, "learning_rate": 0.0004284414573663544, "loss": 2.4078, "step": 26154 }, { "epoch": 0.7, "learning_rate": 0.000428370038538391, "loss": 2.5383, "step": 26155 }, { "epoch": 0.7, "learning_rate": 0.0004282986240409943, "loss": 2.4608, "step": 26156 }, { "epoch": 0.7, "learning_rate": 0.00042822721387470467, "loss": 2.5809, "step": 26157 }, { "epoch": 0.7, "learning_rate": 0.0004281558080400635, "loss": 2.5436, "step": 26158 }, { "epoch": 0.7, "learning_rate": 0.0004280844065376116, "loss": 2.6379, "step": 26159 }, { "epoch": 0.7, "learning_rate": 0.00042801300936789, "loss": 2.478, "step": 26160 }, { "epoch": 0.7, "learning_rate": 0.0004279416165314397, "loss": 2.1103, "step": 26161 }, { "epoch": 0.7, "learning_rate": 0.0004278702280288017, "loss": 2.6154, "step": 26162 }, { "epoch": 0.7, "learning_rate": 0.00042779884386051625, "loss": 2.5926, "step": 26163 }, { "epoch": 0.7, "learning_rate": 0.0004277274640271244, "loss": 2.6117, "step": 26164 }, { "epoch": 0.7, "learning_rate": 0.000427656088529167, "loss": 2.6714, "step": 26165 }, { "epoch": 0.7, "learning_rate": 0.00042758471736718476, "loss": 2.7765, "step": 26166 }, { "epoch": 0.7, "learning_rate": 0.00042751335054171867, "loss": 2.3263, "step": 26167 }, { "epoch": 0.7, "learning_rate": 0.0004274419880533088, "loss": 2.1017, "step": 26168 }, { "epoch": 0.7, "learning_rate": 0.000427370629902496, "loss": 2.4324, "step": 26169 }, { "epoch": 0.7, "learning_rate": 0.0004272992760898213, "loss": 2.0777, "step": 26170 }, { "epoch": 0.7, "learning_rate": 0.00042722792661582456, "loss": 2.5301, "step": 26171 }, { "epoch": 0.7, "learning_rate": 0.0004271565814810463, "loss": 2.1947, "step": 26172 }, { "epoch": 0.7, "learning_rate": 0.00042708524068602803, "loss": 2.6873, "step": 26173 }, { "epoch": 0.7, "learning_rate": 0.00042701390423130925, "loss": 1.8445, "step": 26174 }, { "epoch": 0.7, "learning_rate": 0.00042694257211743105, "loss": 2.5194, "step": 26175 }, { "epoch": 0.7, "learning_rate": 0.00042687124434493307, "loss": 2.6038, "step": 26176 }, { "epoch": 0.7, "learning_rate": 0.00042679992091435617, "loss": 2.4799, "step": 26177 }, { "epoch": 0.7, "learning_rate": 0.0004267286018262405, "loss": 2.1934, "step": 26178 }, { "epoch": 0.7, "learning_rate": 0.0004266572870811264, "loss": 2.6147, "step": 26179 }, { "epoch": 0.7, "learning_rate": 0.00042658597667955434, "loss": 2.5531, "step": 26180 }, { "epoch": 0.7, "learning_rate": 0.0004265146706220646, "loss": 2.5788, "step": 26181 }, { "epoch": 0.7, "learning_rate": 0.000426443368909197, "loss": 2.6151, "step": 26182 }, { "epoch": 0.7, "learning_rate": 0.00042637207154149213, "loss": 2.6759, "step": 26183 }, { "epoch": 0.7, "learning_rate": 0.0004263007785194892, "loss": 2.5009, "step": 26184 }, { "epoch": 0.7, "learning_rate": 0.00042622948984372936, "loss": 2.6208, "step": 26185 }, { "epoch": 0.7, "learning_rate": 0.0004261582055147527, "loss": 2.6706, "step": 26186 }, { "epoch": 0.7, "learning_rate": 0.00042608692553309846, "loss": 2.3884, "step": 26187 }, { "epoch": 0.7, "learning_rate": 0.0004260156498993072, "loss": 2.3208, "step": 26188 }, { "epoch": 0.7, "learning_rate": 0.000425944378613919, "loss": 2.1896, "step": 26189 }, { "epoch": 0.7, "learning_rate": 0.0004258731116774732, "loss": 1.9251, "step": 26190 }, { "epoch": 0.7, "learning_rate": 0.0004258018490905101, "loss": 2.5124, "step": 26191 }, { "epoch": 0.7, "learning_rate": 0.00042573059085356955, "loss": 2.5283, "step": 26192 }, { "epoch": 0.7, "learning_rate": 0.0004256593369671913, "loss": 2.2494, "step": 26193 }, { "epoch": 0.7, "learning_rate": 0.0004255880874319157, "loss": 2.8685, "step": 26194 }, { "epoch": 0.7, "learning_rate": 0.00042551684224828156, "loss": 2.451, "step": 26195 }, { "epoch": 0.7, "learning_rate": 0.0004254456014168292, "loss": 2.4128, "step": 26196 }, { "epoch": 0.7, "learning_rate": 0.0004253743649380982, "loss": 2.7841, "step": 26197 }, { "epoch": 0.7, "learning_rate": 0.00042530313281262833, "loss": 2.6536, "step": 26198 }, { "epoch": 0.7, "learning_rate": 0.0004252319050409592, "loss": 2.8311, "step": 26199 }, { "epoch": 0.7, "learning_rate": 0.00042516068162363075, "loss": 2.3719, "step": 26200 }, { "epoch": 0.7, "learning_rate": 0.00042508946256118187, "loss": 2.2172, "step": 26201 }, { "epoch": 0.7, "learning_rate": 0.00042501824785415266, "loss": 2.5517, "step": 26202 }, { "epoch": 0.7, "learning_rate": 0.0004249470375030822, "loss": 2.4298, "step": 26203 }, { "epoch": 0.7, "learning_rate": 0.00042487583150851006, "loss": 2.44, "step": 26204 }, { "epoch": 0.7, "learning_rate": 0.0004248046298709758, "loss": 2.3568, "step": 26205 }, { "epoch": 0.7, "learning_rate": 0.00042473343259101894, "loss": 2.4347, "step": 26206 }, { "epoch": 0.7, "learning_rate": 0.0004246622396691786, "loss": 2.3031, "step": 26207 }, { "epoch": 0.7, "learning_rate": 0.0004245910511059947, "loss": 2.757, "step": 26208 }, { "epoch": 0.7, "learning_rate": 0.00042451986690200585, "loss": 2.0507, "step": 26209 }, { "epoch": 0.7, "learning_rate": 0.0004244486870577515, "loss": 2.6148, "step": 26210 }, { "epoch": 0.7, "learning_rate": 0.000424377511573771, "loss": 2.077, "step": 26211 }, { "epoch": 0.7, "learning_rate": 0.0004243063404506036, "loss": 2.5367, "step": 26212 }, { "epoch": 0.7, "learning_rate": 0.00042423517368878885, "loss": 2.8156, "step": 26213 }, { "epoch": 0.7, "learning_rate": 0.00042416401128886496, "loss": 2.1148, "step": 26214 }, { "epoch": 0.7, "learning_rate": 0.0004240928532513717, "loss": 2.3269, "step": 26215 }, { "epoch": 0.7, "learning_rate": 0.00042402169957684834, "loss": 2.4284, "step": 26216 }, { "epoch": 0.7, "learning_rate": 0.0004239505502658333, "loss": 2.1924, "step": 26217 }, { "epoch": 0.7, "learning_rate": 0.0004238794053188658, "loss": 2.4156, "step": 26218 }, { "epoch": 0.7, "learning_rate": 0.00042380826473648503, "loss": 2.6188, "step": 26219 }, { "epoch": 0.7, "learning_rate": 0.00042373712851922975, "loss": 2.1094, "step": 26220 }, { "epoch": 0.7, "learning_rate": 0.00042366599666763936, "loss": 2.5495, "step": 26221 }, { "epoch": 0.7, "learning_rate": 0.000423594869182252, "loss": 2.4644, "step": 26222 }, { "epoch": 0.7, "learning_rate": 0.00042352374606360687, "loss": 2.6447, "step": 26223 }, { "epoch": 0.7, "learning_rate": 0.0004234526273122428, "loss": 2.5648, "step": 26224 }, { "epoch": 0.7, "learning_rate": 0.0004233815129286984, "loss": 2.0944, "step": 26225 }, { "epoch": 0.7, "learning_rate": 0.0004233104029135131, "loss": 2.3918, "step": 26226 }, { "epoch": 0.7, "learning_rate": 0.00042323929726722457, "loss": 2.1679, "step": 26227 }, { "epoch": 0.7, "learning_rate": 0.0004231681959903722, "loss": 2.8738, "step": 26228 }, { "epoch": 0.7, "learning_rate": 0.0004230970990834946, "loss": 2.3477, "step": 26229 }, { "epoch": 0.7, "learning_rate": 0.00042302600654713, "loss": 2.9037, "step": 26230 }, { "epoch": 0.7, "learning_rate": 0.0004229549183818168, "loss": 2.3158, "step": 26231 }, { "epoch": 0.7, "learning_rate": 0.00042288383458809474, "loss": 2.5669, "step": 26232 }, { "epoch": 0.7, "learning_rate": 0.0004228127551665012, "loss": 2.6465, "step": 26233 }, { "epoch": 0.71, "learning_rate": 0.00042274168011757497, "loss": 2.4871, "step": 26234 }, { "epoch": 0.71, "learning_rate": 0.0004226706094418551, "loss": 2.4386, "step": 26235 }, { "epoch": 0.71, "learning_rate": 0.0004225995431398789, "loss": 2.24, "step": 26236 }, { "epoch": 0.71, "learning_rate": 0.0004225284812121855, "loss": 2.0194, "step": 26237 }, { "epoch": 0.71, "learning_rate": 0.0004224574236593129, "loss": 2.8809, "step": 26238 }, { "epoch": 0.71, "learning_rate": 0.0004223863704817998, "loss": 2.5586, "step": 26239 }, { "epoch": 0.71, "learning_rate": 0.0004223153216801846, "loss": 2.4995, "step": 26240 }, { "epoch": 0.71, "learning_rate": 0.0004222442772550048, "loss": 2.3766, "step": 26241 }, { "epoch": 0.71, "learning_rate": 0.0004221732372067991, "loss": 2.4842, "step": 26242 }, { "epoch": 0.71, "learning_rate": 0.0004221022015361061, "loss": 2.7132, "step": 26243 }, { "epoch": 0.71, "learning_rate": 0.00042203117024346273, "loss": 2.5497, "step": 26244 }, { "epoch": 0.71, "learning_rate": 0.0004219601433294086, "loss": 2.1605, "step": 26245 }, { "epoch": 0.71, "learning_rate": 0.0004218891207944806, "loss": 2.2621, "step": 26246 }, { "epoch": 0.71, "learning_rate": 0.0004218181026392174, "loss": 2.1116, "step": 26247 }, { "epoch": 0.71, "learning_rate": 0.00042174708886415723, "loss": 2.1773, "step": 26248 }, { "epoch": 0.71, "learning_rate": 0.00042167607946983735, "loss": 2.5928, "step": 26249 }, { "epoch": 0.71, "learning_rate": 0.00042160507445679606, "loss": 2.0999, "step": 26250 }, { "epoch": 0.71, "learning_rate": 0.0004215340738255714, "loss": 2.3758, "step": 26251 }, { "epoch": 0.71, "learning_rate": 0.0004214630775767012, "loss": 2.385, "step": 26252 }, { "epoch": 0.71, "learning_rate": 0.0004213920857107235, "loss": 2.3564, "step": 26253 }, { "epoch": 0.71, "learning_rate": 0.00042132109822817565, "loss": 3.0478, "step": 26254 }, { "epoch": 0.71, "learning_rate": 0.00042125011512959576, "loss": 2.4838, "step": 26255 }, { "epoch": 0.71, "learning_rate": 0.0004211791364155219, "loss": 2.559, "step": 26256 }, { "epoch": 0.71, "learning_rate": 0.0004211081620864905, "loss": 2.2622, "step": 26257 }, { "epoch": 0.71, "learning_rate": 0.0004210371921430407, "loss": 2.3998, "step": 26258 }, { "epoch": 0.71, "learning_rate": 0.00042096622658570993, "loss": 2.567, "step": 26259 }, { "epoch": 0.71, "learning_rate": 0.00042089526541503507, "loss": 2.3968, "step": 26260 }, { "epoch": 0.71, "learning_rate": 0.00042082430863155465, "loss": 2.5588, "step": 26261 }, { "epoch": 0.71, "learning_rate": 0.00042075335623580523, "loss": 2.3129, "step": 26262 }, { "epoch": 0.71, "learning_rate": 0.0004206824082283249, "loss": 2.3554, "step": 26263 }, { "epoch": 0.71, "learning_rate": 0.00042061146460965103, "loss": 2.4108, "step": 26264 }, { "epoch": 0.71, "learning_rate": 0.0004205405253803212, "loss": 2.4398, "step": 26265 }, { "epoch": 0.71, "learning_rate": 0.00042046959054087274, "loss": 2.5991, "step": 26266 }, { "epoch": 0.71, "learning_rate": 0.0004203986600918434, "loss": 2.1497, "step": 26267 }, { "epoch": 0.71, "learning_rate": 0.00042032773403376976, "loss": 2.6283, "step": 26268 }, { "epoch": 0.71, "learning_rate": 0.00042025681236718994, "loss": 2.7062, "step": 26269 }, { "epoch": 0.71, "learning_rate": 0.00042018589509264015, "loss": 2.2995, "step": 26270 }, { "epoch": 0.71, "learning_rate": 0.0004201149822106588, "loss": 2.7194, "step": 26271 }, { "epoch": 0.71, "learning_rate": 0.00042004407372178297, "loss": 2.4837, "step": 26272 }, { "epoch": 0.71, "learning_rate": 0.0004199731696265492, "loss": 2.6197, "step": 26273 }, { "epoch": 0.71, "learning_rate": 0.000419902269925495, "loss": 2.3801, "step": 26274 }, { "epoch": 0.71, "learning_rate": 0.00041983137461915776, "loss": 2.4726, "step": 26275 }, { "epoch": 0.71, "learning_rate": 0.00041976048370807406, "loss": 2.5525, "step": 26276 }, { "epoch": 0.71, "learning_rate": 0.00041968959719278123, "loss": 2.4119, "step": 26277 }, { "epoch": 0.71, "learning_rate": 0.0004196187150738161, "loss": 2.2664, "step": 26278 }, { "epoch": 0.71, "learning_rate": 0.000419547837351716, "loss": 1.9591, "step": 26279 }, { "epoch": 0.71, "learning_rate": 0.00041947696402701794, "loss": 3.0207, "step": 26280 }, { "epoch": 0.71, "learning_rate": 0.0004194060951002583, "loss": 2.2336, "step": 26281 }, { "epoch": 0.71, "learning_rate": 0.00041933523057197434, "loss": 2.4043, "step": 26282 }, { "epoch": 0.71, "learning_rate": 0.0004192643704427027, "loss": 2.6807, "step": 26283 }, { "epoch": 0.71, "learning_rate": 0.0004191935147129805, "loss": 2.6414, "step": 26284 }, { "epoch": 0.71, "learning_rate": 0.00041912266338334437, "loss": 2.6985, "step": 26285 }, { "epoch": 0.71, "learning_rate": 0.0004190518164543314, "loss": 2.3567, "step": 26286 }, { "epoch": 0.71, "learning_rate": 0.0004189809739264777, "loss": 2.7353, "step": 26287 }, { "epoch": 0.71, "learning_rate": 0.0004189101358003207, "loss": 2.2857, "step": 26288 }, { "epoch": 0.71, "learning_rate": 0.0004188393020763961, "loss": 2.6021, "step": 26289 }, { "epoch": 0.71, "learning_rate": 0.0004187684727552411, "loss": 2.6407, "step": 26290 }, { "epoch": 0.71, "learning_rate": 0.0004186976478373923, "loss": 2.7339, "step": 26291 }, { "epoch": 0.71, "learning_rate": 0.0004186268273233861, "loss": 2.3102, "step": 26292 }, { "epoch": 0.71, "learning_rate": 0.0004185560112137592, "loss": 2.3339, "step": 26293 }, { "epoch": 0.71, "learning_rate": 0.0004184851995090483, "loss": 2.3171, "step": 26294 }, { "epoch": 0.71, "learning_rate": 0.00041841439220978926, "loss": 2.4604, "step": 26295 }, { "epoch": 0.71, "learning_rate": 0.0004183435893165188, "loss": 2.5378, "step": 26296 }, { "epoch": 0.71, "learning_rate": 0.0004182727908297733, "loss": 2.5001, "step": 26297 }, { "epoch": 0.71, "learning_rate": 0.0004182019967500891, "loss": 2.2765, "step": 26298 }, { "epoch": 0.71, "learning_rate": 0.000418131207078003, "loss": 2.4029, "step": 26299 }, { "epoch": 0.71, "learning_rate": 0.00041806042181405037, "loss": 2.2482, "step": 26300 }, { "epoch": 0.71, "learning_rate": 0.000417989640958768, "loss": 2.9888, "step": 26301 }, { "epoch": 0.71, "learning_rate": 0.0004179188645126925, "loss": 2.7815, "step": 26302 }, { "epoch": 0.71, "learning_rate": 0.0004178480924763591, "loss": 2.5391, "step": 26303 }, { "epoch": 0.71, "learning_rate": 0.0004177773248503046, "loss": 2.623, "step": 26304 }, { "epoch": 0.71, "learning_rate": 0.00041770656163506495, "loss": 2.1438, "step": 26305 }, { "epoch": 0.71, "learning_rate": 0.0004176358028311763, "loss": 2.7603, "step": 26306 }, { "epoch": 0.71, "learning_rate": 0.000417565048439175, "loss": 2.1308, "step": 26307 }, { "epoch": 0.71, "learning_rate": 0.0004174942984595964, "loss": 2.5089, "step": 26308 }, { "epoch": 0.71, "learning_rate": 0.00041742355289297694, "loss": 2.7273, "step": 26309 }, { "epoch": 0.71, "learning_rate": 0.0004173528117398524, "loss": 2.4956, "step": 26310 }, { "epoch": 0.71, "learning_rate": 0.00041728207500075885, "loss": 2.4308, "step": 26311 }, { "epoch": 0.71, "learning_rate": 0.0004172113426762321, "loss": 2.4252, "step": 26312 }, { "epoch": 0.71, "learning_rate": 0.0004171406147668084, "loss": 2.5535, "step": 26313 }, { "epoch": 0.71, "learning_rate": 0.0004170698912730227, "loss": 2.5387, "step": 26314 }, { "epoch": 0.71, "learning_rate": 0.00041699917219541183, "loss": 1.7099, "step": 26315 }, { "epoch": 0.71, "learning_rate": 0.0004169284575345106, "loss": 2.5595, "step": 26316 }, { "epoch": 0.71, "learning_rate": 0.0004168577472908548, "loss": 2.7269, "step": 26317 }, { "epoch": 0.71, "learning_rate": 0.00041678704146498103, "loss": 2.1476, "step": 26318 }, { "epoch": 0.71, "learning_rate": 0.0004167163400574241, "loss": 2.654, "step": 26319 }, { "epoch": 0.71, "learning_rate": 0.0004166456430687199, "loss": 2.5571, "step": 26320 }, { "epoch": 0.71, "learning_rate": 0.0004165749504994044, "loss": 2.3736, "step": 26321 }, { "epoch": 0.71, "learning_rate": 0.00041650426235001237, "loss": 2.3583, "step": 26322 }, { "epoch": 0.71, "learning_rate": 0.0004164335786210798, "loss": 2.2308, "step": 26323 }, { "epoch": 0.71, "learning_rate": 0.00041636289931314195, "loss": 2.8983, "step": 26324 }, { "epoch": 0.71, "learning_rate": 0.00041629222442673454, "loss": 2.839, "step": 26325 }, { "epoch": 0.71, "learning_rate": 0.00041622155396239325, "loss": 2.6333, "step": 26326 }, { "epoch": 0.71, "learning_rate": 0.0004161508879206527, "loss": 2.2526, "step": 26327 }, { "epoch": 0.71, "learning_rate": 0.00041608022630204865, "loss": 2.4803, "step": 26328 }, { "epoch": 0.71, "learning_rate": 0.00041600956910711675, "loss": 2.7333, "step": 26329 }, { "epoch": 0.71, "learning_rate": 0.00041593891633639123, "loss": 2.4542, "step": 26330 }, { "epoch": 0.71, "learning_rate": 0.0004158682679904088, "loss": 2.6522, "step": 26331 }, { "epoch": 0.71, "learning_rate": 0.00041579762406970355, "loss": 2.3871, "step": 26332 }, { "epoch": 0.71, "learning_rate": 0.00041572698457481105, "loss": 2.4997, "step": 26333 }, { "epoch": 0.71, "learning_rate": 0.00041565634950626684, "loss": 2.2274, "step": 26334 }, { "epoch": 0.71, "learning_rate": 0.0004155857188646054, "loss": 2.8344, "step": 26335 }, { "epoch": 0.71, "learning_rate": 0.0004155150926503619, "loss": 2.6898, "step": 26336 }, { "epoch": 0.71, "learning_rate": 0.00041544447086407164, "loss": 2.5583, "step": 26337 }, { "epoch": 0.71, "learning_rate": 0.00041537385350626953, "loss": 2.6338, "step": 26338 }, { "epoch": 0.71, "learning_rate": 0.00041530324057749104, "loss": 2.0368, "step": 26339 }, { "epoch": 0.71, "learning_rate": 0.00041523263207827023, "loss": 2.6955, "step": 26340 }, { "epoch": 0.71, "learning_rate": 0.0004151620280091424, "loss": 2.5316, "step": 26341 }, { "epoch": 0.71, "learning_rate": 0.00041509142837064297, "loss": 2.1918, "step": 26342 }, { "epoch": 0.71, "learning_rate": 0.00041502083316330554, "loss": 2.7971, "step": 26343 }, { "epoch": 0.71, "learning_rate": 0.000414950242387666, "loss": 2.5056, "step": 26344 }, { "epoch": 0.71, "learning_rate": 0.00041487965604425917, "loss": 2.1477, "step": 26345 }, { "epoch": 0.71, "learning_rate": 0.00041480907413361914, "loss": 2.8556, "step": 26346 }, { "epoch": 0.71, "learning_rate": 0.00041473849665628093, "loss": 2.4767, "step": 26347 }, { "epoch": 0.71, "learning_rate": 0.0004146679236127796, "loss": 2.3578, "step": 26348 }, { "epoch": 0.71, "learning_rate": 0.00041459735500364915, "loss": 2.4976, "step": 26349 }, { "epoch": 0.71, "learning_rate": 0.0004145267908294244, "loss": 2.5158, "step": 26350 }, { "epoch": 0.71, "learning_rate": 0.00041445623109064, "loss": 3.0395, "step": 26351 }, { "epoch": 0.71, "learning_rate": 0.0004143856757878305, "loss": 2.2584, "step": 26352 }, { "epoch": 0.71, "learning_rate": 0.0004143151249215309, "loss": 2.3281, "step": 26353 }, { "epoch": 0.71, "learning_rate": 0.0004142445784922747, "loss": 2.6486, "step": 26354 }, { "epoch": 0.71, "learning_rate": 0.00041417403650059693, "loss": 2.1807, "step": 26355 }, { "epoch": 0.71, "learning_rate": 0.00041410349894703194, "loss": 2.3349, "step": 26356 }, { "epoch": 0.71, "learning_rate": 0.00041403296583211404, "loss": 2.1993, "step": 26357 }, { "epoch": 0.71, "learning_rate": 0.0004139624371563779, "loss": 2.3764, "step": 26358 }, { "epoch": 0.71, "learning_rate": 0.0004138919129203573, "loss": 2.2493, "step": 26359 }, { "epoch": 0.71, "learning_rate": 0.0004138213931245869, "loss": 2.4761, "step": 26360 }, { "epoch": 0.71, "learning_rate": 0.000413750877769601, "loss": 2.6905, "step": 26361 }, { "epoch": 0.71, "learning_rate": 0.00041368036685593336, "loss": 2.7712, "step": 26362 }, { "epoch": 0.71, "learning_rate": 0.00041360986038411807, "loss": 2.6004, "step": 26363 }, { "epoch": 0.71, "learning_rate": 0.00041353935835469036, "loss": 2.1895, "step": 26364 }, { "epoch": 0.71, "learning_rate": 0.00041346886076818324, "loss": 2.2266, "step": 26365 }, { "epoch": 0.71, "learning_rate": 0.0004133983676251316, "loss": 2.3599, "step": 26366 }, { "epoch": 0.71, "learning_rate": 0.0004133278789260686, "loss": 2.8691, "step": 26367 }, { "epoch": 0.71, "learning_rate": 0.0004132573946715288, "loss": 2.505, "step": 26368 }, { "epoch": 0.71, "learning_rate": 0.00041318691486204594, "loss": 2.4896, "step": 26369 }, { "epoch": 0.71, "learning_rate": 0.0004131164394981542, "loss": 2.3311, "step": 26370 }, { "epoch": 0.71, "learning_rate": 0.00041304596858038735, "loss": 2.782, "step": 26371 }, { "epoch": 0.71, "learning_rate": 0.0004129755021092797, "loss": 2.4138, "step": 26372 }, { "epoch": 0.71, "learning_rate": 0.0004129050400853643, "loss": 2.6497, "step": 26373 }, { "epoch": 0.71, "learning_rate": 0.0004128345825091758, "loss": 2.6303, "step": 26374 }, { "epoch": 0.71, "learning_rate": 0.00041276412938124707, "loss": 2.5835, "step": 26375 }, { "epoch": 0.71, "learning_rate": 0.000412693680702112, "loss": 2.4002, "step": 26376 }, { "epoch": 0.71, "learning_rate": 0.00041262323647230526, "loss": 2.1384, "step": 26377 }, { "epoch": 0.71, "learning_rate": 0.00041255279669235955, "loss": 2.3943, "step": 26378 }, { "epoch": 0.71, "learning_rate": 0.0004124823613628088, "loss": 2.436, "step": 26379 }, { "epoch": 0.71, "learning_rate": 0.0004124119304841871, "loss": 2.7288, "step": 26380 }, { "epoch": 0.71, "learning_rate": 0.00041234150405702706, "loss": 2.7286, "step": 26381 }, { "epoch": 0.71, "learning_rate": 0.0004122710820818628, "loss": 2.4992, "step": 26382 }, { "epoch": 0.71, "learning_rate": 0.0004122006645592278, "loss": 2.159, "step": 26383 }, { "epoch": 0.71, "learning_rate": 0.00041213025148965546, "loss": 2.7835, "step": 26384 }, { "epoch": 0.71, "learning_rate": 0.0004120598428736795, "loss": 2.5168, "step": 26385 }, { "epoch": 0.71, "learning_rate": 0.0004119894387118328, "loss": 2.2375, "step": 26386 }, { "epoch": 0.71, "learning_rate": 0.0004119190390046489, "loss": 2.3948, "step": 26387 }, { "epoch": 0.71, "learning_rate": 0.0004118486437526616, "loss": 3.3179, "step": 26388 }, { "epoch": 0.71, "learning_rate": 0.0004117782529564031, "loss": 2.7828, "step": 26389 }, { "epoch": 0.71, "learning_rate": 0.0004117078666164078, "loss": 2.3707, "step": 26390 }, { "epoch": 0.71, "learning_rate": 0.00041163748473320883, "loss": 2.3628, "step": 26391 }, { "epoch": 0.71, "learning_rate": 0.0004115671073073388, "loss": 2.4394, "step": 26392 }, { "epoch": 0.71, "learning_rate": 0.00041149673433933144, "loss": 2.7938, "step": 26393 }, { "epoch": 0.71, "learning_rate": 0.0004114263658297193, "loss": 2.6547, "step": 26394 }, { "epoch": 0.71, "learning_rate": 0.0004113560017790358, "loss": 2.4254, "step": 26395 }, { "epoch": 0.71, "learning_rate": 0.00041128564218781394, "loss": 2.3843, "step": 26396 }, { "epoch": 0.71, "learning_rate": 0.0004112152870565868, "loss": 2.6451, "step": 26397 }, { "epoch": 0.71, "learning_rate": 0.00041114493638588745, "loss": 2.5632, "step": 26398 }, { "epoch": 0.71, "learning_rate": 0.00041107459017624906, "loss": 2.4111, "step": 26399 }, { "epoch": 0.71, "learning_rate": 0.0004110042484282039, "loss": 2.9367, "step": 26400 }, { "epoch": 0.71, "learning_rate": 0.00041093391114228574, "loss": 2.1886, "step": 26401 }, { "epoch": 0.71, "learning_rate": 0.0004108635783190262, "loss": 2.257, "step": 26402 }, { "epoch": 0.71, "learning_rate": 0.0004107932499589592, "loss": 2.7839, "step": 26403 }, { "epoch": 0.71, "learning_rate": 0.0004107229260626175, "loss": 2.5495, "step": 26404 }, { "epoch": 0.71, "learning_rate": 0.00041065260663053325, "loss": 2.0014, "step": 26405 }, { "epoch": 0.71, "learning_rate": 0.00041058229166323945, "loss": 2.2777, "step": 26406 }, { "epoch": 0.71, "learning_rate": 0.0004105119811612693, "loss": 2.6834, "step": 26407 }, { "epoch": 0.71, "learning_rate": 0.0004104416751251545, "loss": 2.917, "step": 26408 }, { "epoch": 0.71, "learning_rate": 0.0004103713735554282, "loss": 2.2868, "step": 26409 }, { "epoch": 0.71, "learning_rate": 0.00041030107645262306, "loss": 2.2444, "step": 26410 }, { "epoch": 0.71, "learning_rate": 0.00041023078381727143, "loss": 2.2741, "step": 26411 }, { "epoch": 0.71, "learning_rate": 0.00041016049564990633, "loss": 2.7531, "step": 26412 }, { "epoch": 0.71, "learning_rate": 0.00041009021195105946, "loss": 2.0202, "step": 26413 }, { "epoch": 0.71, "learning_rate": 0.0004100199327212637, "loss": 2.4745, "step": 26414 }, { "epoch": 0.71, "learning_rate": 0.00040994965796105153, "loss": 2.5523, "step": 26415 }, { "epoch": 0.71, "learning_rate": 0.0004098793876709551, "loss": 2.3641, "step": 26416 }, { "epoch": 0.71, "learning_rate": 0.0004098091218515074, "loss": 2.1832, "step": 26417 }, { "epoch": 0.71, "learning_rate": 0.00040973886050323994, "loss": 2.2349, "step": 26418 }, { "epoch": 0.71, "learning_rate": 0.00040966860362668533, "loss": 2.5397, "step": 26419 }, { "epoch": 0.71, "learning_rate": 0.0004095983512223761, "loss": 2.6084, "step": 26420 }, { "epoch": 0.71, "learning_rate": 0.000409528103290844, "loss": 2.634, "step": 26421 }, { "epoch": 0.71, "learning_rate": 0.0004094578598326213, "loss": 2.5688, "step": 26422 }, { "epoch": 0.71, "learning_rate": 0.0004093876208482403, "loss": 2.1005, "step": 26423 }, { "epoch": 0.71, "learning_rate": 0.00040931738633823313, "loss": 2.3317, "step": 26424 }, { "epoch": 0.71, "learning_rate": 0.0004092471563031318, "loss": 2.8282, "step": 26425 }, { "epoch": 0.71, "learning_rate": 0.00040917693074346876, "loss": 2.4704, "step": 26426 }, { "epoch": 0.71, "learning_rate": 0.00040910670965977534, "loss": 2.5577, "step": 26427 }, { "epoch": 0.71, "learning_rate": 0.00040903649305258383, "loss": 2.6233, "step": 26428 }, { "epoch": 0.71, "learning_rate": 0.00040896628092242614, "loss": 2.3993, "step": 26429 }, { "epoch": 0.71, "learning_rate": 0.0004088960732698344, "loss": 2.0314, "step": 26430 }, { "epoch": 0.71, "learning_rate": 0.0004088258700953404, "loss": 2.3371, "step": 26431 }, { "epoch": 0.71, "learning_rate": 0.0004087556713994758, "loss": 2.3164, "step": 26432 }, { "epoch": 0.71, "learning_rate": 0.0004086854771827725, "loss": 2.2794, "step": 26433 }, { "epoch": 0.71, "learning_rate": 0.0004086152874457626, "loss": 2.296, "step": 26434 }, { "epoch": 0.71, "learning_rate": 0.00040854510218897724, "loss": 2.9216, "step": 26435 }, { "epoch": 0.71, "learning_rate": 0.0004084749214129484, "loss": 2.6586, "step": 26436 }, { "epoch": 0.71, "learning_rate": 0.0004084047451182078, "loss": 2.8553, "step": 26437 }, { "epoch": 0.71, "learning_rate": 0.00040833457330528714, "loss": 2.5686, "step": 26438 }, { "epoch": 0.71, "learning_rate": 0.00040826440597471823, "loss": 2.4816, "step": 26439 }, { "epoch": 0.71, "learning_rate": 0.00040819424312703214, "loss": 2.6375, "step": 26440 }, { "epoch": 0.71, "learning_rate": 0.00040812408476276066, "loss": 2.1509, "step": 26441 }, { "epoch": 0.71, "learning_rate": 0.0004080539308824353, "loss": 2.5509, "step": 26442 }, { "epoch": 0.71, "learning_rate": 0.0004079837814865874, "loss": 2.6273, "step": 26443 }, { "epoch": 0.71, "learning_rate": 0.00040791363657574896, "loss": 2.3911, "step": 26444 }, { "epoch": 0.71, "learning_rate": 0.0004078434961504507, "loss": 2.2128, "step": 26445 }, { "epoch": 0.71, "learning_rate": 0.00040777336021122413, "loss": 2.6982, "step": 26446 }, { "epoch": 0.71, "learning_rate": 0.000407703228758601, "loss": 3.0992, "step": 26447 }, { "epoch": 0.71, "learning_rate": 0.0004076331017931121, "loss": 2.5214, "step": 26448 }, { "epoch": 0.71, "learning_rate": 0.0004075629793152885, "loss": 2.6061, "step": 26449 }, { "epoch": 0.71, "learning_rate": 0.00040749286132566256, "loss": 2.6844, "step": 26450 }, { "epoch": 0.71, "learning_rate": 0.0004074227478247644, "loss": 2.5268, "step": 26451 }, { "epoch": 0.71, "learning_rate": 0.0004073526388131259, "loss": 1.9851, "step": 26452 }, { "epoch": 0.71, "learning_rate": 0.0004072825342912776, "loss": 2.3852, "step": 26453 }, { "epoch": 0.71, "learning_rate": 0.0004072124342597507, "loss": 2.6871, "step": 26454 }, { "epoch": 0.71, "learning_rate": 0.0004071423387190766, "loss": 2.4753, "step": 26455 }, { "epoch": 0.71, "learning_rate": 0.000407072247669786, "loss": 2.3239, "step": 26456 }, { "epoch": 0.71, "learning_rate": 0.00040700216111241004, "loss": 2.5526, "step": 26457 }, { "epoch": 0.71, "learning_rate": 0.0004069320790474802, "loss": 2.7528, "step": 26458 }, { "epoch": 0.71, "learning_rate": 0.00040686200147552643, "loss": 2.7627, "step": 26459 }, { "epoch": 0.71, "learning_rate": 0.0004067919283970801, "loss": 2.6419, "step": 26460 }, { "epoch": 0.71, "learning_rate": 0.0004067218598126724, "loss": 2.5719, "step": 26461 }, { "epoch": 0.71, "learning_rate": 0.00040665179572283317, "loss": 2.385, "step": 26462 }, { "epoch": 0.71, "learning_rate": 0.00040658173612809456, "loss": 2.3787, "step": 26463 }, { "epoch": 0.71, "learning_rate": 0.00040651168102898627, "loss": 2.2892, "step": 26464 }, { "epoch": 0.71, "learning_rate": 0.00040644163042603934, "loss": 2.4335, "step": 26465 }, { "epoch": 0.71, "learning_rate": 0.0004063715843197848, "loss": 2.3825, "step": 26466 }, { "epoch": 0.71, "learning_rate": 0.0004063015427107527, "loss": 2.2508, "step": 26467 }, { "epoch": 0.71, "learning_rate": 0.0004062315055994741, "loss": 2.4628, "step": 26468 }, { "epoch": 0.71, "learning_rate": 0.00040616147298647935, "loss": 2.343, "step": 26469 }, { "epoch": 0.71, "learning_rate": 0.00040609144487229907, "loss": 2.0771, "step": 26470 }, { "epoch": 0.71, "learning_rate": 0.0004060214212574642, "loss": 2.3839, "step": 26471 }, { "epoch": 0.71, "learning_rate": 0.00040595140214250445, "loss": 2.4433, "step": 26472 }, { "epoch": 0.71, "learning_rate": 0.0004058813875279508, "loss": 2.4843, "step": 26473 }, { "epoch": 0.71, "learning_rate": 0.00040581137741433384, "loss": 2.2186, "step": 26474 }, { "epoch": 0.71, "learning_rate": 0.00040574137180218294, "loss": 2.2602, "step": 26475 }, { "epoch": 0.71, "learning_rate": 0.0004056713706920294, "loss": 2.7143, "step": 26476 }, { "epoch": 0.71, "learning_rate": 0.00040560137408440376, "loss": 2.6112, "step": 26477 }, { "epoch": 0.71, "learning_rate": 0.0004055313819798355, "loss": 2.7875, "step": 26478 }, { "epoch": 0.71, "learning_rate": 0.00040546139437885566, "loss": 2.7337, "step": 26479 }, { "epoch": 0.71, "learning_rate": 0.00040539141128199355, "loss": 2.8939, "step": 26480 }, { "epoch": 0.71, "learning_rate": 0.0004053214326897797, "loss": 2.2658, "step": 26481 }, { "epoch": 0.71, "learning_rate": 0.00040525145860274446, "loss": 2.7039, "step": 26482 }, { "epoch": 0.71, "learning_rate": 0.0004051814890214178, "loss": 2.2054, "step": 26483 }, { "epoch": 0.71, "learning_rate": 0.0004051115239463299, "loss": 2.2727, "step": 26484 }, { "epoch": 0.71, "learning_rate": 0.0004050415633780111, "loss": 2.2572, "step": 26485 }, { "epoch": 0.71, "learning_rate": 0.00040497160731699065, "loss": 2.1558, "step": 26486 }, { "epoch": 0.71, "learning_rate": 0.0004049016557637992, "loss": 2.4441, "step": 26487 }, { "epoch": 0.71, "learning_rate": 0.0004048317087189658, "loss": 2.682, "step": 26488 }, { "epoch": 0.71, "learning_rate": 0.0004047617661830213, "loss": 2.8716, "step": 26489 }, { "epoch": 0.71, "learning_rate": 0.00040469182815649563, "loss": 2.441, "step": 26490 }, { "epoch": 0.71, "learning_rate": 0.00040462189463991784, "loss": 1.775, "step": 26491 }, { "epoch": 0.71, "learning_rate": 0.00040455196563381814, "loss": 2.7539, "step": 26492 }, { "epoch": 0.71, "learning_rate": 0.00040448204113872666, "loss": 2.726, "step": 26493 }, { "epoch": 0.71, "learning_rate": 0.00040441212115517247, "loss": 2.3458, "step": 26494 }, { "epoch": 0.71, "learning_rate": 0.0004043422056836855, "loss": 2.3522, "step": 26495 }, { "epoch": 0.71, "learning_rate": 0.0004042722947247954, "loss": 2.4847, "step": 26496 }, { "epoch": 0.71, "learning_rate": 0.000404202388279032, "loss": 2.6868, "step": 26497 }, { "epoch": 0.71, "learning_rate": 0.0004041324863469251, "loss": 2.261, "step": 26498 }, { "epoch": 0.71, "learning_rate": 0.0004040625889290037, "loss": 2.6154, "step": 26499 }, { "epoch": 0.71, "learning_rate": 0.0004039926960257975, "loss": 2.7399, "step": 26500 }, { "epoch": 0.71, "learning_rate": 0.0004039228076378361, "loss": 2.0517, "step": 26501 }, { "epoch": 0.71, "learning_rate": 0.00040385292376564884, "loss": 2.5445, "step": 26502 }, { "epoch": 0.71, "learning_rate": 0.0004037830444097654, "loss": 2.5054, "step": 26503 }, { "epoch": 0.71, "learning_rate": 0.00040371316957071526, "loss": 2.0559, "step": 26504 }, { "epoch": 0.71, "learning_rate": 0.00040364329924902733, "loss": 2.3461, "step": 26505 }, { "epoch": 0.71, "learning_rate": 0.0004035734334452313, "loss": 2.5439, "step": 26506 }, { "epoch": 0.71, "learning_rate": 0.0004035035721598561, "loss": 2.2353, "step": 26507 }, { "epoch": 0.71, "learning_rate": 0.0004034337153934311, "loss": 2.4114, "step": 26508 }, { "epoch": 0.71, "learning_rate": 0.00040336386314648577, "loss": 2.6827, "step": 26509 }, { "epoch": 0.71, "learning_rate": 0.000403294015419549, "loss": 2.6298, "step": 26510 }, { "epoch": 0.71, "learning_rate": 0.0004032241722131501, "loss": 2.364, "step": 26511 }, { "epoch": 0.71, "learning_rate": 0.0004031543335278186, "loss": 2.2792, "step": 26512 }, { "epoch": 0.71, "learning_rate": 0.00040308449936408275, "loss": 2.7764, "step": 26513 }, { "epoch": 0.71, "learning_rate": 0.000403014669722472, "loss": 2.5357, "step": 26514 }, { "epoch": 0.71, "learning_rate": 0.00040294484460351546, "loss": 2.5736, "step": 26515 }, { "epoch": 0.71, "learning_rate": 0.000402875024007742, "loss": 2.3526, "step": 26516 }, { "epoch": 0.71, "learning_rate": 0.0004028052079356809, "loss": 2.1409, "step": 26517 }, { "epoch": 0.71, "learning_rate": 0.0004027353963878605, "loss": 2.3155, "step": 26518 }, { "epoch": 0.71, "learning_rate": 0.0004026655893648099, "loss": 2.6724, "step": 26519 }, { "epoch": 0.71, "learning_rate": 0.00040259578686705844, "loss": 2.6877, "step": 26520 }, { "epoch": 0.71, "learning_rate": 0.0004025259888951337, "loss": 2.2207, "step": 26521 }, { "epoch": 0.71, "learning_rate": 0.0004024561954495659, "loss": 2.4749, "step": 26522 }, { "epoch": 0.71, "learning_rate": 0.00040238640653088287, "loss": 2.5012, "step": 26523 }, { "epoch": 0.71, "learning_rate": 0.00040231662213961365, "loss": 2.5423, "step": 26524 }, { "epoch": 0.71, "learning_rate": 0.00040224684227628706, "loss": 2.4686, "step": 26525 }, { "epoch": 0.71, "learning_rate": 0.0004021770669414313, "loss": 2.2689, "step": 26526 }, { "epoch": 0.71, "learning_rate": 0.00040210729613557506, "loss": 2.0753, "step": 26527 }, { "epoch": 0.71, "learning_rate": 0.00040203752985924714, "loss": 2.3943, "step": 26528 }, { "epoch": 0.71, "learning_rate": 0.000401967768112976, "loss": 2.4286, "step": 26529 }, { "epoch": 0.71, "learning_rate": 0.0004018980108972905, "loss": 2.732, "step": 26530 }, { "epoch": 0.71, "learning_rate": 0.0004018282582127183, "loss": 2.4129, "step": 26531 }, { "epoch": 0.71, "learning_rate": 0.00040175851005978824, "loss": 2.5133, "step": 26532 }, { "epoch": 0.71, "learning_rate": 0.0004016887664390293, "loss": 2.4758, "step": 26533 }, { "epoch": 0.71, "learning_rate": 0.0004016190273509685, "loss": 2.7984, "step": 26534 }, { "epoch": 0.71, "learning_rate": 0.00040154929279613517, "loss": 2.187, "step": 26535 }, { "epoch": 0.71, "learning_rate": 0.00040147956277505794, "loss": 2.5671, "step": 26536 }, { "epoch": 0.71, "learning_rate": 0.0004014098372882641, "loss": 2.2616, "step": 26537 }, { "epoch": 0.71, "learning_rate": 0.0004013401163362823, "loss": 2.5305, "step": 26538 }, { "epoch": 0.71, "learning_rate": 0.0004012703999196412, "loss": 2.5348, "step": 26539 }, { "epoch": 0.71, "learning_rate": 0.0004012006880388681, "loss": 2.0523, "step": 26540 }, { "epoch": 0.71, "learning_rate": 0.0004011309806944915, "loss": 2.5606, "step": 26541 }, { "epoch": 0.71, "learning_rate": 0.0004010612778870395, "loss": 2.5384, "step": 26542 }, { "epoch": 0.71, "learning_rate": 0.00040099157961704025, "loss": 2.4611, "step": 26543 }, { "epoch": 0.71, "learning_rate": 0.0004009218858850221, "loss": 2.4722, "step": 26544 }, { "epoch": 0.71, "learning_rate": 0.0004008521966915122, "loss": 2.6773, "step": 26545 }, { "epoch": 0.71, "learning_rate": 0.0004007825120370389, "loss": 2.8724, "step": 26546 }, { "epoch": 0.71, "learning_rate": 0.00040071283192213026, "loss": 2.1173, "step": 26547 }, { "epoch": 0.71, "learning_rate": 0.00040064315634731395, "loss": 2.5881, "step": 26548 }, { "epoch": 0.71, "learning_rate": 0.00040057348531311846, "loss": 2.5592, "step": 26549 }, { "epoch": 0.71, "learning_rate": 0.0004005038188200706, "loss": 2.4182, "step": 26550 }, { "epoch": 0.71, "learning_rate": 0.00040043415686869855, "loss": 2.1567, "step": 26551 }, { "epoch": 0.71, "learning_rate": 0.0004003644994595306, "loss": 2.7983, "step": 26552 }, { "epoch": 0.71, "learning_rate": 0.0004002948465930937, "loss": 2.3683, "step": 26553 }, { "epoch": 0.71, "learning_rate": 0.00040022519826991566, "loss": 2.2819, "step": 26554 }, { "epoch": 0.71, "learning_rate": 0.0004001555544905244, "loss": 2.5375, "step": 26555 }, { "epoch": 0.71, "learning_rate": 0.00040008591525544744, "loss": 2.4203, "step": 26556 }, { "epoch": 0.71, "learning_rate": 0.00040001628056521266, "loss": 2.4991, "step": 26557 }, { "epoch": 0.71, "learning_rate": 0.00039994665042034685, "loss": 2.561, "step": 26558 }, { "epoch": 0.71, "learning_rate": 0.000399877024821378, "loss": 1.9969, "step": 26559 }, { "epoch": 0.71, "learning_rate": 0.0003998074037688335, "loss": 2.5221, "step": 26560 }, { "epoch": 0.71, "learning_rate": 0.0003997377872632408, "loss": 2.7997, "step": 26561 }, { "epoch": 0.71, "learning_rate": 0.00039966817530512734, "loss": 2.5507, "step": 26562 }, { "epoch": 0.71, "learning_rate": 0.0003995985678950208, "loss": 2.5258, "step": 26563 }, { "epoch": 0.71, "learning_rate": 0.0003995289650334478, "loss": 2.5818, "step": 26564 }, { "epoch": 0.71, "learning_rate": 0.0003994593667209363, "loss": 2.4703, "step": 26565 }, { "epoch": 0.71, "learning_rate": 0.000399389772958013, "loss": 2.5378, "step": 26566 }, { "epoch": 0.71, "learning_rate": 0.0003993201837452054, "loss": 2.2386, "step": 26567 }, { "epoch": 0.71, "learning_rate": 0.00039925059908304064, "loss": 2.5535, "step": 26568 }, { "epoch": 0.71, "learning_rate": 0.00039918101897204597, "loss": 2.339, "step": 26569 }, { "epoch": 0.71, "learning_rate": 0.00039911144341274853, "loss": 2.2071, "step": 26570 }, { "epoch": 0.71, "learning_rate": 0.0003990418724056757, "loss": 2.6807, "step": 26571 }, { "epoch": 0.71, "learning_rate": 0.0003989723059513538, "loss": 2.5745, "step": 26572 }, { "epoch": 0.71, "learning_rate": 0.00039890274405031027, "loss": 2.5942, "step": 26573 }, { "epoch": 0.71, "learning_rate": 0.00039883318670307213, "loss": 2.1499, "step": 26574 }, { "epoch": 0.71, "learning_rate": 0.0003987636339101662, "loss": 2.8624, "step": 26575 }, { "epoch": 0.71, "learning_rate": 0.00039869408567211995, "loss": 2.3587, "step": 26576 }, { "epoch": 0.71, "learning_rate": 0.0003986245419894594, "loss": 2.7929, "step": 26577 }, { "epoch": 0.71, "learning_rate": 0.00039855500286271173, "loss": 2.675, "step": 26578 }, { "epoch": 0.71, "learning_rate": 0.0003984854682924043, "loss": 2.1789, "step": 26579 }, { "epoch": 0.71, "learning_rate": 0.00039841593827906295, "loss": 2.6129, "step": 26580 }, { "epoch": 0.71, "learning_rate": 0.0003983464128232147, "loss": 1.9978, "step": 26581 }, { "epoch": 0.71, "learning_rate": 0.0003982768919253871, "loss": 2.1514, "step": 26582 }, { "epoch": 0.71, "learning_rate": 0.00039820737558610576, "loss": 2.739, "step": 26583 }, { "epoch": 0.71, "learning_rate": 0.00039813786380589824, "loss": 2.8792, "step": 26584 }, { "epoch": 0.71, "learning_rate": 0.00039806835658529017, "loss": 2.2661, "step": 26585 }, { "epoch": 0.71, "learning_rate": 0.00039799885392480873, "loss": 2.6759, "step": 26586 }, { "epoch": 0.71, "learning_rate": 0.00039792935582498026, "loss": 1.9463, "step": 26587 }, { "epoch": 0.71, "learning_rate": 0.0003978598622863314, "loss": 2.9132, "step": 26588 }, { "epoch": 0.71, "learning_rate": 0.00039779037330938863, "loss": 2.9212, "step": 26589 }, { "epoch": 0.71, "learning_rate": 0.0003977208888946785, "loss": 2.5813, "step": 26590 }, { "epoch": 0.71, "learning_rate": 0.000397651409042727, "loss": 2.887, "step": 26591 }, { "epoch": 0.71, "learning_rate": 0.00039758193375406115, "loss": 3.0918, "step": 26592 }, { "epoch": 0.71, "learning_rate": 0.00039751246302920643, "loss": 2.9488, "step": 26593 }, { "epoch": 0.71, "learning_rate": 0.00039744299686868923, "loss": 2.323, "step": 26594 }, { "epoch": 0.71, "learning_rate": 0.0003973735352730369, "loss": 2.4409, "step": 26595 }, { "epoch": 0.71, "learning_rate": 0.00039730407824277447, "loss": 2.203, "step": 26596 }, { "epoch": 0.71, "learning_rate": 0.00039723462577842875, "loss": 2.5777, "step": 26597 }, { "epoch": 0.71, "learning_rate": 0.00039716517788052595, "loss": 2.355, "step": 26598 }, { "epoch": 0.71, "learning_rate": 0.0003970957345495917, "loss": 2.4104, "step": 26599 }, { "epoch": 0.71, "learning_rate": 0.00039702629578615233, "loss": 2.3791, "step": 26600 }, { "epoch": 0.71, "learning_rate": 0.00039695686159073394, "loss": 2.5367, "step": 26601 }, { "epoch": 0.71, "learning_rate": 0.0003968874319638627, "loss": 2.6967, "step": 26602 }, { "epoch": 0.71, "learning_rate": 0.0003968180069060646, "loss": 2.4177, "step": 26603 }, { "epoch": 0.71, "learning_rate": 0.00039674858641786527, "loss": 2.8501, "step": 26604 }, { "epoch": 0.71, "learning_rate": 0.00039667917049979065, "loss": 2.3838, "step": 26605 }, { "epoch": 0.72, "learning_rate": 0.0003966097591523672, "loss": 2.5068, "step": 26606 }, { "epoch": 0.72, "learning_rate": 0.0003965403523761196, "loss": 2.5786, "step": 26607 }, { "epoch": 0.72, "learning_rate": 0.0003964709501715747, "loss": 2.6803, "step": 26608 }, { "epoch": 0.72, "learning_rate": 0.0003964015525392585, "loss": 2.6541, "step": 26609 }, { "epoch": 0.72, "learning_rate": 0.00039633215947969583, "loss": 2.4082, "step": 26610 }, { "epoch": 0.72, "learning_rate": 0.00039626277099341303, "loss": 2.2508, "step": 26611 }, { "epoch": 0.72, "learning_rate": 0.0003961933870809352, "loss": 2.7245, "step": 26612 }, { "epoch": 0.72, "learning_rate": 0.00039612400774278843, "loss": 2.0895, "step": 26613 }, { "epoch": 0.72, "learning_rate": 0.00039605463297949815, "loss": 1.9668, "step": 26614 }, { "epoch": 0.72, "learning_rate": 0.00039598526279159, "loss": 2.4681, "step": 26615 }, { "epoch": 0.72, "learning_rate": 0.0003959158971795895, "loss": 2.3726, "step": 26616 }, { "epoch": 0.72, "learning_rate": 0.00039584653614402256, "loss": 2.4831, "step": 26617 }, { "epoch": 0.72, "learning_rate": 0.00039577717968541383, "loss": 2.5983, "step": 26618 }, { "epoch": 0.72, "learning_rate": 0.0003957078278042896, "loss": 2.5697, "step": 26619 }, { "epoch": 0.72, "learning_rate": 0.00039563848050117403, "loss": 2.3567, "step": 26620 }, { "epoch": 0.72, "learning_rate": 0.00039556913777659365, "loss": 2.4171, "step": 26621 }, { "epoch": 0.72, "learning_rate": 0.00039549979963107387, "loss": 2.5095, "step": 26622 }, { "epoch": 0.72, "learning_rate": 0.0003954304660651391, "loss": 2.5847, "step": 26623 }, { "epoch": 0.72, "learning_rate": 0.00039536113707931497, "loss": 2.7585, "step": 26624 }, { "epoch": 0.72, "learning_rate": 0.0003952918126741273, "loss": 2.4515, "step": 26625 }, { "epoch": 0.72, "learning_rate": 0.0003952224928501003, "loss": 2.7026, "step": 26626 }, { "epoch": 0.72, "learning_rate": 0.0003951531776077595, "loss": 2.0927, "step": 26627 }, { "epoch": 0.72, "learning_rate": 0.0003950838669476301, "loss": 2.5397, "step": 26628 }, { "epoch": 0.72, "learning_rate": 0.00039501456087023725, "loss": 2.522, "step": 26629 }, { "epoch": 0.72, "learning_rate": 0.00039494525937610627, "loss": 2.2278, "step": 26630 }, { "epoch": 0.72, "learning_rate": 0.00039487596246576143, "loss": 2.2193, "step": 26631 }, { "epoch": 0.72, "learning_rate": 0.00039480667013972815, "loss": 2.4397, "step": 26632 }, { "epoch": 0.72, "learning_rate": 0.0003947373823985313, "loss": 2.9135, "step": 26633 }, { "epoch": 0.72, "learning_rate": 0.00039466809924269586, "loss": 2.3684, "step": 26634 }, { "epoch": 0.72, "learning_rate": 0.000394598820672747, "loss": 2.5303, "step": 26635 }, { "epoch": 0.72, "learning_rate": 0.00039452954668920895, "loss": 2.527, "step": 26636 }, { "epoch": 0.72, "learning_rate": 0.0003944602772926067, "loss": 2.6486, "step": 26637 }, { "epoch": 0.72, "learning_rate": 0.00039439101248346566, "loss": 2.5828, "step": 26638 }, { "epoch": 0.72, "learning_rate": 0.00039432175226230946, "loss": 2.3028, "step": 26639 }, { "epoch": 0.72, "learning_rate": 0.00039425249662966355, "loss": 2.1936, "step": 26640 }, { "epoch": 0.72, "learning_rate": 0.00039418324558605235, "loss": 2.5932, "step": 26641 }, { "epoch": 0.72, "learning_rate": 0.00039411399913200063, "loss": 2.4835, "step": 26642 }, { "epoch": 0.72, "learning_rate": 0.00039404475726803324, "loss": 2.7217, "step": 26643 }, { "epoch": 0.72, "learning_rate": 0.0003939755199946741, "loss": 2.8661, "step": 26644 }, { "epoch": 0.72, "learning_rate": 0.00039390628731244805, "loss": 2.5712, "step": 26645 }, { "epoch": 0.72, "learning_rate": 0.00039383705922187964, "loss": 2.8217, "step": 26646 }, { "epoch": 0.72, "learning_rate": 0.0003937678357234933, "loss": 2.3964, "step": 26647 }, { "epoch": 0.72, "learning_rate": 0.0003936986168178134, "loss": 2.4056, "step": 26648 }, { "epoch": 0.72, "learning_rate": 0.0003936294025053647, "loss": 2.3263, "step": 26649 }, { "epoch": 0.72, "learning_rate": 0.000393560192786671, "loss": 2.0289, "step": 26650 }, { "epoch": 0.72, "learning_rate": 0.00039349098766225675, "loss": 2.5299, "step": 26651 }, { "epoch": 0.72, "learning_rate": 0.00039342178713264674, "loss": 2.7084, "step": 26652 }, { "epoch": 0.72, "learning_rate": 0.00039335259119836454, "loss": 2.198, "step": 26653 }, { "epoch": 0.72, "learning_rate": 0.0003932833998599346, "loss": 2.1578, "step": 26654 }, { "epoch": 0.72, "learning_rate": 0.0003932142131178812, "loss": 2.5032, "step": 26655 }, { "epoch": 0.72, "learning_rate": 0.00039314503097272836, "loss": 2.539, "step": 26656 }, { "epoch": 0.72, "learning_rate": 0.00039307585342500064, "loss": 2.0903, "step": 26657 }, { "epoch": 0.72, "learning_rate": 0.00039300668047522136, "loss": 2.326, "step": 26658 }, { "epoch": 0.72, "learning_rate": 0.00039293751212391505, "loss": 2.1793, "step": 26659 }, { "epoch": 0.72, "learning_rate": 0.0003928683483716056, "loss": 2.5712, "step": 26660 }, { "epoch": 0.72, "learning_rate": 0.0003927991892188169, "loss": 2.9551, "step": 26661 }, { "epoch": 0.72, "learning_rate": 0.0003927300346660734, "loss": 2.1918, "step": 26662 }, { "epoch": 0.72, "learning_rate": 0.00039266088471389814, "loss": 2.2702, "step": 26663 }, { "epoch": 0.72, "learning_rate": 0.00039259173936281557, "loss": 2.8212, "step": 26664 }, { "epoch": 0.72, "learning_rate": 0.0003925225986133497, "loss": 2.5777, "step": 26665 }, { "epoch": 0.72, "learning_rate": 0.00039245346246602367, "loss": 2.6423, "step": 26666 }, { "epoch": 0.72, "learning_rate": 0.0003923843309213613, "loss": 2.2403, "step": 26667 }, { "epoch": 0.72, "learning_rate": 0.0003923152039798872, "loss": 2.4585, "step": 26668 }, { "epoch": 0.72, "learning_rate": 0.00039224608164212417, "loss": 2.2363, "step": 26669 }, { "epoch": 0.72, "learning_rate": 0.0003921769639085965, "loss": 2.7823, "step": 26670 }, { "epoch": 0.72, "learning_rate": 0.0003921078507798271, "loss": 2.6703, "step": 26671 }, { "epoch": 0.72, "learning_rate": 0.00039203874225633993, "loss": 2.0996, "step": 26672 }, { "epoch": 0.72, "learning_rate": 0.0003919696383386586, "loss": 2.5966, "step": 26673 }, { "epoch": 0.72, "learning_rate": 0.0003919005390273066, "loss": 2.7283, "step": 26674 }, { "epoch": 0.72, "learning_rate": 0.00039183144432280737, "loss": 2.4218, "step": 26675 }, { "epoch": 0.72, "learning_rate": 0.00039176235422568484, "loss": 2.4898, "step": 26676 }, { "epoch": 0.72, "learning_rate": 0.0003916932687364615, "loss": 2.3723, "step": 26677 }, { "epoch": 0.72, "learning_rate": 0.00039162418785566156, "loss": 2.771, "step": 26678 }, { "epoch": 0.72, "learning_rate": 0.00039155511158380776, "loss": 2.7703, "step": 26679 }, { "epoch": 0.72, "learning_rate": 0.0003914860399214232, "loss": 2.5077, "step": 26680 }, { "epoch": 0.72, "learning_rate": 0.0003914169728690323, "loss": 2.6306, "step": 26681 }, { "epoch": 0.72, "learning_rate": 0.00039134791042715733, "loss": 2.5772, "step": 26682 }, { "epoch": 0.72, "learning_rate": 0.00039127885259632167, "loss": 2.6668, "step": 26683 }, { "epoch": 0.72, "learning_rate": 0.00039120979937704904, "loss": 2.8002, "step": 26684 }, { "epoch": 0.72, "learning_rate": 0.00039114075076986175, "loss": 2.4801, "step": 26685 }, { "epoch": 0.72, "learning_rate": 0.00039107170677528326, "loss": 2.9156, "step": 26686 }, { "epoch": 0.72, "learning_rate": 0.0003910026673938367, "loss": 2.9067, "step": 26687 }, { "epoch": 0.72, "learning_rate": 0.0003909336326260451, "loss": 2.6249, "step": 26688 }, { "epoch": 0.72, "learning_rate": 0.00039086460247243163, "loss": 2.6302, "step": 26689 }, { "epoch": 0.72, "learning_rate": 0.00039079557693351874, "loss": 2.645, "step": 26690 }, { "epoch": 0.72, "learning_rate": 0.00039072655600982963, "loss": 2.591, "step": 26691 }, { "epoch": 0.72, "learning_rate": 0.0003906575397018872, "loss": 3.0485, "step": 26692 }, { "epoch": 0.72, "learning_rate": 0.00039058852801021436, "loss": 2.4563, "step": 26693 }, { "epoch": 0.72, "learning_rate": 0.0003905195209353338, "loss": 2.618, "step": 26694 }, { "epoch": 0.72, "learning_rate": 0.0003904505184777688, "loss": 2.5207, "step": 26695 }, { "epoch": 0.72, "learning_rate": 0.00039038152063804133, "loss": 2.318, "step": 26696 }, { "epoch": 0.72, "learning_rate": 0.00039031252741667476, "loss": 2.0723, "step": 26697 }, { "epoch": 0.72, "learning_rate": 0.00039024353881419115, "loss": 2.5133, "step": 26698 }, { "epoch": 0.72, "learning_rate": 0.00039017455483111353, "loss": 2.5395, "step": 26699 }, { "epoch": 0.72, "learning_rate": 0.0003901055754679644, "loss": 2.5096, "step": 26700 }, { "epoch": 0.72, "learning_rate": 0.0003900366007252665, "loss": 2.3396, "step": 26701 }, { "epoch": 0.72, "learning_rate": 0.0003899676306035421, "loss": 2.4644, "step": 26702 }, { "epoch": 0.72, "learning_rate": 0.0003898986651033144, "loss": 2.4212, "step": 26703 }, { "epoch": 0.72, "learning_rate": 0.0003898297042251049, "loss": 2.2196, "step": 26704 }, { "epoch": 0.72, "learning_rate": 0.0003897607479694364, "loss": 2.6783, "step": 26705 }, { "epoch": 0.72, "learning_rate": 0.0003896917963368315, "loss": 2.3325, "step": 26706 }, { "epoch": 0.72, "learning_rate": 0.00038962284932781235, "loss": 2.2177, "step": 26707 }, { "epoch": 0.72, "learning_rate": 0.0003895539069429017, "loss": 2.5771, "step": 26708 }, { "epoch": 0.72, "learning_rate": 0.0003894849691826212, "loss": 2.1918, "step": 26709 }, { "epoch": 0.72, "learning_rate": 0.00038941603604749345, "loss": 2.4842, "step": 26710 }, { "epoch": 0.72, "learning_rate": 0.00038934710753804093, "loss": 2.6105, "step": 26711 }, { "epoch": 0.72, "learning_rate": 0.0003892781836547853, "loss": 2.4623, "step": 26712 }, { "epoch": 0.72, "learning_rate": 0.0003892092643982489, "loss": 2.0323, "step": 26713 }, { "epoch": 0.72, "learning_rate": 0.000389140349768954, "loss": 2.3782, "step": 26714 }, { "epoch": 0.72, "learning_rate": 0.0003890714397674224, "loss": 2.3947, "step": 26715 }, { "epoch": 0.72, "learning_rate": 0.00038900253439417686, "loss": 2.4342, "step": 26716 }, { "epoch": 0.72, "learning_rate": 0.0003889336336497384, "loss": 2.4814, "step": 26717 }, { "epoch": 0.72, "learning_rate": 0.0003888647375346297, "loss": 2.5438, "step": 26718 }, { "epoch": 0.72, "learning_rate": 0.00038879584604937237, "loss": 2.2393, "step": 26719 }, { "epoch": 0.72, "learning_rate": 0.0003887269591944884, "loss": 2.4723, "step": 26720 }, { "epoch": 0.72, "learning_rate": 0.0003886580769704997, "loss": 2.4597, "step": 26721 }, { "epoch": 0.72, "learning_rate": 0.00038858919937792845, "loss": 2.6192, "step": 26722 }, { "epoch": 0.72, "learning_rate": 0.00038852032641729586, "loss": 2.5598, "step": 26723 }, { "epoch": 0.72, "learning_rate": 0.0003884514580891243, "loss": 2.3141, "step": 26724 }, { "epoch": 0.72, "learning_rate": 0.00038838259439393473, "loss": 2.3464, "step": 26725 }, { "epoch": 0.72, "learning_rate": 0.000388313735332249, "loss": 2.5308, "step": 26726 }, { "epoch": 0.72, "learning_rate": 0.00038824488090458966, "loss": 2.799, "step": 26727 }, { "epoch": 0.72, "learning_rate": 0.0003881760311114775, "loss": 2.6736, "step": 26728 }, { "epoch": 0.72, "learning_rate": 0.0003881071859534342, "loss": 2.2592, "step": 26729 }, { "epoch": 0.72, "learning_rate": 0.00038803834543098194, "loss": 2.2202, "step": 26730 }, { "epoch": 0.72, "learning_rate": 0.0003879695095446414, "loss": 2.4727, "step": 26731 }, { "epoch": 0.72, "learning_rate": 0.0003879006782949344, "loss": 2.5242, "step": 26732 }, { "epoch": 0.72, "learning_rate": 0.00038783185168238233, "loss": 2.7228, "step": 26733 }, { "epoch": 0.72, "learning_rate": 0.00038776302970750686, "loss": 2.8811, "step": 26734 }, { "epoch": 0.72, "learning_rate": 0.0003876942123708295, "loss": 2.6169, "step": 26735 }, { "epoch": 0.72, "learning_rate": 0.00038762539967287103, "loss": 2.7856, "step": 26736 }, { "epoch": 0.72, "learning_rate": 0.0003875565916141529, "loss": 2.3102, "step": 26737 }, { "epoch": 0.72, "learning_rate": 0.00038748778819519704, "loss": 2.1207, "step": 26738 }, { "epoch": 0.72, "learning_rate": 0.0003874189894165234, "loss": 2.8674, "step": 26739 }, { "epoch": 0.72, "learning_rate": 0.0003873501952786548, "loss": 2.365, "step": 26740 }, { "epoch": 0.72, "learning_rate": 0.00038728140578211115, "loss": 2.3293, "step": 26741 }, { "epoch": 0.72, "learning_rate": 0.00038721262092741404, "loss": 2.3489, "step": 26742 }, { "epoch": 0.72, "learning_rate": 0.0003871438407150849, "loss": 2.2979, "step": 26743 }, { "epoch": 0.72, "learning_rate": 0.00038707506514564405, "loss": 2.3419, "step": 26744 }, { "epoch": 0.72, "learning_rate": 0.000387006294219613, "loss": 2.9006, "step": 26745 }, { "epoch": 0.72, "learning_rate": 0.0003869375279375127, "loss": 2.9908, "step": 26746 }, { "epoch": 0.72, "learning_rate": 0.000386868766299864, "loss": 2.4228, "step": 26747 }, { "epoch": 0.72, "learning_rate": 0.0003868000093071883, "loss": 2.5269, "step": 26748 }, { "epoch": 0.72, "learning_rate": 0.00038673125696000565, "loss": 2.0923, "step": 26749 }, { "epoch": 0.72, "learning_rate": 0.0003866625092588375, "loss": 2.3411, "step": 26750 }, { "epoch": 0.72, "learning_rate": 0.0003865937662042048, "loss": 2.4683, "step": 26751 }, { "epoch": 0.72, "learning_rate": 0.00038652502779662744, "loss": 2.13, "step": 26752 }, { "epoch": 0.72, "learning_rate": 0.00038645629403662705, "loss": 2.458, "step": 26753 }, { "epoch": 0.72, "learning_rate": 0.0003863875649247245, "loss": 2.2381, "step": 26754 }, { "epoch": 0.72, "learning_rate": 0.0003863188404614396, "loss": 2.472, "step": 26755 }, { "epoch": 0.72, "learning_rate": 0.00038625012064729357, "loss": 2.5752, "step": 26756 }, { "epoch": 0.72, "learning_rate": 0.00038618140548280725, "loss": 2.5553, "step": 26757 }, { "epoch": 0.72, "learning_rate": 0.0003861126949685004, "loss": 2.5046, "step": 26758 }, { "epoch": 0.72, "learning_rate": 0.00038604398910489416, "loss": 2.3529, "step": 26759 }, { "epoch": 0.72, "learning_rate": 0.0003859752878925088, "loss": 2.8191, "step": 26760 }, { "epoch": 0.72, "learning_rate": 0.0003859065913318649, "loss": 2.5859, "step": 26761 }, { "epoch": 0.72, "learning_rate": 0.0003858378994234831, "loss": 2.305, "step": 26762 }, { "epoch": 0.72, "learning_rate": 0.0003857692121678834, "loss": 2.5096, "step": 26763 }, { "epoch": 0.72, "learning_rate": 0.0003857005295655863, "loss": 2.8495, "step": 26764 }, { "epoch": 0.72, "learning_rate": 0.0003856318516171121, "loss": 2.7096, "step": 26765 }, { "epoch": 0.72, "learning_rate": 0.0003855631783229813, "loss": 2.6533, "step": 26766 }, { "epoch": 0.72, "learning_rate": 0.00038549450968371413, "loss": 2.3138, "step": 26767 }, { "epoch": 0.72, "learning_rate": 0.00038542584569983054, "loss": 2.5462, "step": 26768 }, { "epoch": 0.72, "learning_rate": 0.0003853571863718508, "loss": 2.3337, "step": 26769 }, { "epoch": 0.72, "learning_rate": 0.0003852885317002954, "loss": 2.4737, "step": 26770 }, { "epoch": 0.72, "learning_rate": 0.0003852198816856839, "loss": 2.3682, "step": 26771 }, { "epoch": 0.72, "learning_rate": 0.0003851512363285367, "loss": 2.3267, "step": 26772 }, { "epoch": 0.72, "learning_rate": 0.00038508259562937376, "loss": 2.877, "step": 26773 }, { "epoch": 0.72, "learning_rate": 0.0003850139595887152, "loss": 2.4572, "step": 26774 }, { "epoch": 0.72, "learning_rate": 0.0003849453282070812, "loss": 2.4311, "step": 26775 }, { "epoch": 0.72, "learning_rate": 0.0003848767014849911, "loss": 2.301, "step": 26776 }, { "epoch": 0.72, "learning_rate": 0.00038480807942296516, "loss": 2.6805, "step": 26777 }, { "epoch": 0.72, "learning_rate": 0.0003847394620215232, "loss": 2.5145, "step": 26778 }, { "epoch": 0.72, "learning_rate": 0.00038467084928118513, "loss": 2.1849, "step": 26779 }, { "epoch": 0.72, "learning_rate": 0.00038460224120247065, "loss": 2.1144, "step": 26780 }, { "epoch": 0.72, "learning_rate": 0.0003845336377859, "loss": 2.1733, "step": 26781 }, { "epoch": 0.72, "learning_rate": 0.00038446503903199206, "loss": 2.4562, "step": 26782 }, { "epoch": 0.72, "learning_rate": 0.0003843964449412672, "loss": 2.3734, "step": 26783 }, { "epoch": 0.72, "learning_rate": 0.0003843278555142445, "loss": 2.6976, "step": 26784 }, { "epoch": 0.72, "learning_rate": 0.0003842592707514441, "loss": 2.9839, "step": 26785 }, { "epoch": 0.72, "learning_rate": 0.0003841906906533852, "loss": 2.6581, "step": 26786 }, { "epoch": 0.72, "learning_rate": 0.0003841221152205875, "loss": 2.6305, "step": 26787 }, { "epoch": 0.72, "learning_rate": 0.00038405354445357053, "loss": 2.5485, "step": 26788 }, { "epoch": 0.72, "learning_rate": 0.00038398497835285427, "loss": 2.422, "step": 26789 }, { "epoch": 0.72, "learning_rate": 0.0003839164169189573, "loss": 1.9796, "step": 26790 }, { "epoch": 0.72, "learning_rate": 0.0003838478601523994, "loss": 2.4448, "step": 26791 }, { "epoch": 0.72, "learning_rate": 0.00038377930805369984, "loss": 2.7775, "step": 26792 }, { "epoch": 0.72, "learning_rate": 0.0003837107606233782, "loss": 2.3572, "step": 26793 }, { "epoch": 0.72, "learning_rate": 0.00038364221786195397, "loss": 2.3884, "step": 26794 }, { "epoch": 0.72, "learning_rate": 0.00038357367976994575, "loss": 2.5007, "step": 26795 }, { "epoch": 0.72, "learning_rate": 0.00038350514634787313, "loss": 2.4336, "step": 26796 }, { "epoch": 0.72, "learning_rate": 0.0003834366175962557, "loss": 2.2349, "step": 26797 }, { "epoch": 0.72, "learning_rate": 0.00038336809351561174, "loss": 2.5935, "step": 26798 }, { "epoch": 0.72, "learning_rate": 0.00038329957410646064, "loss": 2.4851, "step": 26799 }, { "epoch": 0.72, "learning_rate": 0.00038323105936932233, "loss": 2.2704, "step": 26800 }, { "epoch": 0.72, "learning_rate": 0.00038316254930471493, "loss": 2.3323, "step": 26801 }, { "epoch": 0.72, "learning_rate": 0.00038309404391315816, "loss": 2.448, "step": 26802 }, { "epoch": 0.72, "learning_rate": 0.00038302554319517027, "loss": 2.4505, "step": 26803 }, { "epoch": 0.72, "learning_rate": 0.0003829570471512704, "loss": 2.6908, "step": 26804 }, { "epoch": 0.72, "learning_rate": 0.0003828885557819778, "loss": 2.3197, "step": 26805 }, { "epoch": 0.72, "learning_rate": 0.0003828200690878112, "loss": 2.839, "step": 26806 }, { "epoch": 0.72, "learning_rate": 0.00038275158706928925, "loss": 2.033, "step": 26807 }, { "epoch": 0.72, "learning_rate": 0.0003826831097269314, "loss": 2.5108, "step": 26808 }, { "epoch": 0.72, "learning_rate": 0.00038261463706125556, "loss": 2.1543, "step": 26809 }, { "epoch": 0.72, "learning_rate": 0.00038254616907278116, "loss": 2.4134, "step": 26810 }, { "epoch": 0.72, "learning_rate": 0.00038247770576202634, "loss": 2.2268, "step": 26811 }, { "epoch": 0.72, "learning_rate": 0.0003824092471295095, "loss": 2.4851, "step": 26812 }, { "epoch": 0.72, "learning_rate": 0.00038234079317575067, "loss": 2.3175, "step": 26813 }, { "epoch": 0.72, "learning_rate": 0.0003822723439012672, "loss": 2.4527, "step": 26814 }, { "epoch": 0.72, "learning_rate": 0.00038220389930657784, "loss": 2.4418, "step": 26815 }, { "epoch": 0.72, "learning_rate": 0.0003821354593922018, "loss": 2.4929, "step": 26816 }, { "epoch": 0.72, "learning_rate": 0.00038206702415865667, "loss": 2.4748, "step": 26817 }, { "epoch": 0.72, "learning_rate": 0.0003819985936064613, "loss": 2.1984, "step": 26818 }, { "epoch": 0.72, "learning_rate": 0.0003819301677361341, "loss": 2.6297, "step": 26819 }, { "epoch": 0.72, "learning_rate": 0.0003818617465481934, "loss": 2.3323, "step": 26820 }, { "epoch": 0.72, "learning_rate": 0.00038179333004315796, "loss": 2.6715, "step": 26821 }, { "epoch": 0.72, "learning_rate": 0.0003817249182215453, "loss": 2.4046, "step": 26822 }, { "epoch": 0.72, "learning_rate": 0.00038165651108387424, "loss": 2.2112, "step": 26823 }, { "epoch": 0.72, "learning_rate": 0.0003815881086306633, "loss": 2.3889, "step": 26824 }, { "epoch": 0.72, "learning_rate": 0.00038151971086242944, "loss": 2.7119, "step": 26825 }, { "epoch": 0.72, "learning_rate": 0.0003814513177796924, "loss": 2.6378, "step": 26826 }, { "epoch": 0.72, "learning_rate": 0.0003813829293829694, "loss": 2.6554, "step": 26827 }, { "epoch": 0.72, "learning_rate": 0.00038131454567277856, "loss": 2.4698, "step": 26828 }, { "epoch": 0.72, "learning_rate": 0.0003812461666496385, "loss": 2.5169, "step": 26829 }, { "epoch": 0.72, "learning_rate": 0.0003811777923140665, "loss": 2.1028, "step": 26830 }, { "epoch": 0.72, "learning_rate": 0.000381109422666581, "loss": 2.6293, "step": 26831 }, { "epoch": 0.72, "learning_rate": 0.0003810410577076997, "loss": 2.5612, "step": 26832 }, { "epoch": 0.72, "learning_rate": 0.0003809726974379408, "loss": 2.4698, "step": 26833 }, { "epoch": 0.72, "learning_rate": 0.0003809043418578221, "loss": 2.4784, "step": 26834 }, { "epoch": 0.72, "learning_rate": 0.0003808359909678617, "loss": 2.4542, "step": 26835 }, { "epoch": 0.72, "learning_rate": 0.00038076764476857686, "loss": 2.434, "step": 26836 }, { "epoch": 0.72, "learning_rate": 0.00038069930326048597, "loss": 3.086, "step": 26837 }, { "epoch": 0.72, "learning_rate": 0.00038063096644410564, "loss": 2.2823, "step": 26838 }, { "epoch": 0.72, "learning_rate": 0.0003805626343199549, "loss": 2.3071, "step": 26839 }, { "epoch": 0.72, "learning_rate": 0.000380494306888551, "loss": 2.7138, "step": 26840 }, { "epoch": 0.72, "learning_rate": 0.0003804259841504113, "loss": 2.3845, "step": 26841 }, { "epoch": 0.72, "learning_rate": 0.0003803576661060536, "loss": 2.9341, "step": 26842 }, { "epoch": 0.72, "learning_rate": 0.00038028935275599566, "loss": 2.9958, "step": 26843 }, { "epoch": 0.72, "learning_rate": 0.00038022104410075455, "loss": 2.825, "step": 26844 }, { "epoch": 0.72, "learning_rate": 0.000380152740140848, "loss": 2.404, "step": 26845 }, { "epoch": 0.72, "learning_rate": 0.0003800844408767934, "loss": 2.1873, "step": 26846 }, { "epoch": 0.72, "learning_rate": 0.0003800161463091083, "loss": 2.6047, "step": 26847 }, { "epoch": 0.72, "learning_rate": 0.0003799478564383103, "loss": 2.4766, "step": 26848 }, { "epoch": 0.72, "learning_rate": 0.00037987957126491624, "loss": 2.5821, "step": 26849 }, { "epoch": 0.72, "learning_rate": 0.00037981129078944366, "loss": 2.6938, "step": 26850 }, { "epoch": 0.72, "learning_rate": 0.0003797430150124098, "loss": 2.6152, "step": 26851 }, { "epoch": 0.72, "learning_rate": 0.000379674743934332, "loss": 2.9089, "step": 26852 }, { "epoch": 0.72, "learning_rate": 0.00037960647755572787, "loss": 2.7185, "step": 26853 }, { "epoch": 0.72, "learning_rate": 0.00037953821587711367, "loss": 2.7717, "step": 26854 }, { "epoch": 0.72, "learning_rate": 0.000379469958899007, "loss": 2.6494, "step": 26855 }, { "epoch": 0.72, "learning_rate": 0.00037940170662192544, "loss": 2.4331, "step": 26856 }, { "epoch": 0.72, "learning_rate": 0.00037933345904638525, "loss": 2.6933, "step": 26857 }, { "epoch": 0.72, "learning_rate": 0.0003792652161729034, "loss": 2.3925, "step": 26858 }, { "epoch": 0.72, "learning_rate": 0.00037919697800199806, "loss": 2.1763, "step": 26859 }, { "epoch": 0.72, "learning_rate": 0.000379128744534185, "loss": 2.6279, "step": 26860 }, { "epoch": 0.72, "learning_rate": 0.0003790605157699819, "loss": 2.2482, "step": 26861 }, { "epoch": 0.72, "learning_rate": 0.0003789922917099051, "loss": 2.7998, "step": 26862 }, { "epoch": 0.72, "learning_rate": 0.0003789240723544716, "loss": 2.6769, "step": 26863 }, { "epoch": 0.72, "learning_rate": 0.0003788558577041983, "loss": 2.1058, "step": 26864 }, { "epoch": 0.72, "learning_rate": 0.00037878764775960193, "loss": 2.4388, "step": 26865 }, { "epoch": 0.72, "learning_rate": 0.0003787194425211993, "loss": 2.4708, "step": 26866 }, { "epoch": 0.72, "learning_rate": 0.0003786512419895074, "loss": 2.4123, "step": 26867 }, { "epoch": 0.72, "learning_rate": 0.0003785830461650424, "loss": 2.6697, "step": 26868 }, { "epoch": 0.72, "learning_rate": 0.0003785148550483209, "loss": 2.7569, "step": 26869 }, { "epoch": 0.72, "learning_rate": 0.00037844666863986033, "loss": 2.4615, "step": 26870 }, { "epoch": 0.72, "learning_rate": 0.00037837848694017586, "loss": 2.4825, "step": 26871 }, { "epoch": 0.72, "learning_rate": 0.00037831030994978554, "loss": 2.7723, "step": 26872 }, { "epoch": 0.72, "learning_rate": 0.0003782421376692049, "loss": 2.6114, "step": 26873 }, { "epoch": 0.72, "learning_rate": 0.0003781739700989506, "loss": 2.2934, "step": 26874 }, { "epoch": 0.72, "learning_rate": 0.0003781058072395395, "loss": 2.4863, "step": 26875 }, { "epoch": 0.72, "learning_rate": 0.0003780376490914873, "loss": 2.7066, "step": 26876 }, { "epoch": 0.72, "learning_rate": 0.0003779694956553106, "loss": 2.2882, "step": 26877 }, { "epoch": 0.72, "learning_rate": 0.00037790134693152576, "loss": 2.0557, "step": 26878 }, { "epoch": 0.72, "learning_rate": 0.00037783320292064925, "loss": 2.2447, "step": 26879 }, { "epoch": 0.72, "learning_rate": 0.0003777650636231974, "loss": 2.1004, "step": 26880 }, { "epoch": 0.72, "learning_rate": 0.0003776969290396859, "loss": 2.8742, "step": 26881 }, { "epoch": 0.72, "learning_rate": 0.00037762879917063106, "loss": 1.8952, "step": 26882 }, { "epoch": 0.72, "learning_rate": 0.0003775606740165497, "loss": 2.2856, "step": 26883 }, { "epoch": 0.72, "learning_rate": 0.00037749255357795653, "loss": 2.0111, "step": 26884 }, { "epoch": 0.72, "learning_rate": 0.00037742443785536894, "loss": 2.4867, "step": 26885 }, { "epoch": 0.72, "learning_rate": 0.00037735632684930286, "loss": 2.4936, "step": 26886 }, { "epoch": 0.72, "learning_rate": 0.0003772882205602736, "loss": 2.5442, "step": 26887 }, { "epoch": 0.72, "learning_rate": 0.0003772201189887977, "loss": 2.5311, "step": 26888 }, { "epoch": 0.72, "learning_rate": 0.0003771520221353905, "loss": 2.8681, "step": 26889 }, { "epoch": 0.72, "learning_rate": 0.00037708393000056826, "loss": 2.6809, "step": 26890 }, { "epoch": 0.72, "learning_rate": 0.0003770158425848468, "loss": 2.6435, "step": 26891 }, { "epoch": 0.72, "learning_rate": 0.00037694775988874197, "loss": 2.1559, "step": 26892 }, { "epoch": 0.72, "learning_rate": 0.00037687968191276946, "loss": 2.5702, "step": 26893 }, { "epoch": 0.72, "learning_rate": 0.00037681160865744547, "loss": 2.5556, "step": 26894 }, { "epoch": 0.72, "learning_rate": 0.00037674354012328493, "loss": 2.2788, "step": 26895 }, { "epoch": 0.72, "learning_rate": 0.00037667547631080426, "loss": 2.5293, "step": 26896 }, { "epoch": 0.72, "learning_rate": 0.00037660741722051806, "loss": 2.4087, "step": 26897 }, { "epoch": 0.72, "learning_rate": 0.000376539362852943, "loss": 2.4978, "step": 26898 }, { "epoch": 0.72, "learning_rate": 0.0003764713132085945, "loss": 2.2612, "step": 26899 }, { "epoch": 0.72, "learning_rate": 0.00037640326828798756, "loss": 2.7451, "step": 26900 }, { "epoch": 0.72, "learning_rate": 0.000376335228091638, "loss": 2.4954, "step": 26901 }, { "epoch": 0.72, "learning_rate": 0.0003762671926200616, "loss": 2.5939, "step": 26902 }, { "epoch": 0.72, "learning_rate": 0.00037619916187377303, "loss": 2.195, "step": 26903 }, { "epoch": 0.72, "learning_rate": 0.0003761311358532882, "loss": 2.7144, "step": 26904 }, { "epoch": 0.72, "learning_rate": 0.0003760631145591222, "loss": 2.3367, "step": 26905 }, { "epoch": 0.72, "learning_rate": 0.0003759950979917905, "loss": 2.6761, "step": 26906 }, { "epoch": 0.72, "learning_rate": 0.0003759270861518089, "loss": 2.5807, "step": 26907 }, { "epoch": 0.72, "learning_rate": 0.00037585907903969166, "loss": 2.6787, "step": 26908 }, { "epoch": 0.72, "learning_rate": 0.0003757910766559545, "loss": 2.466, "step": 26909 }, { "epoch": 0.72, "learning_rate": 0.00037572307900111246, "loss": 2.5323, "step": 26910 }, { "epoch": 0.72, "learning_rate": 0.0003756550860756808, "loss": 2.465, "step": 26911 }, { "epoch": 0.72, "learning_rate": 0.00037558709788017454, "loss": 2.573, "step": 26912 }, { "epoch": 0.72, "learning_rate": 0.0003755191144151092, "loss": 3.0077, "step": 26913 }, { "epoch": 0.72, "learning_rate": 0.0003754511356809991, "loss": 2.5, "step": 26914 }, { "epoch": 0.72, "learning_rate": 0.00037538316167835985, "loss": 2.5757, "step": 26915 }, { "epoch": 0.72, "learning_rate": 0.00037531519240770574, "loss": 2.3468, "step": 26916 }, { "epoch": 0.72, "learning_rate": 0.000375247227869552, "loss": 2.6388, "step": 26917 }, { "epoch": 0.72, "learning_rate": 0.0003751792680644136, "loss": 2.305, "step": 26918 }, { "epoch": 0.72, "learning_rate": 0.0003751113129928053, "loss": 2.6937, "step": 26919 }, { "epoch": 0.72, "learning_rate": 0.0003750433626552421, "loss": 2.471, "step": 26920 }, { "epoch": 0.72, "learning_rate": 0.00037497541705223893, "loss": 2.8025, "step": 26921 }, { "epoch": 0.72, "learning_rate": 0.00037490747618430987, "loss": 2.3619, "step": 26922 }, { "epoch": 0.72, "learning_rate": 0.00037483954005197007, "loss": 2.3048, "step": 26923 }, { "epoch": 0.72, "learning_rate": 0.00037477160865573414, "loss": 2.9935, "step": 26924 }, { "epoch": 0.72, "learning_rate": 0.0003747036819961167, "loss": 2.6257, "step": 26925 }, { "epoch": 0.72, "learning_rate": 0.0003746357600736328, "loss": 2.5661, "step": 26926 }, { "epoch": 0.72, "learning_rate": 0.0003745678428887961, "loss": 2.1029, "step": 26927 }, { "epoch": 0.72, "learning_rate": 0.0003744999304421217, "loss": 2.1752, "step": 26928 }, { "epoch": 0.72, "learning_rate": 0.0003744320227341244, "loss": 2.1922, "step": 26929 }, { "epoch": 0.72, "learning_rate": 0.0003743641197653177, "loss": 2.3047, "step": 26930 }, { "epoch": 0.72, "learning_rate": 0.00037429622153621676, "loss": 2.5089, "step": 26931 }, { "epoch": 0.72, "learning_rate": 0.00037422832804733576, "loss": 2.2941, "step": 26932 }, { "epoch": 0.72, "learning_rate": 0.000374160439299189, "loss": 2.4117, "step": 26933 }, { "epoch": 0.72, "learning_rate": 0.00037409255529229123, "loss": 2.3719, "step": 26934 }, { "epoch": 0.72, "learning_rate": 0.00037402467602715595, "loss": 2.7973, "step": 26935 }, { "epoch": 0.72, "learning_rate": 0.0003739568015042979, "loss": 2.6088, "step": 26936 }, { "epoch": 0.72, "learning_rate": 0.0003738889317242312, "loss": 2.511, "step": 26937 }, { "epoch": 0.72, "learning_rate": 0.00037382106668747, "loss": 2.8317, "step": 26938 }, { "epoch": 0.72, "learning_rate": 0.0003737532063945288, "loss": 2.4372, "step": 26939 }, { "epoch": 0.72, "learning_rate": 0.000373685350845921, "loss": 2.7274, "step": 26940 }, { "epoch": 0.72, "learning_rate": 0.000373617500042161, "loss": 2.2468, "step": 26941 }, { "epoch": 0.72, "learning_rate": 0.0003735496539837632, "loss": 2.2779, "step": 26942 }, { "epoch": 0.72, "learning_rate": 0.0003734818126712408, "loss": 2.2002, "step": 26943 }, { "epoch": 0.72, "learning_rate": 0.00037341397610510783, "loss": 2.1378, "step": 26944 }, { "epoch": 0.72, "learning_rate": 0.00037334614428587935, "loss": 2.5001, "step": 26945 }, { "epoch": 0.72, "learning_rate": 0.000373278317214068, "loss": 2.5126, "step": 26946 }, { "epoch": 0.72, "learning_rate": 0.0003732104948901882, "loss": 2.8943, "step": 26947 }, { "epoch": 0.72, "learning_rate": 0.00037314267731475384, "loss": 2.4606, "step": 26948 }, { "epoch": 0.72, "learning_rate": 0.0003730748644882782, "loss": 2.4398, "step": 26949 }, { "epoch": 0.72, "learning_rate": 0.0003730070564112753, "loss": 2.6319, "step": 26950 }, { "epoch": 0.72, "learning_rate": 0.0003729392530842588, "loss": 2.4036, "step": 26951 }, { "epoch": 0.72, "learning_rate": 0.0003728714545077425, "loss": 2.7968, "step": 26952 }, { "epoch": 0.72, "learning_rate": 0.00037280366068224025, "loss": 2.0684, "step": 26953 }, { "epoch": 0.72, "learning_rate": 0.00037273587160826496, "loss": 2.566, "step": 26954 }, { "epoch": 0.72, "learning_rate": 0.0003726680872863306, "loss": 2.5525, "step": 26955 }, { "epoch": 0.72, "learning_rate": 0.000372600307716951, "loss": 2.5175, "step": 26956 }, { "epoch": 0.72, "learning_rate": 0.0003725325329006386, "loss": 2.8185, "step": 26957 }, { "epoch": 0.72, "learning_rate": 0.0003724647628379082, "loss": 2.6097, "step": 26958 }, { "epoch": 0.72, "learning_rate": 0.00037239699752927223, "loss": 2.4238, "step": 26959 }, { "epoch": 0.72, "learning_rate": 0.00037232923697524446, "loss": 2.5946, "step": 26960 }, { "epoch": 0.72, "learning_rate": 0.0003722614811763384, "loss": 2.8565, "step": 26961 }, { "epoch": 0.72, "learning_rate": 0.0003721937301330669, "loss": 2.0108, "step": 26962 }, { "epoch": 0.72, "learning_rate": 0.0003721259838459434, "loss": 2.9069, "step": 26963 }, { "epoch": 0.72, "learning_rate": 0.00037205824231548125, "loss": 2.1673, "step": 26964 }, { "epoch": 0.72, "learning_rate": 0.0003719905055421936, "loss": 2.34, "step": 26965 }, { "epoch": 0.72, "learning_rate": 0.00037192277352659386, "loss": 2.5301, "step": 26966 }, { "epoch": 0.72, "learning_rate": 0.0003718550462691946, "loss": 2.509, "step": 26967 }, { "epoch": 0.72, "learning_rate": 0.00037178732377050915, "loss": 2.1234, "step": 26968 }, { "epoch": 0.72, "learning_rate": 0.00037171960603105104, "loss": 2.0281, "step": 26969 }, { "epoch": 0.72, "learning_rate": 0.0003716518930513322, "loss": 2.5287, "step": 26970 }, { "epoch": 0.72, "learning_rate": 0.0003715841848318665, "loss": 2.4303, "step": 26971 }, { "epoch": 0.72, "learning_rate": 0.0003715164813731672, "loss": 2.4695, "step": 26972 }, { "epoch": 0.72, "learning_rate": 0.00037144878267574623, "loss": 2.3871, "step": 26973 }, { "epoch": 0.72, "learning_rate": 0.0003713810887401172, "loss": 2.7152, "step": 26974 }, { "epoch": 0.72, "learning_rate": 0.0003713133995667923, "loss": 3.2097, "step": 26975 }, { "epoch": 0.72, "learning_rate": 0.0003712457151562848, "loss": 2.5798, "step": 26976 }, { "epoch": 0.72, "learning_rate": 0.0003711780355091073, "loss": 2.812, "step": 26977 }, { "epoch": 0.73, "learning_rate": 0.00037111036062577253, "loss": 2.4883, "step": 26978 }, { "epoch": 0.73, "learning_rate": 0.00037104269050679327, "loss": 2.0781, "step": 26979 }, { "epoch": 0.73, "learning_rate": 0.00037097502515268257, "loss": 2.6016, "step": 26980 }, { "epoch": 0.73, "learning_rate": 0.0003709073645639521, "loss": 2.3631, "step": 26981 }, { "epoch": 0.73, "learning_rate": 0.00037083970874111514, "loss": 2.8529, "step": 26982 }, { "epoch": 0.73, "learning_rate": 0.000370772057684684, "loss": 2.3488, "step": 26983 }, { "epoch": 0.73, "learning_rate": 0.0003707044113951712, "loss": 2.4326, "step": 26984 }, { "epoch": 0.73, "learning_rate": 0.0003706367698730897, "loss": 2.4196, "step": 26985 }, { "epoch": 0.73, "learning_rate": 0.00037056913311895115, "loss": 2.6692, "step": 26986 }, { "epoch": 0.73, "learning_rate": 0.0003705015011332683, "loss": 2.3659, "step": 26987 }, { "epoch": 0.73, "learning_rate": 0.0003704338739165538, "loss": 2.1387, "step": 26988 }, { "epoch": 0.73, "learning_rate": 0.00037036625146931945, "loss": 2.3644, "step": 26989 }, { "epoch": 0.73, "learning_rate": 0.0003702986337920778, "loss": 2.2121, "step": 26990 }, { "epoch": 0.73, "learning_rate": 0.0003702310208853411, "loss": 2.6521, "step": 26991 }, { "epoch": 0.73, "learning_rate": 0.0003701634127496216, "loss": 2.2745, "step": 26992 }, { "epoch": 0.73, "learning_rate": 0.00037009580938543186, "loss": 2.5953, "step": 26993 }, { "epoch": 0.73, "learning_rate": 0.00037002821079328333, "loss": 2.3716, "step": 26994 }, { "epoch": 0.73, "learning_rate": 0.0003699606169736884, "loss": 2.0621, "step": 26995 }, { "epoch": 0.73, "learning_rate": 0.00036989302792715917, "loss": 2.2776, "step": 26996 }, { "epoch": 0.73, "learning_rate": 0.0003698254436542078, "loss": 2.7656, "step": 26997 }, { "epoch": 0.73, "learning_rate": 0.0003697578641553461, "loss": 2.3649, "step": 26998 }, { "epoch": 0.73, "learning_rate": 0.0003696902894310865, "loss": 2.1588, "step": 26999 }, { "epoch": 0.73, "learning_rate": 0.0003696227194819403, "loss": 2.0464, "step": 27000 }, { "epoch": 0.73, "learning_rate": 0.00036955515430842, "loss": 2.3476, "step": 27001 }, { "epoch": 0.73, "learning_rate": 0.00036948759391103683, "loss": 2.9387, "step": 27002 }, { "epoch": 0.73, "learning_rate": 0.0003694200382903028, "loss": 2.3655, "step": 27003 }, { "epoch": 0.73, "learning_rate": 0.0003693524874467299, "loss": 2.3955, "step": 27004 }, { "epoch": 0.73, "learning_rate": 0.0003692849413808298, "loss": 2.7244, "step": 27005 }, { "epoch": 0.73, "learning_rate": 0.0003692174000931142, "loss": 2.2746, "step": 27006 }, { "epoch": 0.73, "learning_rate": 0.00036914986358409517, "loss": 2.6134, "step": 27007 }, { "epoch": 0.73, "learning_rate": 0.00036908233185428365, "loss": 2.4066, "step": 27008 }, { "epoch": 0.73, "learning_rate": 0.0003690148049041916, "loss": 2.3801, "step": 27009 }, { "epoch": 0.73, "learning_rate": 0.0003689472827343305, "loss": 2.5595, "step": 27010 }, { "epoch": 0.73, "learning_rate": 0.0003688797653452121, "loss": 2.2361, "step": 27011 }, { "epoch": 0.73, "learning_rate": 0.0003688122527373481, "loss": 2.5875, "step": 27012 }, { "epoch": 0.73, "learning_rate": 0.0003687447449112492, "loss": 2.1145, "step": 27013 }, { "epoch": 0.73, "learning_rate": 0.0003686772418674272, "loss": 2.1535, "step": 27014 }, { "epoch": 0.73, "learning_rate": 0.000368609743606394, "loss": 2.5731, "step": 27015 }, { "epoch": 0.73, "learning_rate": 0.00036854225012866005, "loss": 2.3889, "step": 27016 }, { "epoch": 0.73, "learning_rate": 0.0003684747614347369, "loss": 2.434, "step": 27017 }, { "epoch": 0.73, "learning_rate": 0.00036840727752513667, "loss": 2.3524, "step": 27018 }, { "epoch": 0.73, "learning_rate": 0.00036833979840036966, "loss": 2.4804, "step": 27019 }, { "epoch": 0.73, "learning_rate": 0.0003682723240609478, "loss": 2.6365, "step": 27020 }, { "epoch": 0.73, "learning_rate": 0.00036820485450738137, "loss": 2.558, "step": 27021 }, { "epoch": 0.73, "learning_rate": 0.0003681373897401822, "loss": 2.3313, "step": 27022 }, { "epoch": 0.73, "learning_rate": 0.00036806992975986106, "loss": 1.9721, "step": 27023 }, { "epoch": 0.73, "learning_rate": 0.00036800247456692924, "loss": 2.6268, "step": 27024 }, { "epoch": 0.73, "learning_rate": 0.0003679350241618976, "loss": 2.4462, "step": 27025 }, { "epoch": 0.73, "learning_rate": 0.0003678675785452776, "loss": 2.2998, "step": 27026 }, { "epoch": 0.73, "learning_rate": 0.00036780013771757947, "loss": 2.5117, "step": 27027 }, { "epoch": 0.73, "learning_rate": 0.0003677327016793148, "loss": 2.4621, "step": 27028 }, { "epoch": 0.73, "learning_rate": 0.0003676652704309935, "loss": 2.5103, "step": 27029 }, { "epoch": 0.73, "learning_rate": 0.00036759784397312733, "loss": 2.6387, "step": 27030 }, { "epoch": 0.73, "learning_rate": 0.00036753042230622723, "loss": 2.981, "step": 27031 }, { "epoch": 0.73, "learning_rate": 0.00036746300543080327, "loss": 2.061, "step": 27032 }, { "epoch": 0.73, "learning_rate": 0.00036739559334736637, "loss": 2.3296, "step": 27033 }, { "epoch": 0.73, "learning_rate": 0.0003673281860564278, "loss": 2.3437, "step": 27034 }, { "epoch": 0.73, "learning_rate": 0.00036726078355849744, "loss": 2.8015, "step": 27035 }, { "epoch": 0.73, "learning_rate": 0.00036719338585408624, "loss": 2.0427, "step": 27036 }, { "epoch": 0.73, "learning_rate": 0.00036712599294370474, "loss": 2.5753, "step": 27037 }, { "epoch": 0.73, "learning_rate": 0.0003670586048278637, "loss": 2.3589, "step": 27038 }, { "epoch": 0.73, "learning_rate": 0.00036699122150707375, "loss": 2.7613, "step": 27039 }, { "epoch": 0.73, "learning_rate": 0.0003669238429818449, "loss": 2.226, "step": 27040 }, { "epoch": 0.73, "learning_rate": 0.0003668564692526877, "loss": 2.2358, "step": 27041 }, { "epoch": 0.73, "learning_rate": 0.0003667891003201128, "loss": 2.4647, "step": 27042 }, { "epoch": 0.73, "learning_rate": 0.00036672173618463043, "loss": 2.5661, "step": 27043 }, { "epoch": 0.73, "learning_rate": 0.0003666543768467513, "loss": 2.6261, "step": 27044 }, { "epoch": 0.73, "learning_rate": 0.00036658702230698507, "loss": 2.2366, "step": 27045 }, { "epoch": 0.73, "learning_rate": 0.0003665196725658423, "loss": 2.2819, "step": 27046 }, { "epoch": 0.73, "learning_rate": 0.0003664523276238335, "loss": 2.6739, "step": 27047 }, { "epoch": 0.73, "learning_rate": 0.0003663849874814683, "loss": 2.8877, "step": 27048 }, { "epoch": 0.73, "learning_rate": 0.00036631765213925716, "loss": 2.6702, "step": 27049 }, { "epoch": 0.73, "learning_rate": 0.0003662503215977102, "loss": 2.4815, "step": 27050 }, { "epoch": 0.73, "learning_rate": 0.0003661829958573376, "loss": 2.6466, "step": 27051 }, { "epoch": 0.73, "learning_rate": 0.0003661156749186495, "loss": 2.813, "step": 27052 }, { "epoch": 0.73, "learning_rate": 0.00036604835878215546, "loss": 2.263, "step": 27053 }, { "epoch": 0.73, "learning_rate": 0.0003659810474483657, "loss": 2.4186, "step": 27054 }, { "epoch": 0.73, "learning_rate": 0.00036591374091779017, "loss": 2.9614, "step": 27055 }, { "epoch": 0.73, "learning_rate": 0.00036584643919093874, "loss": 2.3067, "step": 27056 }, { "epoch": 0.73, "learning_rate": 0.0003657791422683213, "loss": 2.2986, "step": 27057 }, { "epoch": 0.73, "learning_rate": 0.00036571185015044815, "loss": 2.4124, "step": 27058 }, { "epoch": 0.73, "learning_rate": 0.0003656445628378282, "loss": 2.2724, "step": 27059 }, { "epoch": 0.73, "learning_rate": 0.0003655772803309716, "loss": 2.4736, "step": 27060 }, { "epoch": 0.73, "learning_rate": 0.00036551000263038846, "loss": 2.6321, "step": 27061 }, { "epoch": 0.73, "learning_rate": 0.0003654427297365878, "loss": 2.561, "step": 27062 }, { "epoch": 0.73, "learning_rate": 0.0003653754616500795, "loss": 2.279, "step": 27063 }, { "epoch": 0.73, "learning_rate": 0.0003653081983713733, "loss": 2.5095, "step": 27064 }, { "epoch": 0.73, "learning_rate": 0.00036524093990097874, "loss": 2.6799, "step": 27065 }, { "epoch": 0.73, "learning_rate": 0.00036517368623940563, "loss": 2.7343, "step": 27066 }, { "epoch": 0.73, "learning_rate": 0.00036510643738716286, "loss": 2.3388, "step": 27067 }, { "epoch": 0.73, "learning_rate": 0.00036503919334476023, "loss": 2.7427, "step": 27068 }, { "epoch": 0.73, "learning_rate": 0.0003649719541127071, "loss": 2.7745, "step": 27069 }, { "epoch": 0.73, "learning_rate": 0.00036490471969151297, "loss": 2.4083, "step": 27070 }, { "epoch": 0.73, "learning_rate": 0.00036483749008168743, "loss": 2.607, "step": 27071 }, { "epoch": 0.73, "learning_rate": 0.00036477026528373914, "loss": 2.1859, "step": 27072 }, { "epoch": 0.73, "learning_rate": 0.0003647030452981778, "loss": 2.4756, "step": 27073 }, { "epoch": 0.73, "learning_rate": 0.00036463583012551296, "loss": 2.2835, "step": 27074 }, { "epoch": 0.73, "learning_rate": 0.0003645686197662531, "loss": 2.5967, "step": 27075 }, { "epoch": 0.73, "learning_rate": 0.00036450141422090745, "loss": 3.3968, "step": 27076 }, { "epoch": 0.73, "learning_rate": 0.0003644342134899862, "loss": 2.1208, "step": 27077 }, { "epoch": 0.73, "learning_rate": 0.00036436701757399726, "loss": 2.4652, "step": 27078 }, { "epoch": 0.73, "learning_rate": 0.0003642998264734506, "loss": 2.3921, "step": 27079 }, { "epoch": 0.73, "learning_rate": 0.0003642326401888544, "loss": 2.4062, "step": 27080 }, { "epoch": 0.73, "learning_rate": 0.00036416545872071816, "loss": 2.3178, "step": 27081 }, { "epoch": 0.73, "learning_rate": 0.00036409828206955064, "loss": 2.2885, "step": 27082 }, { "epoch": 0.73, "learning_rate": 0.00036403111023586076, "loss": 2.3359, "step": 27083 }, { "epoch": 0.73, "learning_rate": 0.0003639639432201577, "loss": 2.5987, "step": 27084 }, { "epoch": 0.73, "learning_rate": 0.0003638967810229502, "loss": 2.3502, "step": 27085 }, { "epoch": 0.73, "learning_rate": 0.0003638296236447468, "loss": 2.9305, "step": 27086 }, { "epoch": 0.73, "learning_rate": 0.0003637624710860568, "loss": 2.2294, "step": 27087 }, { "epoch": 0.73, "learning_rate": 0.00036369532334738807, "loss": 2.7781, "step": 27088 }, { "epoch": 0.73, "learning_rate": 0.0003636281804292495, "loss": 2.3665, "step": 27089 }, { "epoch": 0.73, "learning_rate": 0.0003635610423321508, "loss": 2.3607, "step": 27090 }, { "epoch": 0.73, "learning_rate": 0.0003634939090565995, "loss": 2.306, "step": 27091 }, { "epoch": 0.73, "learning_rate": 0.00036342678060310464, "loss": 2.3787, "step": 27092 }, { "epoch": 0.73, "learning_rate": 0.0003633596569721749, "loss": 2.2791, "step": 27093 }, { "epoch": 0.73, "learning_rate": 0.00036329253816431826, "loss": 2.5403, "step": 27094 }, { "epoch": 0.73, "learning_rate": 0.0003632254241800436, "loss": 2.3947, "step": 27095 }, { "epoch": 0.73, "learning_rate": 0.0003631583150198592, "loss": 2.3277, "step": 27096 }, { "epoch": 0.73, "learning_rate": 0.00036309121068427353, "loss": 2.5792, "step": 27097 }, { "epoch": 0.73, "learning_rate": 0.0003630241111737953, "loss": 2.5772, "step": 27098 }, { "epoch": 0.73, "learning_rate": 0.0003629570164889323, "loss": 2.6186, "step": 27099 }, { "epoch": 0.73, "learning_rate": 0.00036288992663019296, "loss": 2.7097, "step": 27100 }, { "epoch": 0.73, "learning_rate": 0.000362822841598086, "loss": 2.6395, "step": 27101 }, { "epoch": 0.73, "learning_rate": 0.0003627557613931186, "loss": 2.2438, "step": 27102 }, { "epoch": 0.73, "learning_rate": 0.00036268868601579995, "loss": 2.4207, "step": 27103 }, { "epoch": 0.73, "learning_rate": 0.0003626216154666382, "loss": 2.1102, "step": 27104 }, { "epoch": 0.73, "learning_rate": 0.0003625545497461409, "loss": 2.4733, "step": 27105 }, { "epoch": 0.73, "learning_rate": 0.00036248748885481653, "loss": 2.484, "step": 27106 }, { "epoch": 0.73, "learning_rate": 0.00036242043279317274, "loss": 2.7716, "step": 27107 }, { "epoch": 0.73, "learning_rate": 0.0003623533815617177, "loss": 2.4314, "step": 27108 }, { "epoch": 0.73, "learning_rate": 0.00036228633516095955, "loss": 2.1943, "step": 27109 }, { "epoch": 0.73, "learning_rate": 0.00036221929359140607, "loss": 2.9104, "step": 27110 }, { "epoch": 0.73, "learning_rate": 0.00036215225685356513, "loss": 2.6011, "step": 27111 }, { "epoch": 0.73, "learning_rate": 0.00036208522494794504, "loss": 2.536, "step": 27112 }, { "epoch": 0.73, "learning_rate": 0.00036201819787505296, "loss": 2.1582, "step": 27113 }, { "epoch": 0.73, "learning_rate": 0.00036195117563539724, "loss": 2.4934, "step": 27114 }, { "epoch": 0.73, "learning_rate": 0.0003618841582294846, "loss": 2.3598, "step": 27115 }, { "epoch": 0.73, "learning_rate": 0.00036181714565782386, "loss": 2.7227, "step": 27116 }, { "epoch": 0.73, "learning_rate": 0.0003617501379209227, "loss": 2.2829, "step": 27117 }, { "epoch": 0.73, "learning_rate": 0.0003616831350192881, "loss": 2.3468, "step": 27118 }, { "epoch": 0.73, "learning_rate": 0.00036161613695342786, "loss": 2.7261, "step": 27119 }, { "epoch": 0.73, "learning_rate": 0.00036154914372385006, "loss": 2.5027, "step": 27120 }, { "epoch": 0.73, "learning_rate": 0.0003614821553310613, "loss": 2.4693, "step": 27121 }, { "epoch": 0.73, "learning_rate": 0.0003614151717755697, "loss": 2.1699, "step": 27122 }, { "epoch": 0.73, "learning_rate": 0.00036134819305788256, "loss": 2.5321, "step": 27123 }, { "epoch": 0.73, "learning_rate": 0.0003612812191785074, "loss": 2.3807, "step": 27124 }, { "epoch": 0.73, "learning_rate": 0.00036121425013795186, "loss": 2.6644, "step": 27125 }, { "epoch": 0.73, "learning_rate": 0.0003611472859367225, "loss": 2.2334, "step": 27126 }, { "epoch": 0.73, "learning_rate": 0.00036108032657532717, "loss": 2.227, "step": 27127 }, { "epoch": 0.73, "learning_rate": 0.000361013372054273, "loss": 2.3817, "step": 27128 }, { "epoch": 0.73, "learning_rate": 0.00036094642237406737, "loss": 2.5631, "step": 27129 }, { "epoch": 0.73, "learning_rate": 0.0003608794775352173, "loss": 2.4269, "step": 27130 }, { "epoch": 0.73, "learning_rate": 0.0003608125375382305, "loss": 2.265, "step": 27131 }, { "epoch": 0.73, "learning_rate": 0.0003607456023836132, "loss": 2.3987, "step": 27132 }, { "epoch": 0.73, "learning_rate": 0.0003606786720718733, "loss": 2.6019, "step": 27133 }, { "epoch": 0.73, "learning_rate": 0.0003606117466035171, "loss": 2.5022, "step": 27134 }, { "epoch": 0.73, "learning_rate": 0.00036054482597905205, "loss": 2.4272, "step": 27135 }, { "epoch": 0.73, "learning_rate": 0.00036047791019898514, "loss": 2.4348, "step": 27136 }, { "epoch": 0.73, "learning_rate": 0.00036041099926382314, "loss": 2.6453, "step": 27137 }, { "epoch": 0.73, "learning_rate": 0.000360344093174073, "loss": 2.7597, "step": 27138 }, { "epoch": 0.73, "learning_rate": 0.0003602771919302421, "loss": 2.1296, "step": 27139 }, { "epoch": 0.73, "learning_rate": 0.00036021029553283645, "loss": 2.7255, "step": 27140 }, { "epoch": 0.73, "learning_rate": 0.00036014340398236324, "loss": 2.7976, "step": 27141 }, { "epoch": 0.73, "learning_rate": 0.0003600765172793292, "loss": 2.3933, "step": 27142 }, { "epoch": 0.73, "learning_rate": 0.00036000963542424106, "loss": 2.4714, "step": 27143 }, { "epoch": 0.73, "learning_rate": 0.0003599427584176058, "loss": 2.128, "step": 27144 }, { "epoch": 0.73, "learning_rate": 0.0003598758862599295, "loss": 2.6094, "step": 27145 }, { "epoch": 0.73, "learning_rate": 0.00035980901895171904, "loss": 2.4447, "step": 27146 }, { "epoch": 0.73, "learning_rate": 0.0003597421564934813, "loss": 2.4834, "step": 27147 }, { "epoch": 0.73, "learning_rate": 0.00035967529888572216, "loss": 2.2008, "step": 27148 }, { "epoch": 0.73, "learning_rate": 0.0003596084461289485, "loss": 2.1319, "step": 27149 }, { "epoch": 0.73, "learning_rate": 0.00035954159822366674, "loss": 2.3719, "step": 27150 }, { "epoch": 0.73, "learning_rate": 0.0003594747551703834, "loss": 2.4966, "step": 27151 }, { "epoch": 0.73, "learning_rate": 0.0003594079169696051, "loss": 2.3468, "step": 27152 }, { "epoch": 0.73, "learning_rate": 0.0003593410836218375, "loss": 2.7204, "step": 27153 }, { "epoch": 0.73, "learning_rate": 0.0003592742551275874, "loss": 2.6618, "step": 27154 }, { "epoch": 0.73, "learning_rate": 0.00035920743148736093, "loss": 2.5126, "step": 27155 }, { "epoch": 0.73, "learning_rate": 0.00035914061270166434, "loss": 2.6585, "step": 27156 }, { "epoch": 0.73, "learning_rate": 0.0003590737987710043, "loss": 2.5181, "step": 27157 }, { "epoch": 0.73, "learning_rate": 0.0003590069896958863, "loss": 2.28, "step": 27158 }, { "epoch": 0.73, "learning_rate": 0.0003589401854768166, "loss": 2.5991, "step": 27159 }, { "epoch": 0.73, "learning_rate": 0.0003588733861143019, "loss": 2.2476, "step": 27160 }, { "epoch": 0.73, "learning_rate": 0.00035880659160884745, "loss": 2.3941, "step": 27161 }, { "epoch": 0.73, "learning_rate": 0.00035873980196095924, "loss": 2.4553, "step": 27162 }, { "epoch": 0.73, "learning_rate": 0.00035867301717114433, "loss": 2.6351, "step": 27163 }, { "epoch": 0.73, "learning_rate": 0.0003586062372399077, "loss": 2.5319, "step": 27164 }, { "epoch": 0.73, "learning_rate": 0.00035853946216775546, "loss": 2.063, "step": 27165 }, { "epoch": 0.73, "learning_rate": 0.0003584726919551941, "loss": 2.5392, "step": 27166 }, { "epoch": 0.73, "learning_rate": 0.0003584059266027284, "loss": 2.6879, "step": 27167 }, { "epoch": 0.73, "learning_rate": 0.0003583391661108647, "loss": 2.7022, "step": 27168 }, { "epoch": 0.73, "learning_rate": 0.0003582724104801088, "loss": 2.9197, "step": 27169 }, { "epoch": 0.73, "learning_rate": 0.0003582056597109664, "loss": 2.2147, "step": 27170 }, { "epoch": 0.73, "learning_rate": 0.00035813891380394357, "loss": 2.3063, "step": 27171 }, { "epoch": 0.73, "learning_rate": 0.0003580721727595452, "loss": 2.5668, "step": 27172 }, { "epoch": 0.73, "learning_rate": 0.0003580054365782772, "loss": 2.4598, "step": 27173 }, { "epoch": 0.73, "learning_rate": 0.00035793870526064565, "loss": 2.4982, "step": 27174 }, { "epoch": 0.73, "learning_rate": 0.00035787197880715496, "loss": 2.3832, "step": 27175 }, { "epoch": 0.73, "learning_rate": 0.00035780525721831213, "loss": 2.4215, "step": 27176 }, { "epoch": 0.73, "learning_rate": 0.0003577385404946214, "loss": 2.6314, "step": 27177 }, { "epoch": 0.73, "learning_rate": 0.00035767182863658876, "loss": 2.4733, "step": 27178 }, { "epoch": 0.73, "learning_rate": 0.0003576051216447198, "loss": 2.5117, "step": 27179 }, { "epoch": 0.73, "learning_rate": 0.00035753841951951924, "loss": 2.3568, "step": 27180 }, { "epoch": 0.73, "learning_rate": 0.00035747172226149274, "loss": 2.173, "step": 27181 }, { "epoch": 0.73, "learning_rate": 0.00035740502987114563, "loss": 2.3539, "step": 27182 }, { "epoch": 0.73, "learning_rate": 0.0003573383423489831, "loss": 2.6677, "step": 27183 }, { "epoch": 0.73, "learning_rate": 0.00035727165969551077, "loss": 2.4266, "step": 27184 }, { "epoch": 0.73, "learning_rate": 0.00035720498191123306, "loss": 2.5955, "step": 27185 }, { "epoch": 0.73, "learning_rate": 0.0003571383089966556, "loss": 3.0863, "step": 27186 }, { "epoch": 0.73, "learning_rate": 0.00035707164095228315, "loss": 2.8302, "step": 27187 }, { "epoch": 0.73, "learning_rate": 0.00035700497777862116, "loss": 2.4352, "step": 27188 }, { "epoch": 0.73, "learning_rate": 0.0003569383194761745, "loss": 2.3114, "step": 27189 }, { "epoch": 0.73, "learning_rate": 0.00035687166604544854, "loss": 2.2109, "step": 27190 }, { "epoch": 0.73, "learning_rate": 0.0003568050174869474, "loss": 2.4203, "step": 27191 }, { "epoch": 0.73, "learning_rate": 0.0003567383738011769, "loss": 2.316, "step": 27192 }, { "epoch": 0.73, "learning_rate": 0.00035667173498864105, "loss": 2.6118, "step": 27193 }, { "epoch": 0.73, "learning_rate": 0.0003566051010498452, "loss": 2.3648, "step": 27194 }, { "epoch": 0.73, "learning_rate": 0.000356538471985294, "loss": 2.543, "step": 27195 }, { "epoch": 0.73, "learning_rate": 0.00035647184779549236, "loss": 2.8845, "step": 27196 }, { "epoch": 0.73, "learning_rate": 0.0003564052284809449, "loss": 2.5528, "step": 27197 }, { "epoch": 0.73, "learning_rate": 0.00035633861404215674, "loss": 3.3339, "step": 27198 }, { "epoch": 0.73, "learning_rate": 0.0003562720044796318, "loss": 2.8649, "step": 27199 }, { "epoch": 0.73, "learning_rate": 0.0003562053997938751, "loss": 2.4138, "step": 27200 }, { "epoch": 0.73, "learning_rate": 0.0003561387999853911, "loss": 2.2435, "step": 27201 }, { "epoch": 0.73, "learning_rate": 0.0003560722050546845, "loss": 2.624, "step": 27202 }, { "epoch": 0.73, "learning_rate": 0.00035600561500226017, "loss": 2.6953, "step": 27203 }, { "epoch": 0.73, "learning_rate": 0.0003559390298286217, "loss": 2.4764, "step": 27204 }, { "epoch": 0.73, "learning_rate": 0.0003558724495342741, "loss": 2.0729, "step": 27205 }, { "epoch": 0.73, "learning_rate": 0.00035580587411972186, "loss": 2.6115, "step": 27206 }, { "epoch": 0.73, "learning_rate": 0.00035573930358546893, "loss": 2.4814, "step": 27207 }, { "epoch": 0.73, "learning_rate": 0.0003556727379320195, "loss": 2.3718, "step": 27208 }, { "epoch": 0.73, "learning_rate": 0.00035560617715987885, "loss": 2.7149, "step": 27209 }, { "epoch": 0.73, "learning_rate": 0.00035553962126955033, "loss": 2.2764, "step": 27210 }, { "epoch": 0.73, "learning_rate": 0.00035547307026153864, "loss": 2.4665, "step": 27211 }, { "epoch": 0.73, "learning_rate": 0.00035540652413634756, "loss": 2.3209, "step": 27212 }, { "epoch": 0.73, "learning_rate": 0.0003553399828944812, "loss": 2.3234, "step": 27213 }, { "epoch": 0.73, "learning_rate": 0.00035527344653644413, "loss": 2.8206, "step": 27214 }, { "epoch": 0.73, "learning_rate": 0.00035520691506273994, "loss": 2.3897, "step": 27215 }, { "epoch": 0.73, "learning_rate": 0.00035514038847387296, "loss": 2.2513, "step": 27216 }, { "epoch": 0.73, "learning_rate": 0.00035507386677034747, "loss": 2.7114, "step": 27217 }, { "epoch": 0.73, "learning_rate": 0.0003550073499526667, "loss": 2.4071, "step": 27218 }, { "epoch": 0.73, "learning_rate": 0.00035494083802133525, "loss": 2.3191, "step": 27219 }, { "epoch": 0.73, "learning_rate": 0.0003548743309768564, "loss": 2.433, "step": 27220 }, { "epoch": 0.73, "learning_rate": 0.00035480782881973393, "loss": 2.5804, "step": 27221 }, { "epoch": 0.73, "learning_rate": 0.00035474133155047273, "loss": 2.4332, "step": 27222 }, { "epoch": 0.73, "learning_rate": 0.00035467483916957543, "loss": 2.2012, "step": 27223 }, { "epoch": 0.73, "learning_rate": 0.00035460835167754615, "loss": 2.535, "step": 27224 }, { "epoch": 0.73, "learning_rate": 0.0003545418690748889, "loss": 2.3454, "step": 27225 }, { "epoch": 0.73, "learning_rate": 0.0003544753913621068, "loss": 2.5312, "step": 27226 }, { "epoch": 0.73, "learning_rate": 0.0003544089185397038, "loss": 2.4135, "step": 27227 }, { "epoch": 0.73, "learning_rate": 0.00035434245060818337, "loss": 2.0795, "step": 27228 }, { "epoch": 0.73, "learning_rate": 0.000354275987568049, "loss": 2.4924, "step": 27229 }, { "epoch": 0.73, "learning_rate": 0.0003542095294198048, "loss": 2.4087, "step": 27230 }, { "epoch": 0.73, "learning_rate": 0.00035414307616395325, "loss": 2.8397, "step": 27231 }, { "epoch": 0.73, "learning_rate": 0.00035407662780099835, "loss": 2.6082, "step": 27232 }, { "epoch": 0.73, "learning_rate": 0.0003540101843314438, "loss": 2.2045, "step": 27233 }, { "epoch": 0.73, "learning_rate": 0.00035394374575579193, "loss": 2.5819, "step": 27234 }, { "epoch": 0.73, "learning_rate": 0.0003538773120745473, "loss": 2.7185, "step": 27235 }, { "epoch": 0.73, "learning_rate": 0.0003538108832882124, "loss": 2.3206, "step": 27236 }, { "epoch": 0.73, "learning_rate": 0.00035374445939729074, "loss": 2.6441, "step": 27237 }, { "epoch": 0.73, "learning_rate": 0.0003536780404022859, "loss": 2.8578, "step": 27238 }, { "epoch": 0.73, "learning_rate": 0.00035361162630370024, "loss": 2.7411, "step": 27239 }, { "epoch": 0.73, "learning_rate": 0.00035354521710203733, "loss": 2.3388, "step": 27240 }, { "epoch": 0.73, "learning_rate": 0.00035347881279780037, "loss": 2.2859, "step": 27241 }, { "epoch": 0.73, "learning_rate": 0.0003534124133914922, "loss": 2.3533, "step": 27242 }, { "epoch": 0.73, "learning_rate": 0.00035334601888361607, "loss": 2.6131, "step": 27243 }, { "epoch": 0.73, "learning_rate": 0.0003532796292746753, "loss": 2.5418, "step": 27244 }, { "epoch": 0.73, "learning_rate": 0.0003532132445651719, "loss": 2.4139, "step": 27245 }, { "epoch": 0.73, "learning_rate": 0.0003531468647556099, "loss": 2.629, "step": 27246 }, { "epoch": 0.73, "learning_rate": 0.00035308048984649076, "loss": 2.2885, "step": 27247 }, { "epoch": 0.73, "learning_rate": 0.00035301411983831854, "loss": 2.9085, "step": 27248 }, { "epoch": 0.73, "learning_rate": 0.000352947754731596, "loss": 2.5011, "step": 27249 }, { "epoch": 0.73, "learning_rate": 0.0003528813945268253, "loss": 2.3842, "step": 27250 }, { "epoch": 0.73, "learning_rate": 0.0003528150392245094, "loss": 2.2914, "step": 27251 }, { "epoch": 0.73, "learning_rate": 0.00035274868882515155, "loss": 2.4301, "step": 27252 }, { "epoch": 0.73, "learning_rate": 0.0003526823433292534, "loss": 2.3972, "step": 27253 }, { "epoch": 0.73, "learning_rate": 0.00035261600273731817, "loss": 2.2341, "step": 27254 }, { "epoch": 0.73, "learning_rate": 0.00035254966704984837, "loss": 2.2912, "step": 27255 }, { "epoch": 0.73, "learning_rate": 0.00035248333626734655, "loss": 2.4371, "step": 27256 }, { "epoch": 0.73, "learning_rate": 0.0003524170103903155, "loss": 2.3545, "step": 27257 }, { "epoch": 0.73, "learning_rate": 0.00035235068941925706, "loss": 2.549, "step": 27258 }, { "epoch": 0.73, "learning_rate": 0.000352284373354674, "loss": 2.8268, "step": 27259 }, { "epoch": 0.73, "learning_rate": 0.00035221806219706874, "loss": 2.1002, "step": 27260 }, { "epoch": 0.73, "learning_rate": 0.0003521517559469437, "loss": 3.1373, "step": 27261 }, { "epoch": 0.73, "learning_rate": 0.00035208545460480137, "loss": 2.3452, "step": 27262 }, { "epoch": 0.73, "learning_rate": 0.0003520191581711435, "loss": 2.5983, "step": 27263 }, { "epoch": 0.73, "learning_rate": 0.0003519528666464726, "loss": 2.4347, "step": 27264 }, { "epoch": 0.73, "learning_rate": 0.0003518865800312914, "loss": 2.3898, "step": 27265 }, { "epoch": 0.73, "learning_rate": 0.00035182029832610105, "loss": 2.2926, "step": 27266 }, { "epoch": 0.73, "learning_rate": 0.00035175402153140445, "loss": 2.3931, "step": 27267 }, { "epoch": 0.73, "learning_rate": 0.00035168774964770334, "loss": 2.0611, "step": 27268 }, { "epoch": 0.73, "learning_rate": 0.0003516214826755, "loss": 2.7444, "step": 27269 }, { "epoch": 0.73, "learning_rate": 0.0003515552206152967, "loss": 2.3345, "step": 27270 }, { "epoch": 0.73, "learning_rate": 0.0003514889634675947, "loss": 2.4519, "step": 27271 }, { "epoch": 0.73, "learning_rate": 0.0003514227112328966, "loss": 2.6098, "step": 27272 }, { "epoch": 0.73, "learning_rate": 0.00035135646391170385, "loss": 2.3406, "step": 27273 }, { "epoch": 0.73, "learning_rate": 0.0003512902215045187, "loss": 2.7732, "step": 27274 }, { "epoch": 0.73, "learning_rate": 0.0003512239840118427, "loss": 2.5651, "step": 27275 }, { "epoch": 0.73, "learning_rate": 0.0003511577514341784, "loss": 2.779, "step": 27276 }, { "epoch": 0.73, "learning_rate": 0.00035109152377202645, "loss": 2.5894, "step": 27277 }, { "epoch": 0.73, "learning_rate": 0.00035102530102588915, "loss": 2.8918, "step": 27278 }, { "epoch": 0.73, "learning_rate": 0.0003509590831962685, "loss": 2.2338, "step": 27279 }, { "epoch": 0.73, "learning_rate": 0.00035089287028366534, "loss": 2.1606, "step": 27280 }, { "epoch": 0.73, "learning_rate": 0.0003508266622885818, "loss": 2.2587, "step": 27281 }, { "epoch": 0.73, "learning_rate": 0.00035076045921151943, "loss": 2.5909, "step": 27282 }, { "epoch": 0.73, "learning_rate": 0.0003506942610529799, "loss": 2.6418, "step": 27283 }, { "epoch": 0.73, "learning_rate": 0.00035062806781346466, "loss": 2.322, "step": 27284 }, { "epoch": 0.73, "learning_rate": 0.00035056187949347484, "loss": 2.6074, "step": 27285 }, { "epoch": 0.73, "learning_rate": 0.0003504956960935122, "loss": 2.7946, "step": 27286 }, { "epoch": 0.73, "learning_rate": 0.00035042951761407793, "loss": 2.9252, "step": 27287 }, { "epoch": 0.73, "learning_rate": 0.0003503633440556735, "loss": 2.3475, "step": 27288 }, { "epoch": 0.73, "learning_rate": 0.0003502971754188006, "loss": 2.5944, "step": 27289 }, { "epoch": 0.73, "learning_rate": 0.00035023101170395974, "loss": 2.9289, "step": 27290 }, { "epoch": 0.73, "learning_rate": 0.0003501648529116527, "loss": 2.9909, "step": 27291 }, { "epoch": 0.73, "learning_rate": 0.0003500986990423808, "loss": 2.8828, "step": 27292 }, { "epoch": 0.73, "learning_rate": 0.0003500325500966447, "loss": 2.4636, "step": 27293 }, { "epoch": 0.73, "learning_rate": 0.0003499664060749453, "loss": 2.6011, "step": 27294 }, { "epoch": 0.73, "learning_rate": 0.0003499002669777851, "loss": 2.161, "step": 27295 }, { "epoch": 0.73, "learning_rate": 0.0003498341328056638, "loss": 2.2798, "step": 27296 }, { "epoch": 0.73, "learning_rate": 0.0003497680035590831, "loss": 3.1932, "step": 27297 }, { "epoch": 0.73, "learning_rate": 0.0003497018792385436, "loss": 2.6163, "step": 27298 }, { "epoch": 0.73, "learning_rate": 0.00034963575984454633, "loss": 3.1231, "step": 27299 }, { "epoch": 0.73, "learning_rate": 0.0003495696453775923, "loss": 2.6632, "step": 27300 }, { "epoch": 0.73, "learning_rate": 0.0003495035358381823, "loss": 2.4024, "step": 27301 }, { "epoch": 0.73, "learning_rate": 0.00034943743122681714, "loss": 2.7584, "step": 27302 }, { "epoch": 0.73, "learning_rate": 0.00034937133154399816, "loss": 2.9847, "step": 27303 }, { "epoch": 0.73, "learning_rate": 0.0003493052367902253, "loss": 2.3889, "step": 27304 }, { "epoch": 0.73, "learning_rate": 0.0003492391469659999, "loss": 2.3469, "step": 27305 }, { "epoch": 0.73, "learning_rate": 0.0003491730620718221, "loss": 2.908, "step": 27306 }, { "epoch": 0.73, "learning_rate": 0.0003491069821081925, "loss": 1.9305, "step": 27307 }, { "epoch": 0.73, "learning_rate": 0.00034904090707561265, "loss": 2.509, "step": 27308 }, { "epoch": 0.73, "learning_rate": 0.0003489748369745821, "loss": 2.7859, "step": 27309 }, { "epoch": 0.73, "learning_rate": 0.0003489087718056019, "loss": 2.0718, "step": 27310 }, { "epoch": 0.73, "learning_rate": 0.0003488427115691728, "loss": 2.8409, "step": 27311 }, { "epoch": 0.73, "learning_rate": 0.00034877665626579444, "loss": 2.4042, "step": 27312 }, { "epoch": 0.73, "learning_rate": 0.0003487106058959678, "loss": 2.6544, "step": 27313 }, { "epoch": 0.73, "learning_rate": 0.00034864456046019323, "loss": 2.3235, "step": 27314 }, { "epoch": 0.73, "learning_rate": 0.00034857851995897095, "loss": 2.3475, "step": 27315 }, { "epoch": 0.73, "learning_rate": 0.0003485124843928017, "loss": 2.602, "step": 27316 }, { "epoch": 0.73, "learning_rate": 0.000348446453762185, "loss": 2.6742, "step": 27317 }, { "epoch": 0.73, "learning_rate": 0.00034838042806762147, "loss": 2.686, "step": 27318 }, { "epoch": 0.73, "learning_rate": 0.0003483144073096117, "loss": 2.6311, "step": 27319 }, { "epoch": 0.73, "learning_rate": 0.0003482483914886548, "loss": 2.5674, "step": 27320 }, { "epoch": 0.73, "learning_rate": 0.00034818238060525195, "loss": 2.6922, "step": 27321 }, { "epoch": 0.73, "learning_rate": 0.0003481163746599031, "loss": 2.2393, "step": 27322 }, { "epoch": 0.73, "learning_rate": 0.0003480503736531078, "loss": 2.8292, "step": 27323 }, { "epoch": 0.73, "learning_rate": 0.0003479843775853666, "loss": 2.1572, "step": 27324 }, { "epoch": 0.73, "learning_rate": 0.00034791838645717877, "loss": 2.1121, "step": 27325 }, { "epoch": 0.73, "learning_rate": 0.00034785240026904475, "loss": 2.4913, "step": 27326 }, { "epoch": 0.73, "learning_rate": 0.00034778641902146433, "loss": 2.7316, "step": 27327 }, { "epoch": 0.73, "learning_rate": 0.0003477204427149374, "loss": 2.0566, "step": 27328 }, { "epoch": 0.73, "learning_rate": 0.00034765447134996376, "loss": 2.5672, "step": 27329 }, { "epoch": 0.73, "learning_rate": 0.0003475885049270436, "loss": 2.3455, "step": 27330 }, { "epoch": 0.73, "learning_rate": 0.000347522543446676, "loss": 2.5484, "step": 27331 }, { "epoch": 0.73, "learning_rate": 0.00034745658690936123, "loss": 2.8384, "step": 27332 }, { "epoch": 0.73, "learning_rate": 0.00034739063531559787, "loss": 2.7891, "step": 27333 }, { "epoch": 0.73, "learning_rate": 0.00034732468866588694, "loss": 2.3268, "step": 27334 }, { "epoch": 0.73, "learning_rate": 0.0003472587469607277, "loss": 2.5956, "step": 27335 }, { "epoch": 0.73, "learning_rate": 0.00034719281020061923, "loss": 2.5741, "step": 27336 }, { "epoch": 0.73, "learning_rate": 0.00034712687838606127, "loss": 2.5992, "step": 27337 }, { "epoch": 0.73, "learning_rate": 0.00034706095151755366, "loss": 2.506, "step": 27338 }, { "epoch": 0.73, "learning_rate": 0.00034699502959559524, "loss": 2.6284, "step": 27339 }, { "epoch": 0.73, "learning_rate": 0.00034692911262068583, "loss": 2.0077, "step": 27340 }, { "epoch": 0.73, "learning_rate": 0.00034686320059332465, "loss": 2.1845, "step": 27341 }, { "epoch": 0.73, "learning_rate": 0.00034679729351401104, "loss": 2.4473, "step": 27342 }, { "epoch": 0.73, "learning_rate": 0.00034673139138324474, "loss": 2.9459, "step": 27343 }, { "epoch": 0.73, "learning_rate": 0.0003466654942015242, "loss": 2.6612, "step": 27344 }, { "epoch": 0.73, "learning_rate": 0.00034659960196934916, "loss": 2.3803, "step": 27345 }, { "epoch": 0.73, "learning_rate": 0.00034653371468721864, "loss": 2.7096, "step": 27346 }, { "epoch": 0.73, "learning_rate": 0.00034646783235563194, "loss": 2.2544, "step": 27347 }, { "epoch": 0.73, "learning_rate": 0.0003464019549750884, "loss": 2.3457, "step": 27348 }, { "epoch": 0.73, "learning_rate": 0.0003463360825460865, "loss": 2.8289, "step": 27349 }, { "epoch": 0.73, "learning_rate": 0.00034627021506912557, "loss": 2.0998, "step": 27350 }, { "epoch": 0.74, "learning_rate": 0.00034620435254470493, "loss": 2.5604, "step": 27351 }, { "epoch": 0.74, "learning_rate": 0.0003461384949733228, "loss": 2.6781, "step": 27352 }, { "epoch": 0.74, "learning_rate": 0.00034607264235547844, "loss": 2.0505, "step": 27353 }, { "epoch": 0.74, "learning_rate": 0.0003460067946916713, "loss": 2.3637, "step": 27354 }, { "epoch": 0.74, "learning_rate": 0.0003459409519823995, "loss": 2.4147, "step": 27355 }, { "epoch": 0.74, "learning_rate": 0.0003458751142281621, "loss": 2.5976, "step": 27356 }, { "epoch": 0.74, "learning_rate": 0.0003458092814294581, "loss": 2.2773, "step": 27357 }, { "epoch": 0.74, "learning_rate": 0.00034574345358678583, "loss": 2.2642, "step": 27358 }, { "epoch": 0.74, "learning_rate": 0.0003456776307006442, "loss": 2.423, "step": 27359 }, { "epoch": 0.74, "learning_rate": 0.0003456118127715317, "loss": 2.1976, "step": 27360 }, { "epoch": 0.74, "learning_rate": 0.00034554599979994737, "loss": 2.5873, "step": 27361 }, { "epoch": 0.74, "learning_rate": 0.00034548019178638967, "loss": 2.7169, "step": 27362 }, { "epoch": 0.74, "learning_rate": 0.0003454143887313568, "loss": 2.5494, "step": 27363 }, { "epoch": 0.74, "learning_rate": 0.0003453485906353474, "loss": 2.492, "step": 27364 }, { "epoch": 0.74, "learning_rate": 0.0003452827974988604, "loss": 2.3191, "step": 27365 }, { "epoch": 0.74, "learning_rate": 0.0003452170093223932, "loss": 2.625, "step": 27366 }, { "epoch": 0.74, "learning_rate": 0.00034515122610644555, "loss": 2.2375, "step": 27367 }, { "epoch": 0.74, "learning_rate": 0.00034508544785151485, "loss": 2.2993, "step": 27368 }, { "epoch": 0.74, "learning_rate": 0.00034501967455809966, "loss": 2.4349, "step": 27369 }, { "epoch": 0.74, "learning_rate": 0.00034495390622669867, "loss": 2.3887, "step": 27370 }, { "epoch": 0.74, "learning_rate": 0.00034488814285780947, "loss": 2.5046, "step": 27371 }, { "epoch": 0.74, "learning_rate": 0.00034482238445193047, "loss": 2.4424, "step": 27372 }, { "epoch": 0.74, "learning_rate": 0.00034475663100956, "loss": 2.2499, "step": 27373 }, { "epoch": 0.74, "learning_rate": 0.00034469088253119616, "loss": 2.2777, "step": 27374 }, { "epoch": 0.74, "learning_rate": 0.0003446251390173374, "loss": 2.9748, "step": 27375 }, { "epoch": 0.74, "learning_rate": 0.0003445594004684811, "loss": 3.1053, "step": 27376 }, { "epoch": 0.74, "learning_rate": 0.0003444936668851255, "loss": 2.2674, "step": 27377 }, { "epoch": 0.74, "learning_rate": 0.0003444279382677691, "loss": 2.3264, "step": 27378 }, { "epoch": 0.74, "learning_rate": 0.00034436221461690874, "loss": 2.7192, "step": 27379 }, { "epoch": 0.74, "learning_rate": 0.00034429649593304334, "loss": 2.3575, "step": 27380 }, { "epoch": 0.74, "learning_rate": 0.00034423078221667094, "loss": 2.7351, "step": 27381 }, { "epoch": 0.74, "learning_rate": 0.00034416507346828843, "loss": 2.4088, "step": 27382 }, { "epoch": 0.74, "learning_rate": 0.00034409936968839437, "loss": 3.3621, "step": 27383 }, { "epoch": 0.74, "learning_rate": 0.00034403367087748593, "loss": 2.1882, "step": 27384 }, { "epoch": 0.74, "learning_rate": 0.0003439679770360611, "loss": 2.4801, "step": 27385 }, { "epoch": 0.74, "learning_rate": 0.00034390228816461754, "loss": 2.6435, "step": 27386 }, { "epoch": 0.74, "learning_rate": 0.00034383660426365304, "loss": 3.1056, "step": 27387 }, { "epoch": 0.74, "learning_rate": 0.0003437709253336652, "loss": 2.389, "step": 27388 }, { "epoch": 0.74, "learning_rate": 0.00034370525137515163, "loss": 2.5362, "step": 27389 }, { "epoch": 0.74, "learning_rate": 0.0003436395823886095, "loss": 1.8295, "step": 27390 }, { "epoch": 0.74, "learning_rate": 0.00034357391837453653, "loss": 2.71, "step": 27391 }, { "epoch": 0.74, "learning_rate": 0.00034350825933343035, "loss": 2.7945, "step": 27392 }, { "epoch": 0.74, "learning_rate": 0.0003434426052657881, "loss": 2.3006, "step": 27393 }, { "epoch": 0.74, "learning_rate": 0.00034337695617210753, "loss": 2.5316, "step": 27394 }, { "epoch": 0.74, "learning_rate": 0.00034331131205288555, "loss": 1.6722, "step": 27395 }, { "epoch": 0.74, "learning_rate": 0.0003432456729086196, "loss": 2.2903, "step": 27396 }, { "epoch": 0.74, "learning_rate": 0.00034318003873980743, "loss": 2.4086, "step": 27397 }, { "epoch": 0.74, "learning_rate": 0.0003431144095469454, "loss": 2.1932, "step": 27398 }, { "epoch": 0.74, "learning_rate": 0.00034304878533053117, "loss": 2.3026, "step": 27399 }, { "epoch": 0.74, "learning_rate": 0.00034298316609106207, "loss": 2.8838, "step": 27400 }, { "epoch": 0.74, "learning_rate": 0.0003429175518290348, "loss": 2.3224, "step": 27401 }, { "epoch": 0.74, "learning_rate": 0.00034285194254494723, "loss": 3.0649, "step": 27402 }, { "epoch": 0.74, "learning_rate": 0.0003427863382392954, "loss": 2.6449, "step": 27403 }, { "epoch": 0.74, "learning_rate": 0.0003427207389125768, "loss": 2.393, "step": 27404 }, { "epoch": 0.74, "learning_rate": 0.0003426551445652883, "loss": 2.6143, "step": 27405 }, { "epoch": 0.74, "learning_rate": 0.000342589555197927, "loss": 1.9, "step": 27406 }, { "epoch": 0.74, "learning_rate": 0.0003425239708109897, "loss": 3.0425, "step": 27407 }, { "epoch": 0.74, "learning_rate": 0.0003424583914049736, "loss": 2.3245, "step": 27408 }, { "epoch": 0.74, "learning_rate": 0.00034239281698037475, "loss": 2.6833, "step": 27409 }, { "epoch": 0.74, "learning_rate": 0.0003423272475376907, "loss": 3.0571, "step": 27410 }, { "epoch": 0.74, "learning_rate": 0.00034226168307741755, "loss": 2.0863, "step": 27411 }, { "epoch": 0.74, "learning_rate": 0.00034219612360005225, "loss": 2.6449, "step": 27412 }, { "epoch": 0.74, "learning_rate": 0.0003421305691060915, "loss": 2.9855, "step": 27413 }, { "epoch": 0.74, "learning_rate": 0.0003420650195960321, "loss": 2.7182, "step": 27414 }, { "epoch": 0.74, "learning_rate": 0.0003419994750703703, "loss": 2.3626, "step": 27415 }, { "epoch": 0.74, "learning_rate": 0.00034193393552960327, "loss": 2.2876, "step": 27416 }, { "epoch": 0.74, "learning_rate": 0.00034186840097422664, "loss": 2.4743, "step": 27417 }, { "epoch": 0.74, "learning_rate": 0.00034180287140473753, "loss": 2.3323, "step": 27418 }, { "epoch": 0.74, "learning_rate": 0.00034173734682163207, "loss": 2.0015, "step": 27419 }, { "epoch": 0.74, "learning_rate": 0.0003416718272254068, "loss": 2.5125, "step": 27420 }, { "epoch": 0.74, "learning_rate": 0.0003416063126165584, "loss": 1.9425, "step": 27421 }, { "epoch": 0.74, "learning_rate": 0.00034154080299558256, "loss": 2.2253, "step": 27422 }, { "epoch": 0.74, "learning_rate": 0.00034147529836297587, "loss": 2.5484, "step": 27423 }, { "epoch": 0.74, "learning_rate": 0.00034140979871923483, "loss": 2.0108, "step": 27424 }, { "epoch": 0.74, "learning_rate": 0.00034134430406485515, "loss": 2.5096, "step": 27425 }, { "epoch": 0.74, "learning_rate": 0.000341278814400333, "loss": 2.0314, "step": 27426 }, { "epoch": 0.74, "learning_rate": 0.00034121332972616536, "loss": 2.6799, "step": 27427 }, { "epoch": 0.74, "learning_rate": 0.00034114785004284745, "loss": 2.7062, "step": 27428 }, { "epoch": 0.74, "learning_rate": 0.00034108237535087596, "loss": 2.4, "step": 27429 }, { "epoch": 0.74, "learning_rate": 0.00034101690565074627, "loss": 2.1658, "step": 27430 }, { "epoch": 0.74, "learning_rate": 0.0003409514409429547, "loss": 2.32, "step": 27431 }, { "epoch": 0.74, "learning_rate": 0.0003408859812279972, "loss": 2.2064, "step": 27432 }, { "epoch": 0.74, "learning_rate": 0.0003408205265063696, "loss": 2.3872, "step": 27433 }, { "epoch": 0.74, "learning_rate": 0.00034075507677856786, "loss": 3.0774, "step": 27434 }, { "epoch": 0.74, "learning_rate": 0.00034068963204508817, "loss": 2.4179, "step": 27435 }, { "epoch": 0.74, "learning_rate": 0.0003406241923064256, "loss": 2.5116, "step": 27436 }, { "epoch": 0.74, "learning_rate": 0.00034055875756307653, "loss": 2.6652, "step": 27437 }, { "epoch": 0.74, "learning_rate": 0.0003404933278155362, "loss": 1.986, "step": 27438 }, { "epoch": 0.74, "learning_rate": 0.00034042790306430007, "loss": 2.5485, "step": 27439 }, { "epoch": 0.74, "learning_rate": 0.000340362483309865, "loss": 2.5148, "step": 27440 }, { "epoch": 0.74, "learning_rate": 0.00034029706855272533, "loss": 2.3285, "step": 27441 }, { "epoch": 0.74, "learning_rate": 0.00034023165879337725, "loss": 2.5103, "step": 27442 }, { "epoch": 0.74, "learning_rate": 0.0003401662540323165, "loss": 2.2638, "step": 27443 }, { "epoch": 0.74, "learning_rate": 0.0003401008542700379, "loss": 2.7954, "step": 27444 }, { "epoch": 0.74, "learning_rate": 0.00034003545950703727, "loss": 2.5601, "step": 27445 }, { "epoch": 0.74, "learning_rate": 0.00033997006974380994, "loss": 2.4275, "step": 27446 }, { "epoch": 0.74, "learning_rate": 0.0003399046849808515, "loss": 2.0036, "step": 27447 }, { "epoch": 0.74, "learning_rate": 0.00033983930521865735, "loss": 2.2549, "step": 27448 }, { "epoch": 0.74, "learning_rate": 0.0003397739304577222, "loss": 1.7951, "step": 27449 }, { "epoch": 0.74, "learning_rate": 0.00033970856069854183, "loss": 2.1166, "step": 27450 }, { "epoch": 0.74, "learning_rate": 0.00033964319594161177, "loss": 2.7768, "step": 27451 }, { "epoch": 0.74, "learning_rate": 0.000339577836187426, "loss": 2.4169, "step": 27452 }, { "epoch": 0.74, "learning_rate": 0.00033951248143648116, "loss": 2.6735, "step": 27453 }, { "epoch": 0.74, "learning_rate": 0.00033944713168927135, "loss": 1.8967, "step": 27454 }, { "epoch": 0.74, "learning_rate": 0.00033938178694629197, "loss": 2.5391, "step": 27455 }, { "epoch": 0.74, "learning_rate": 0.00033931644720803833, "loss": 2.1498, "step": 27456 }, { "epoch": 0.74, "learning_rate": 0.00033925111247500494, "loss": 2.43, "step": 27457 }, { "epoch": 0.74, "learning_rate": 0.00033918578274768697, "loss": 2.2821, "step": 27458 }, { "epoch": 0.74, "learning_rate": 0.00033912045802657933, "loss": 2.958, "step": 27459 }, { "epoch": 0.74, "learning_rate": 0.00033905513831217703, "loss": 3.0137, "step": 27460 }, { "epoch": 0.74, "learning_rate": 0.0003389898236049751, "loss": 2.2625, "step": 27461 }, { "epoch": 0.74, "learning_rate": 0.00033892451390546776, "loss": 2.6205, "step": 27462 }, { "epoch": 0.74, "learning_rate": 0.00033885920921415013, "loss": 2.5914, "step": 27463 }, { "epoch": 0.74, "learning_rate": 0.0003387939095315172, "loss": 2.8119, "step": 27464 }, { "epoch": 0.74, "learning_rate": 0.00033872861485806285, "loss": 2.3721, "step": 27465 }, { "epoch": 0.74, "learning_rate": 0.00033866332519428253, "loss": 2.4306, "step": 27466 }, { "epoch": 0.74, "learning_rate": 0.000338598040540671, "loss": 2.3391, "step": 27467 }, { "epoch": 0.74, "learning_rate": 0.0003385327608977221, "loss": 2.5751, "step": 27468 }, { "epoch": 0.74, "learning_rate": 0.0003384674862659307, "loss": 2.1604, "step": 27469 }, { "epoch": 0.74, "learning_rate": 0.00033840221664579187, "loss": 2.1963, "step": 27470 }, { "epoch": 0.74, "learning_rate": 0.000338336952037799, "loss": 2.868, "step": 27471 }, { "epoch": 0.74, "learning_rate": 0.00033827169244244725, "loss": 2.6313, "step": 27472 }, { "epoch": 0.74, "learning_rate": 0.00033820643786023073, "loss": 2.3171, "step": 27473 }, { "epoch": 0.74, "learning_rate": 0.0003381411882916441, "loss": 2.2801, "step": 27474 }, { "epoch": 0.74, "learning_rate": 0.00033807594373718163, "loss": 2.805, "step": 27475 }, { "epoch": 0.74, "learning_rate": 0.00033801070419733724, "loss": 2.357, "step": 27476 }, { "epoch": 0.74, "learning_rate": 0.0003379454696726054, "loss": 2.3304, "step": 27477 }, { "epoch": 0.74, "learning_rate": 0.0003378802401634803, "loss": 2.53, "step": 27478 }, { "epoch": 0.74, "learning_rate": 0.00033781501567045613, "loss": 2.8432, "step": 27479 }, { "epoch": 0.74, "learning_rate": 0.00033774979619402736, "loss": 2.3764, "step": 27480 }, { "epoch": 0.74, "learning_rate": 0.00033768458173468743, "loss": 2.7623, "step": 27481 }, { "epoch": 0.74, "learning_rate": 0.0003376193722929306, "loss": 3.0579, "step": 27482 }, { "epoch": 0.74, "learning_rate": 0.00033755416786925143, "loss": 2.4992, "step": 27483 }, { "epoch": 0.74, "learning_rate": 0.000337488968464143, "loss": 2.5662, "step": 27484 }, { "epoch": 0.74, "learning_rate": 0.00033742377407809974, "loss": 2.9148, "step": 27485 }, { "epoch": 0.74, "learning_rate": 0.0003373585847116156, "loss": 2.4177, "step": 27486 }, { "epoch": 0.74, "learning_rate": 0.0003372934003651843, "loss": 2.0982, "step": 27487 }, { "epoch": 0.74, "learning_rate": 0.00033722822103929995, "loss": 2.6249, "step": 27488 }, { "epoch": 0.74, "learning_rate": 0.00033716304673445585, "loss": 2.5599, "step": 27489 }, { "epoch": 0.74, "learning_rate": 0.00033709787745114605, "loss": 2.8163, "step": 27490 }, { "epoch": 0.74, "learning_rate": 0.0003370327131898642, "loss": 2.5629, "step": 27491 }, { "epoch": 0.74, "learning_rate": 0.0003369675539511039, "loss": 3.0094, "step": 27492 }, { "epoch": 0.74, "learning_rate": 0.00033690239973535894, "loss": 2.4192, "step": 27493 }, { "epoch": 0.74, "learning_rate": 0.0003368372505431232, "loss": 2.8143, "step": 27494 }, { "epoch": 0.74, "learning_rate": 0.0003367721063748895, "loss": 2.5789, "step": 27495 }, { "epoch": 0.74, "learning_rate": 0.00033670696723115214, "loss": 2.3478, "step": 27496 }, { "epoch": 0.74, "learning_rate": 0.0003366418331124038, "loss": 2.5267, "step": 27497 }, { "epoch": 0.74, "learning_rate": 0.00033657670401913845, "loss": 2.1684, "step": 27498 }, { "epoch": 0.74, "learning_rate": 0.00033651157995184935, "loss": 2.5336, "step": 27499 }, { "epoch": 0.74, "learning_rate": 0.00033644646091102984, "loss": 2.3828, "step": 27500 }, { "epoch": 0.74, "learning_rate": 0.0003363813468971733, "loss": 2.49, "step": 27501 }, { "epoch": 0.74, "learning_rate": 0.00033631623791077335, "loss": 2.5211, "step": 27502 }, { "epoch": 0.74, "learning_rate": 0.0003362511339523226, "loss": 2.677, "step": 27503 }, { "epoch": 0.74, "learning_rate": 0.00033618603502231473, "loss": 2.5817, "step": 27504 }, { "epoch": 0.74, "learning_rate": 0.0003361209411212427, "loss": 2.3582, "step": 27505 }, { "epoch": 0.74, "learning_rate": 0.00033605585224959965, "loss": 2.3426, "step": 27506 }, { "epoch": 0.74, "learning_rate": 0.00033599076840787925, "loss": 2.1094, "step": 27507 }, { "epoch": 0.74, "learning_rate": 0.0003359256895965735, "loss": 2.4278, "step": 27508 }, { "epoch": 0.74, "learning_rate": 0.0003358606158161762, "loss": 2.8219, "step": 27509 }, { "epoch": 0.74, "learning_rate": 0.0003357955470671804, "loss": 2.38, "step": 27510 }, { "epoch": 0.74, "learning_rate": 0.0003357304833500785, "loss": 2.4718, "step": 27511 }, { "epoch": 0.74, "learning_rate": 0.00033566542466536333, "loss": 2.2057, "step": 27512 }, { "epoch": 0.74, "learning_rate": 0.0003356003710135288, "loss": 2.062, "step": 27513 }, { "epoch": 0.74, "learning_rate": 0.0003355353223950668, "loss": 2.8391, "step": 27514 }, { "epoch": 0.74, "learning_rate": 0.0003354702788104706, "loss": 2.8782, "step": 27515 }, { "epoch": 0.74, "learning_rate": 0.00033540524026023254, "loss": 2.4612, "step": 27516 }, { "epoch": 0.74, "learning_rate": 0.0003353402067448456, "loss": 2.6144, "step": 27517 }, { "epoch": 0.74, "learning_rate": 0.00033527517826480234, "loss": 2.1421, "step": 27518 }, { "epoch": 0.74, "learning_rate": 0.0003352101548205955, "loss": 2.7415, "step": 27519 }, { "epoch": 0.74, "learning_rate": 0.00033514513641271773, "loss": 2.406, "step": 27520 }, { "epoch": 0.74, "learning_rate": 0.0003350801230416618, "loss": 2.6092, "step": 27521 }, { "epoch": 0.74, "learning_rate": 0.0003350151147079197, "loss": 2.2909, "step": 27522 }, { "epoch": 0.74, "learning_rate": 0.0003349501114119844, "loss": 2.375, "step": 27523 }, { "epoch": 0.74, "learning_rate": 0.00033488511315434764, "loss": 2.4953, "step": 27524 }, { "epoch": 0.74, "learning_rate": 0.00033482011993550266, "loss": 2.4743, "step": 27525 }, { "epoch": 0.74, "learning_rate": 0.0003347551317559419, "loss": 2.196, "step": 27526 }, { "epoch": 0.74, "learning_rate": 0.0003346901486161569, "loss": 2.6362, "step": 27527 }, { "epoch": 0.74, "learning_rate": 0.00033462517051664043, "loss": 2.0333, "step": 27528 }, { "epoch": 0.74, "learning_rate": 0.000334560197457885, "loss": 2.4893, "step": 27529 }, { "epoch": 0.74, "learning_rate": 0.00033449522944038225, "loss": 2.1237, "step": 27530 }, { "epoch": 0.74, "learning_rate": 0.0003344302664646246, "loss": 2.5624, "step": 27531 }, { "epoch": 0.74, "learning_rate": 0.00033436530853110435, "loss": 2.7989, "step": 27532 }, { "epoch": 0.74, "learning_rate": 0.00033430035564031347, "loss": 1.8578, "step": 27533 }, { "epoch": 0.74, "learning_rate": 0.0003342354077927444, "loss": 2.7736, "step": 27534 }, { "epoch": 0.74, "learning_rate": 0.0003341704649888886, "loss": 2.4899, "step": 27535 }, { "epoch": 0.74, "learning_rate": 0.00033410552722923825, "loss": 2.6124, "step": 27536 }, { "epoch": 0.74, "learning_rate": 0.00033404059451428537, "loss": 2.7857, "step": 27537 }, { "epoch": 0.74, "learning_rate": 0.00033397566684452196, "loss": 2.2214, "step": 27538 }, { "epoch": 0.74, "learning_rate": 0.00033391074422043976, "loss": 2.8738, "step": 27539 }, { "epoch": 0.74, "learning_rate": 0.00033384582664253105, "loss": 2.1853, "step": 27540 }, { "epoch": 0.74, "learning_rate": 0.0003337809141112869, "loss": 2.2931, "step": 27541 }, { "epoch": 0.74, "learning_rate": 0.00033371600662719967, "loss": 2.7811, "step": 27542 }, { "epoch": 0.74, "learning_rate": 0.00033365110419076075, "loss": 2.6785, "step": 27543 }, { "epoch": 0.74, "learning_rate": 0.0003335862068024618, "loss": 2.5948, "step": 27544 }, { "epoch": 0.74, "learning_rate": 0.00033352131446279454, "loss": 2.5852, "step": 27545 }, { "epoch": 0.74, "learning_rate": 0.0003334564271722507, "loss": 2.4395, "step": 27546 }, { "epoch": 0.74, "learning_rate": 0.00033339154493132185, "loss": 2.6104, "step": 27547 }, { "epoch": 0.74, "learning_rate": 0.00033332666774049967, "loss": 2.4957, "step": 27548 }, { "epoch": 0.74, "learning_rate": 0.00033326179560027523, "loss": 2.2926, "step": 27549 }, { "epoch": 0.74, "learning_rate": 0.0003331969285111403, "loss": 2.5611, "step": 27550 }, { "epoch": 0.74, "learning_rate": 0.00033313206647358617, "loss": 2.6476, "step": 27551 }, { "epoch": 0.74, "learning_rate": 0.0003330672094881042, "loss": 2.6762, "step": 27552 }, { "epoch": 0.74, "learning_rate": 0.00033300235755518625, "loss": 2.3214, "step": 27553 }, { "epoch": 0.74, "learning_rate": 0.00033293751067532283, "loss": 2.3633, "step": 27554 }, { "epoch": 0.74, "learning_rate": 0.0003328726688490056, "loss": 2.0775, "step": 27555 }, { "epoch": 0.74, "learning_rate": 0.00033280783207672595, "loss": 2.402, "step": 27556 }, { "epoch": 0.74, "learning_rate": 0.00033274300035897466, "loss": 3.0047, "step": 27557 }, { "epoch": 0.74, "learning_rate": 0.0003326781736962431, "loss": 2.2944, "step": 27558 }, { "epoch": 0.74, "learning_rate": 0.00033261335208902243, "loss": 2.9038, "step": 27559 }, { "epoch": 0.74, "learning_rate": 0.0003325485355378036, "loss": 2.4533, "step": 27560 }, { "epoch": 0.74, "learning_rate": 0.00033248372404307816, "loss": 2.8026, "step": 27561 }, { "epoch": 0.74, "learning_rate": 0.0003324189176053363, "loss": 2.5276, "step": 27562 }, { "epoch": 0.74, "learning_rate": 0.00033235411622506927, "loss": 2.5375, "step": 27563 }, { "epoch": 0.74, "learning_rate": 0.0003322893199027682, "loss": 2.7095, "step": 27564 }, { "epoch": 0.74, "learning_rate": 0.0003322245286389239, "loss": 2.5736, "step": 27565 }, { "epoch": 0.74, "learning_rate": 0.00033215974243402745, "loss": 2.3262, "step": 27566 }, { "epoch": 0.74, "learning_rate": 0.0003320949612885691, "loss": 2.3633, "step": 27567 }, { "epoch": 0.74, "learning_rate": 0.00033203018520303995, "loss": 2.5256, "step": 27568 }, { "epoch": 0.74, "learning_rate": 0.0003319654141779309, "loss": 2.8326, "step": 27569 }, { "epoch": 0.74, "learning_rate": 0.00033190064821373225, "loss": 2.1807, "step": 27570 }, { "epoch": 0.74, "learning_rate": 0.0003318358873109344, "loss": 2.4987, "step": 27571 }, { "epoch": 0.74, "learning_rate": 0.0003317711314700291, "loss": 2.2538, "step": 27572 }, { "epoch": 0.74, "learning_rate": 0.00033170638069150596, "loss": 2.4891, "step": 27573 }, { "epoch": 0.74, "learning_rate": 0.0003316416349758558, "loss": 2.5511, "step": 27574 }, { "epoch": 0.74, "learning_rate": 0.0003315768943235694, "loss": 2.2995, "step": 27575 }, { "epoch": 0.74, "learning_rate": 0.00033151215873513664, "loss": 2.4886, "step": 27576 }, { "epoch": 0.74, "learning_rate": 0.00033144742821104823, "loss": 2.0745, "step": 27577 }, { "epoch": 0.74, "learning_rate": 0.0003313827027517946, "loss": 2.4435, "step": 27578 }, { "epoch": 0.74, "learning_rate": 0.00033131798235786603, "loss": 2.1869, "step": 27579 }, { "epoch": 0.74, "learning_rate": 0.00033125326702975334, "loss": 2.4435, "step": 27580 }, { "epoch": 0.74, "learning_rate": 0.00033118855676794593, "loss": 2.1058, "step": 27581 }, { "epoch": 0.74, "learning_rate": 0.00033112385157293435, "loss": 2.4964, "step": 27582 }, { "epoch": 0.74, "learning_rate": 0.00033105915144520927, "loss": 1.8989, "step": 27583 }, { "epoch": 0.74, "learning_rate": 0.0003309944563852598, "loss": 2.6133, "step": 27584 }, { "epoch": 0.74, "learning_rate": 0.00033092976639357755, "loss": 2.9045, "step": 27585 }, { "epoch": 0.74, "learning_rate": 0.0003308650814706512, "loss": 2.4763, "step": 27586 }, { "epoch": 0.74, "learning_rate": 0.00033080040161697147, "loss": 3.1173, "step": 27587 }, { "epoch": 0.74, "learning_rate": 0.0003307357268330286, "loss": 2.45, "step": 27588 }, { "epoch": 0.74, "learning_rate": 0.0003306710571193119, "loss": 2.1007, "step": 27589 }, { "epoch": 0.74, "learning_rate": 0.00033060639247631154, "loss": 2.391, "step": 27590 }, { "epoch": 0.74, "learning_rate": 0.0003305417329045175, "loss": 2.2649, "step": 27591 }, { "epoch": 0.74, "learning_rate": 0.00033047707840441954, "loss": 2.7414, "step": 27592 }, { "epoch": 0.74, "learning_rate": 0.00033041242897650794, "loss": 2.2045, "step": 27593 }, { "epoch": 0.74, "learning_rate": 0.0003303477846212718, "loss": 2.1447, "step": 27594 }, { "epoch": 0.74, "learning_rate": 0.000330283145339201, "loss": 1.9727, "step": 27595 }, { "epoch": 0.74, "learning_rate": 0.0003302185111307857, "loss": 2.8143, "step": 27596 }, { "epoch": 0.74, "learning_rate": 0.00033015388199651464, "loss": 2.7184, "step": 27597 }, { "epoch": 0.74, "learning_rate": 0.0003300892579368783, "loss": 2.0268, "step": 27598 }, { "epoch": 0.74, "learning_rate": 0.0003300246389523662, "loss": 2.6582, "step": 27599 }, { "epoch": 0.74, "learning_rate": 0.00032996002504346743, "loss": 2.4494, "step": 27600 }, { "epoch": 0.74, "learning_rate": 0.00032989541621067207, "loss": 2.3237, "step": 27601 }, { "epoch": 0.74, "learning_rate": 0.0003298308124544689, "loss": 2.5792, "step": 27602 }, { "epoch": 0.74, "learning_rate": 0.00032976621377534763, "loss": 2.8116, "step": 27603 }, { "epoch": 0.74, "learning_rate": 0.0003297016201737977, "loss": 2.3159, "step": 27604 }, { "epoch": 0.74, "learning_rate": 0.00032963703165030843, "loss": 2.6128, "step": 27605 }, { "epoch": 0.74, "learning_rate": 0.00032957244820536923, "loss": 2.0352, "step": 27606 }, { "epoch": 0.74, "learning_rate": 0.0003295078698394697, "loss": 2.3267, "step": 27607 }, { "epoch": 0.74, "learning_rate": 0.0003294432965530982, "loss": 2.3486, "step": 27608 }, { "epoch": 0.74, "learning_rate": 0.00032937872834674475, "loss": 2.3801, "step": 27609 }, { "epoch": 0.74, "learning_rate": 0.0003293141652208975, "loss": 2.4967, "step": 27610 }, { "epoch": 0.74, "learning_rate": 0.0003292496071760467, "loss": 2.312, "step": 27611 }, { "epoch": 0.74, "learning_rate": 0.00032918505421268107, "loss": 2.6019, "step": 27612 }, { "epoch": 0.74, "learning_rate": 0.0003291205063312893, "loss": 2.6559, "step": 27613 }, { "epoch": 0.74, "learning_rate": 0.0003290559635323607, "loss": 2.7795, "step": 27614 }, { "epoch": 0.74, "learning_rate": 0.0003289914258163844, "loss": 2.0365, "step": 27615 }, { "epoch": 0.74, "learning_rate": 0.0003289268931838488, "loss": 2.61, "step": 27616 }, { "epoch": 0.74, "learning_rate": 0.0003288623656352431, "loss": 2.1943, "step": 27617 }, { "epoch": 0.74, "learning_rate": 0.0003287978431710561, "loss": 2.329, "step": 27618 }, { "epoch": 0.74, "learning_rate": 0.00032873332579177675, "loss": 2.1757, "step": 27619 }, { "epoch": 0.74, "learning_rate": 0.0003286688134978939, "loss": 2.1031, "step": 27620 }, { "epoch": 0.74, "learning_rate": 0.0003286043062898958, "loss": 2.2526, "step": 27621 }, { "epoch": 0.74, "learning_rate": 0.00032853980416827145, "loss": 2.788, "step": 27622 }, { "epoch": 0.74, "learning_rate": 0.0003284753071335095, "loss": 2.2899, "step": 27623 }, { "epoch": 0.74, "learning_rate": 0.0003284108151860986, "loss": 2.1492, "step": 27624 }, { "epoch": 0.74, "learning_rate": 0.00032834632832652724, "loss": 2.6005, "step": 27625 }, { "epoch": 0.74, "learning_rate": 0.00032828184655528435, "loss": 2.9412, "step": 27626 }, { "epoch": 0.74, "learning_rate": 0.00032821736987285777, "loss": 2.579, "step": 27627 }, { "epoch": 0.74, "learning_rate": 0.0003281528982797366, "loss": 2.4527, "step": 27628 }, { "epoch": 0.74, "learning_rate": 0.00032808843177640866, "loss": 2.2479, "step": 27629 }, { "epoch": 0.74, "learning_rate": 0.00032802397036336273, "loss": 2.3768, "step": 27630 }, { "epoch": 0.74, "learning_rate": 0.00032795951404108694, "loss": 2.5243, "step": 27631 }, { "epoch": 0.74, "learning_rate": 0.00032789506281006973, "loss": 2.6926, "step": 27632 }, { "epoch": 0.74, "learning_rate": 0.00032783061667079937, "loss": 2.9987, "step": 27633 }, { "epoch": 0.74, "learning_rate": 0.00032776617562376445, "loss": 2.2985, "step": 27634 }, { "epoch": 0.74, "learning_rate": 0.0003277017396694525, "loss": 1.9267, "step": 27635 }, { "epoch": 0.74, "learning_rate": 0.00032763730880835197, "loss": 2.9198, "step": 27636 }, { "epoch": 0.74, "learning_rate": 0.0003275728830409509, "loss": 2.4953, "step": 27637 }, { "epoch": 0.74, "learning_rate": 0.0003275084623677375, "loss": 2.3681, "step": 27638 }, { "epoch": 0.74, "learning_rate": 0.00032744404678920004, "loss": 1.9614, "step": 27639 }, { "epoch": 0.74, "learning_rate": 0.000327379636305826, "loss": 2.8669, "step": 27640 }, { "epoch": 0.74, "learning_rate": 0.00032731523091810344, "loss": 3.0095, "step": 27641 }, { "epoch": 0.74, "learning_rate": 0.0003272508306265209, "loss": 2.8116, "step": 27642 }, { "epoch": 0.74, "learning_rate": 0.00032718643543156535, "loss": 2.6348, "step": 27643 }, { "epoch": 0.74, "learning_rate": 0.0003271220453337251, "loss": 2.668, "step": 27644 }, { "epoch": 0.74, "learning_rate": 0.00032705766033348804, "loss": 2.5766, "step": 27645 }, { "epoch": 0.74, "learning_rate": 0.0003269932804313418, "loss": 2.5395, "step": 27646 }, { "epoch": 0.74, "learning_rate": 0.0003269289056277744, "loss": 2.2078, "step": 27647 }, { "epoch": 0.74, "learning_rate": 0.00032686453592327305, "loss": 2.4534, "step": 27648 }, { "epoch": 0.74, "learning_rate": 0.0003268001713183255, "loss": 2.1874, "step": 27649 }, { "epoch": 0.74, "learning_rate": 0.0003267358118134196, "loss": 2.3972, "step": 27650 }, { "epoch": 0.74, "learning_rate": 0.00032667145740904283, "loss": 2.409, "step": 27651 }, { "epoch": 0.74, "learning_rate": 0.00032660710810568263, "loss": 1.9671, "step": 27652 }, { "epoch": 0.74, "learning_rate": 0.000326542763903827, "loss": 2.7218, "step": 27653 }, { "epoch": 0.74, "learning_rate": 0.0003264784248039625, "loss": 2.5318, "step": 27654 }, { "epoch": 0.74, "learning_rate": 0.00032641409080657756, "loss": 2.2528, "step": 27655 }, { "epoch": 0.74, "learning_rate": 0.0003263497619121586, "loss": 2.2302, "step": 27656 }, { "epoch": 0.74, "learning_rate": 0.00032628543812119313, "loss": 2.0931, "step": 27657 }, { "epoch": 0.74, "learning_rate": 0.00032622111943416933, "loss": 2.5862, "step": 27658 }, { "epoch": 0.74, "learning_rate": 0.0003261568058515736, "loss": 2.5351, "step": 27659 }, { "epoch": 0.74, "learning_rate": 0.0003260924973738935, "loss": 2.0654, "step": 27660 }, { "epoch": 0.74, "learning_rate": 0.00032602819400161633, "loss": 2.1863, "step": 27661 }, { "epoch": 0.74, "learning_rate": 0.0003259638957352289, "loss": 2.5862, "step": 27662 }, { "epoch": 0.74, "learning_rate": 0.00032589960257521834, "loss": 2.4322, "step": 27663 }, { "epoch": 0.74, "learning_rate": 0.0003258353145220719, "loss": 2.2464, "step": 27664 }, { "epoch": 0.74, "learning_rate": 0.0003257710315762766, "loss": 2.1968, "step": 27665 }, { "epoch": 0.74, "learning_rate": 0.0003257067537383198, "loss": 2.3616, "step": 27666 }, { "epoch": 0.74, "learning_rate": 0.00032564248100868775, "loss": 2.5711, "step": 27667 }, { "epoch": 0.74, "learning_rate": 0.00032557821338786774, "loss": 2.5617, "step": 27668 }, { "epoch": 0.74, "learning_rate": 0.00032551395087634683, "loss": 2.5984, "step": 27669 }, { "epoch": 0.74, "learning_rate": 0.0003254496934746111, "loss": 2.5498, "step": 27670 }, { "epoch": 0.74, "learning_rate": 0.0003253854411831485, "loss": 3.0264, "step": 27671 }, { "epoch": 0.74, "learning_rate": 0.00032532119400244475, "loss": 2.6111, "step": 27672 }, { "epoch": 0.74, "learning_rate": 0.0003252569519329872, "loss": 2.4374, "step": 27673 }, { "epoch": 0.74, "learning_rate": 0.0003251927149752626, "loss": 2.4712, "step": 27674 }, { "epoch": 0.74, "learning_rate": 0.00032512848312975695, "loss": 2.5096, "step": 27675 }, { "epoch": 0.74, "learning_rate": 0.00032506425639695734, "loss": 2.4408, "step": 27676 }, { "epoch": 0.74, "learning_rate": 0.0003250000347773502, "loss": 2.5603, "step": 27677 }, { "epoch": 0.74, "learning_rate": 0.0003249358182714222, "loss": 2.1746, "step": 27678 }, { "epoch": 0.74, "learning_rate": 0.00032487160687966, "loss": 2.5488, "step": 27679 }, { "epoch": 0.74, "learning_rate": 0.00032480740060254943, "loss": 2.7024, "step": 27680 }, { "epoch": 0.74, "learning_rate": 0.0003247431994405774, "loss": 2.0011, "step": 27681 }, { "epoch": 0.74, "learning_rate": 0.0003246790033942304, "loss": 2.3855, "step": 27682 }, { "epoch": 0.74, "learning_rate": 0.00032461481246399396, "loss": 2.4163, "step": 27683 }, { "epoch": 0.74, "learning_rate": 0.0003245506266503553, "loss": 2.9086, "step": 27684 }, { "epoch": 0.74, "learning_rate": 0.0003244864459538005, "loss": 2.4106, "step": 27685 }, { "epoch": 0.74, "learning_rate": 0.0003244222703748154, "loss": 2.9218, "step": 27686 }, { "epoch": 0.74, "learning_rate": 0.0003243580999138864, "loss": 1.9908, "step": 27687 }, { "epoch": 0.74, "learning_rate": 0.0003242939345715, "loss": 2.3791, "step": 27688 }, { "epoch": 0.74, "learning_rate": 0.0003242297743481416, "loss": 2.2715, "step": 27689 }, { "epoch": 0.74, "learning_rate": 0.00032416561924429756, "loss": 2.1056, "step": 27690 }, { "epoch": 0.74, "learning_rate": 0.00032410146926045404, "loss": 2.6435, "step": 27691 }, { "epoch": 0.74, "learning_rate": 0.00032403732439709686, "loss": 2.3424, "step": 27692 }, { "epoch": 0.74, "learning_rate": 0.0003239731846547124, "loss": 2.7822, "step": 27693 }, { "epoch": 0.74, "learning_rate": 0.000323909050033786, "loss": 2.0872, "step": 27694 }, { "epoch": 0.74, "learning_rate": 0.00032384492053480366, "loss": 2.3771, "step": 27695 }, { "epoch": 0.74, "learning_rate": 0.0003237807961582514, "loss": 2.5102, "step": 27696 }, { "epoch": 0.74, "learning_rate": 0.0003237166769046148, "loss": 2.6758, "step": 27697 }, { "epoch": 0.74, "learning_rate": 0.00032365256277438017, "loss": 2.3541, "step": 27698 }, { "epoch": 0.74, "learning_rate": 0.00032358845376803246, "loss": 2.635, "step": 27699 }, { "epoch": 0.74, "learning_rate": 0.00032352434988605774, "loss": 2.3381, "step": 27700 }, { "epoch": 0.74, "learning_rate": 0.00032346025112894183, "loss": 2.4081, "step": 27701 }, { "epoch": 0.74, "learning_rate": 0.00032339615749716987, "loss": 2.5731, "step": 27702 }, { "epoch": 0.74, "learning_rate": 0.00032333206899122735, "loss": 2.9203, "step": 27703 }, { "epoch": 0.74, "learning_rate": 0.00032326798561160066, "loss": 2.546, "step": 27704 }, { "epoch": 0.74, "learning_rate": 0.0003232039073587745, "loss": 2.4826, "step": 27705 }, { "epoch": 0.74, "learning_rate": 0.0003231398342332347, "loss": 2.7679, "step": 27706 }, { "epoch": 0.74, "learning_rate": 0.00032307576623546633, "loss": 2.6566, "step": 27707 }, { "epoch": 0.74, "learning_rate": 0.0003230117033659549, "loss": 2.4358, "step": 27708 }, { "epoch": 0.74, "learning_rate": 0.00032294764562518577, "loss": 2.3715, "step": 27709 }, { "epoch": 0.74, "learning_rate": 0.0003228835930136441, "loss": 2.5867, "step": 27710 }, { "epoch": 0.74, "learning_rate": 0.0003228195455318155, "loss": 2.5747, "step": 27711 }, { "epoch": 0.74, "learning_rate": 0.0003227555031801851, "loss": 2.4799, "step": 27712 }, { "epoch": 0.74, "learning_rate": 0.0003226914659592376, "loss": 2.7323, "step": 27713 }, { "epoch": 0.74, "learning_rate": 0.00032262743386945894, "loss": 2.9536, "step": 27714 }, { "epoch": 0.74, "learning_rate": 0.00032256340691133324, "loss": 1.978, "step": 27715 }, { "epoch": 0.74, "learning_rate": 0.00032249938508534584, "loss": 2.3757, "step": 27716 }, { "epoch": 0.74, "learning_rate": 0.0003224353683919826, "loss": 2.6278, "step": 27717 }, { "epoch": 0.74, "learning_rate": 0.0003223713568317276, "loss": 2.6515, "step": 27718 }, { "epoch": 0.74, "learning_rate": 0.000322307350405066, "loss": 2.6009, "step": 27719 }, { "epoch": 0.74, "learning_rate": 0.000322243349112483, "loss": 2.5635, "step": 27720 }, { "epoch": 0.74, "learning_rate": 0.000322179352954463, "loss": 2.7961, "step": 27721 }, { "epoch": 0.74, "learning_rate": 0.00032211536193149106, "loss": 2.6221, "step": 27722 }, { "epoch": 0.75, "learning_rate": 0.00032205137604405186, "loss": 1.9647, "step": 27723 }, { "epoch": 0.75, "learning_rate": 0.0003219873952926302, "loss": 2.2225, "step": 27724 }, { "epoch": 0.75, "learning_rate": 0.0003219234196777112, "loss": 2.7598, "step": 27725 }, { "epoch": 0.75, "learning_rate": 0.00032185944919977885, "loss": 2.3395, "step": 27726 }, { "epoch": 0.75, "learning_rate": 0.000321795483859318, "loss": 2.5956, "step": 27727 }, { "epoch": 0.75, "learning_rate": 0.00032173152365681367, "loss": 2.7113, "step": 27728 }, { "epoch": 0.75, "learning_rate": 0.00032166756859274947, "loss": 2.296, "step": 27729 }, { "epoch": 0.75, "learning_rate": 0.0003216036186676108, "loss": 2.1578, "step": 27730 }, { "epoch": 0.75, "learning_rate": 0.0003215396738818821, "loss": 2.4794, "step": 27731 }, { "epoch": 0.75, "learning_rate": 0.0003214757342360471, "loss": 2.4173, "step": 27732 }, { "epoch": 0.75, "learning_rate": 0.00032141179973059123, "loss": 2.6349, "step": 27733 }, { "epoch": 0.75, "learning_rate": 0.0003213478703659978, "loss": 2.1394, "step": 27734 }, { "epoch": 0.75, "learning_rate": 0.00032128394614275145, "loss": 2.7296, "step": 27735 }, { "epoch": 0.75, "learning_rate": 0.00032122002706133667, "loss": 2.36, "step": 27736 }, { "epoch": 0.75, "learning_rate": 0.00032115611312223756, "loss": 2.3769, "step": 27737 }, { "epoch": 0.75, "learning_rate": 0.0003210922043259384, "loss": 2.0493, "step": 27738 }, { "epoch": 0.75, "learning_rate": 0.0003210283006729238, "loss": 2.8668, "step": 27739 }, { "epoch": 0.75, "learning_rate": 0.00032096440216367695, "loss": 2.6721, "step": 27740 }, { "epoch": 0.75, "learning_rate": 0.0003209005087986827, "loss": 2.1006, "step": 27741 }, { "epoch": 0.75, "learning_rate": 0.0003208366205784241, "loss": 2.6835, "step": 27742 }, { "epoch": 0.75, "learning_rate": 0.0003207727375033862, "loss": 3.0309, "step": 27743 }, { "epoch": 0.75, "learning_rate": 0.00032070885957405295, "loss": 2.7937, "step": 27744 }, { "epoch": 0.75, "learning_rate": 0.0003206449867909076, "loss": 2.8105, "step": 27745 }, { "epoch": 0.75, "learning_rate": 0.00032058111915443443, "loss": 2.6362, "step": 27746 }, { "epoch": 0.75, "learning_rate": 0.0003205172566651174, "loss": 2.5767, "step": 27747 }, { "epoch": 0.75, "learning_rate": 0.00032045339932344, "loss": 3.0024, "step": 27748 }, { "epoch": 0.75, "learning_rate": 0.00032038954712988613, "loss": 2.2489, "step": 27749 }, { "epoch": 0.75, "learning_rate": 0.00032032570008493945, "loss": 2.3631, "step": 27750 }, { "epoch": 0.75, "learning_rate": 0.00032026185818908383, "loss": 2.8932, "step": 27751 }, { "epoch": 0.75, "learning_rate": 0.0003201980214428032, "loss": 2.5281, "step": 27752 }, { "epoch": 0.75, "learning_rate": 0.00032013418984658037, "loss": 2.4674, "step": 27753 }, { "epoch": 0.75, "learning_rate": 0.0003200703634008995, "loss": 2.3682, "step": 27754 }, { "epoch": 0.75, "learning_rate": 0.0003200065421062439, "loss": 2.2753, "step": 27755 }, { "epoch": 0.75, "learning_rate": 0.00031994272596309723, "loss": 2.1883, "step": 27756 }, { "epoch": 0.75, "learning_rate": 0.0003198789149719432, "loss": 2.2029, "step": 27757 }, { "epoch": 0.75, "learning_rate": 0.00031981510913326464, "loss": 2.5534, "step": 27758 }, { "epoch": 0.75, "learning_rate": 0.0003197513084475451, "loss": 2.7063, "step": 27759 }, { "epoch": 0.75, "learning_rate": 0.00031968751291526845, "loss": 2.2497, "step": 27760 }, { "epoch": 0.75, "learning_rate": 0.0003196237225369172, "loss": 2.4847, "step": 27761 }, { "epoch": 0.75, "learning_rate": 0.0003195599373129749, "loss": 2.9236, "step": 27762 }, { "epoch": 0.75, "learning_rate": 0.000319496157243925, "loss": 2.2919, "step": 27763 }, { "epoch": 0.75, "learning_rate": 0.0003194323823302505, "loss": 2.6533, "step": 27764 }, { "epoch": 0.75, "learning_rate": 0.00031936861257243456, "loss": 1.9376, "step": 27765 }, { "epoch": 0.75, "learning_rate": 0.0003193048479709607, "loss": 2.5851, "step": 27766 }, { "epoch": 0.75, "learning_rate": 0.0003192410885263113, "loss": 2.3052, "step": 27767 }, { "epoch": 0.75, "learning_rate": 0.00031917733423896964, "loss": 2.5506, "step": 27768 }, { "epoch": 0.75, "learning_rate": 0.0003191135851094189, "loss": 2.4979, "step": 27769 }, { "epoch": 0.75, "learning_rate": 0.00031904984113814185, "loss": 2.6849, "step": 27770 }, { "epoch": 0.75, "learning_rate": 0.00031898610232562177, "loss": 2.5256, "step": 27771 }, { "epoch": 0.75, "learning_rate": 0.00031892236867234083, "loss": 3.0056, "step": 27772 }, { "epoch": 0.75, "learning_rate": 0.0003188586401787823, "loss": 2.6708, "step": 27773 }, { "epoch": 0.75, "learning_rate": 0.0003187949168454293, "loss": 2.3479, "step": 27774 }, { "epoch": 0.75, "learning_rate": 0.0003187311986727639, "loss": 2.4641, "step": 27775 }, { "epoch": 0.75, "learning_rate": 0.00031866748566126914, "loss": 2.8452, "step": 27776 }, { "epoch": 0.75, "learning_rate": 0.00031860377781142766, "loss": 2.5526, "step": 27777 }, { "epoch": 0.75, "learning_rate": 0.0003185400751237222, "loss": 2.4554, "step": 27778 }, { "epoch": 0.75, "learning_rate": 0.00031847637759863556, "loss": 2.2543, "step": 27779 }, { "epoch": 0.75, "learning_rate": 0.00031841268523664966, "loss": 3.0592, "step": 27780 }, { "epoch": 0.75, "learning_rate": 0.00031834899803824757, "loss": 2.5842, "step": 27781 }, { "epoch": 0.75, "learning_rate": 0.0003182853160039114, "loss": 2.2733, "step": 27782 }, { "epoch": 0.75, "learning_rate": 0.0003182216391341239, "loss": 2.3245, "step": 27783 }, { "epoch": 0.75, "learning_rate": 0.00031815796742936775, "loss": 2.7686, "step": 27784 }, { "epoch": 0.75, "learning_rate": 0.0003180943008901246, "loss": 2.6648, "step": 27785 }, { "epoch": 0.75, "learning_rate": 0.000318030639516877, "loss": 2.5054, "step": 27786 }, { "epoch": 0.75, "learning_rate": 0.00031796698331010775, "loss": 2.3373, "step": 27787 }, { "epoch": 0.75, "learning_rate": 0.00031790333227029843, "loss": 2.2974, "step": 27788 }, { "epoch": 0.75, "learning_rate": 0.00031783968639793116, "loss": 2.8412, "step": 27789 }, { "epoch": 0.75, "learning_rate": 0.00031777604569348906, "loss": 2.2919, "step": 27790 }, { "epoch": 0.75, "learning_rate": 0.00031771241015745335, "loss": 2.6413, "step": 27791 }, { "epoch": 0.75, "learning_rate": 0.00031764877979030684, "loss": 2.7696, "step": 27792 }, { "epoch": 0.75, "learning_rate": 0.0003175851545925308, "loss": 2.1288, "step": 27793 }, { "epoch": 0.75, "learning_rate": 0.00031752153456460767, "loss": 2.5729, "step": 27794 }, { "epoch": 0.75, "learning_rate": 0.0003174579197070193, "loss": 2.486, "step": 27795 }, { "epoch": 0.75, "learning_rate": 0.0003173943100202477, "loss": 2.6698, "step": 27796 }, { "epoch": 0.75, "learning_rate": 0.0003173307055047748, "loss": 2.2321, "step": 27797 }, { "epoch": 0.75, "learning_rate": 0.0003172671061610828, "loss": 2.5077, "step": 27798 }, { "epoch": 0.75, "learning_rate": 0.00031720351198965283, "loss": 2.6273, "step": 27799 }, { "epoch": 0.75, "learning_rate": 0.00031713992299096683, "loss": 2.5579, "step": 27800 }, { "epoch": 0.75, "learning_rate": 0.00031707633916550716, "loss": 2.0398, "step": 27801 }, { "epoch": 0.75, "learning_rate": 0.0003170127605137544, "loss": 2.9003, "step": 27802 }, { "epoch": 0.75, "learning_rate": 0.00031694918703619135, "loss": 2.1359, "step": 27803 }, { "epoch": 0.75, "learning_rate": 0.000316885618733299, "loss": 2.7092, "step": 27804 }, { "epoch": 0.75, "learning_rate": 0.00031682205560555897, "loss": 2.4462, "step": 27805 }, { "epoch": 0.75, "learning_rate": 0.0003167584976534532, "loss": 2.5433, "step": 27806 }, { "epoch": 0.75, "learning_rate": 0.00031669494487746264, "loss": 2.6858, "step": 27807 }, { "epoch": 0.75, "learning_rate": 0.0003166313972780691, "loss": 2.685, "step": 27808 }, { "epoch": 0.75, "learning_rate": 0.0003165678548557538, "loss": 2.9708, "step": 27809 }, { "epoch": 0.75, "learning_rate": 0.00031650431761099827, "loss": 2.3976, "step": 27810 }, { "epoch": 0.75, "learning_rate": 0.0003164407855442841, "loss": 2.4921, "step": 27811 }, { "epoch": 0.75, "learning_rate": 0.0003163772586560921, "loss": 2.4151, "step": 27812 }, { "epoch": 0.75, "learning_rate": 0.0003163137369469038, "loss": 2.6598, "step": 27813 }, { "epoch": 0.75, "learning_rate": 0.0003162502204172006, "loss": 2.4634, "step": 27814 }, { "epoch": 0.75, "learning_rate": 0.00031618670906746293, "loss": 2.6133, "step": 27815 }, { "epoch": 0.75, "learning_rate": 0.00031612320289817273, "loss": 2.4969, "step": 27816 }, { "epoch": 0.75, "learning_rate": 0.00031605970190981124, "loss": 2.6422, "step": 27817 }, { "epoch": 0.75, "learning_rate": 0.00031599620610285893, "loss": 2.458, "step": 27818 }, { "epoch": 0.75, "learning_rate": 0.00031593271547779734, "loss": 2.5211, "step": 27819 }, { "epoch": 0.75, "learning_rate": 0.00031586923003510694, "loss": 3.0218, "step": 27820 }, { "epoch": 0.75, "learning_rate": 0.0003158057497752688, "loss": 2.3294, "step": 27821 }, { "epoch": 0.75, "learning_rate": 0.00031574227469876405, "loss": 2.7125, "step": 27822 }, { "epoch": 0.75, "learning_rate": 0.00031567880480607346, "loss": 2.8924, "step": 27823 }, { "epoch": 0.75, "learning_rate": 0.000315615340097678, "loss": 1.9223, "step": 27824 }, { "epoch": 0.75, "learning_rate": 0.0003155518805740586, "loss": 2.4361, "step": 27825 }, { "epoch": 0.75, "learning_rate": 0.0003154884262356955, "loss": 2.3832, "step": 27826 }, { "epoch": 0.75, "learning_rate": 0.00031542497708306996, "loss": 2.3834, "step": 27827 }, { "epoch": 0.75, "learning_rate": 0.0003153615331166618, "loss": 2.4579, "step": 27828 }, { "epoch": 0.75, "learning_rate": 0.0003152980943369527, "loss": 2.681, "step": 27829 }, { "epoch": 0.75, "learning_rate": 0.000315234660744423, "loss": 2.3905, "step": 27830 }, { "epoch": 0.75, "learning_rate": 0.0003151712323395528, "loss": 2.9131, "step": 27831 }, { "epoch": 0.75, "learning_rate": 0.0003151078091228229, "loss": 2.1267, "step": 27832 }, { "epoch": 0.75, "learning_rate": 0.00031504439109471407, "loss": 2.2993, "step": 27833 }, { "epoch": 0.75, "learning_rate": 0.0003149809782557063, "loss": 2.4137, "step": 27834 }, { "epoch": 0.75, "learning_rate": 0.00031491757060628, "loss": 2.7546, "step": 27835 }, { "epoch": 0.75, "learning_rate": 0.0003148541681469158, "loss": 2.3844, "step": 27836 }, { "epoch": 0.75, "learning_rate": 0.00031479077087809396, "loss": 2.9274, "step": 27837 }, { "epoch": 0.75, "learning_rate": 0.000314727378800295, "loss": 1.9828, "step": 27838 }, { "epoch": 0.75, "learning_rate": 0.00031466399191399855, "loss": 2.6322, "step": 27839 }, { "epoch": 0.75, "learning_rate": 0.0003146006102196852, "loss": 2.4173, "step": 27840 }, { "epoch": 0.75, "learning_rate": 0.00031453723371783506, "loss": 2.322, "step": 27841 }, { "epoch": 0.75, "learning_rate": 0.0003144738624089284, "loss": 2.4988, "step": 27842 }, { "epoch": 0.75, "learning_rate": 0.0003144104962934451, "loss": 2.373, "step": 27843 }, { "epoch": 0.75, "learning_rate": 0.00031434713537186566, "loss": 2.7049, "step": 27844 }, { "epoch": 0.75, "learning_rate": 0.00031428377964466935, "loss": 2.3675, "step": 27845 }, { "epoch": 0.75, "learning_rate": 0.00031422042911233696, "loss": 2.0503, "step": 27846 }, { "epoch": 0.75, "learning_rate": 0.0003141570837753476, "loss": 2.4809, "step": 27847 }, { "epoch": 0.75, "learning_rate": 0.0003140937436341816, "loss": 2.3507, "step": 27848 }, { "epoch": 0.75, "learning_rate": 0.00031403040868931874, "loss": 2.6411, "step": 27849 }, { "epoch": 0.75, "learning_rate": 0.00031396707894123887, "loss": 2.1264, "step": 27850 }, { "epoch": 0.75, "learning_rate": 0.00031390375439042175, "loss": 2.3947, "step": 27851 }, { "epoch": 0.75, "learning_rate": 0.00031384043503734747, "loss": 2.478, "step": 27852 }, { "epoch": 0.75, "learning_rate": 0.0003137771208824951, "loss": 2.4746, "step": 27853 }, { "epoch": 0.75, "learning_rate": 0.00031371381192634454, "loss": 2.6029, "step": 27854 }, { "epoch": 0.75, "learning_rate": 0.00031365050816937535, "loss": 3.0393, "step": 27855 }, { "epoch": 0.75, "learning_rate": 0.00031358720961206733, "loss": 2.4582, "step": 27856 }, { "epoch": 0.75, "learning_rate": 0.0003135239162549002, "loss": 2.4001, "step": 27857 }, { "epoch": 0.75, "learning_rate": 0.00031346062809835273, "loss": 2.7061, "step": 27858 }, { "epoch": 0.75, "learning_rate": 0.00031339734514290485, "loss": 2.5986, "step": 27859 }, { "epoch": 0.75, "learning_rate": 0.00031333406738903626, "loss": 2.3953, "step": 27860 }, { "epoch": 0.75, "learning_rate": 0.00031327079483722543, "loss": 2.9576, "step": 27861 }, { "epoch": 0.75, "learning_rate": 0.00031320752748795276, "loss": 2.5207, "step": 27862 }, { "epoch": 0.75, "learning_rate": 0.0003131442653416969, "loss": 2.4279, "step": 27863 }, { "epoch": 0.75, "learning_rate": 0.00031308100839893725, "loss": 2.5161, "step": 27864 }, { "epoch": 0.75, "learning_rate": 0.00031301775666015344, "loss": 2.38, "step": 27865 }, { "epoch": 0.75, "learning_rate": 0.00031295451012582385, "loss": 2.5685, "step": 27866 }, { "epoch": 0.75, "learning_rate": 0.00031289126879642813, "loss": 2.5312, "step": 27867 }, { "epoch": 0.75, "learning_rate": 0.0003128280326724453, "loss": 2.3485, "step": 27868 }, { "epoch": 0.75, "learning_rate": 0.0003127648017543545, "loss": 2.5826, "step": 27869 }, { "epoch": 0.75, "learning_rate": 0.00031270157604263495, "loss": 2.7893, "step": 27870 }, { "epoch": 0.75, "learning_rate": 0.0003126383555377651, "loss": 2.7612, "step": 27871 }, { "epoch": 0.75, "learning_rate": 0.00031257514024022416, "loss": 2.3185, "step": 27872 }, { "epoch": 0.75, "learning_rate": 0.0003125119301504914, "loss": 2.153, "step": 27873 }, { "epoch": 0.75, "learning_rate": 0.00031244872526904464, "loss": 1.8926, "step": 27874 }, { "epoch": 0.75, "learning_rate": 0.0003123855255963638, "loss": 2.039, "step": 27875 }, { "epoch": 0.75, "learning_rate": 0.0003123223311329275, "loss": 2.2009, "step": 27876 }, { "epoch": 0.75, "learning_rate": 0.0003122591418792141, "loss": 2.2426, "step": 27877 }, { "epoch": 0.75, "learning_rate": 0.00031219595783570244, "loss": 2.2469, "step": 27878 }, { "epoch": 0.75, "learning_rate": 0.0003121327790028715, "loss": 2.1602, "step": 27879 }, { "epoch": 0.75, "learning_rate": 0.0003120696053811993, "loss": 2.7203, "step": 27880 }, { "epoch": 0.75, "learning_rate": 0.0003120064369711648, "loss": 2.3574, "step": 27881 }, { "epoch": 0.75, "learning_rate": 0.0003119432737732466, "loss": 2.6951, "step": 27882 }, { "epoch": 0.75, "learning_rate": 0.0003118801157879232, "loss": 2.4972, "step": 27883 }, { "epoch": 0.75, "learning_rate": 0.0003118169630156732, "loss": 2.783, "step": 27884 }, { "epoch": 0.75, "learning_rate": 0.0003117538154569746, "loss": 2.5132, "step": 27885 }, { "epoch": 0.75, "learning_rate": 0.000311690673112306, "loss": 2.6811, "step": 27886 }, { "epoch": 0.75, "learning_rate": 0.0003116275359821459, "loss": 2.0769, "step": 27887 }, { "epoch": 0.75, "learning_rate": 0.0003115644040669724, "loss": 2.4716, "step": 27888 }, { "epoch": 0.75, "learning_rate": 0.0003115012773672643, "loss": 2.3219, "step": 27889 }, { "epoch": 0.75, "learning_rate": 0.0003114381558834991, "loss": 2.2066, "step": 27890 }, { "epoch": 0.75, "learning_rate": 0.0003113750396161552, "loss": 2.7268, "step": 27891 }, { "epoch": 0.75, "learning_rate": 0.00031131192856571134, "loss": 2.7354, "step": 27892 }, { "epoch": 0.75, "learning_rate": 0.0003112488227326449, "loss": 2.8241, "step": 27893 }, { "epoch": 0.75, "learning_rate": 0.0003111857221174341, "loss": 2.568, "step": 27894 }, { "epoch": 0.75, "learning_rate": 0.0003111226267205572, "loss": 2.4033, "step": 27895 }, { "epoch": 0.75, "learning_rate": 0.0003110595365424922, "loss": 2.6183, "step": 27896 }, { "epoch": 0.75, "learning_rate": 0.00031099645158371716, "loss": 2.3395, "step": 27897 }, { "epoch": 0.75, "learning_rate": 0.0003109333718447096, "loss": 2.1666, "step": 27898 }, { "epoch": 0.75, "learning_rate": 0.00031087029732594754, "loss": 2.1357, "step": 27899 }, { "epoch": 0.75, "learning_rate": 0.00031080722802790897, "loss": 2.5838, "step": 27900 }, { "epoch": 0.75, "learning_rate": 0.00031074416395107153, "loss": 2.6858, "step": 27901 }, { "epoch": 0.75, "learning_rate": 0.0003106811050959132, "loss": 2.3973, "step": 27902 }, { "epoch": 0.75, "learning_rate": 0.00031061805146291176, "loss": 2.6427, "step": 27903 }, { "epoch": 0.75, "learning_rate": 0.00031055500305254456, "loss": 2.4415, "step": 27904 }, { "epoch": 0.75, "learning_rate": 0.00031049195986528955, "loss": 2.5475, "step": 27905 }, { "epoch": 0.75, "learning_rate": 0.00031042892190162396, "loss": 2.4542, "step": 27906 }, { "epoch": 0.75, "learning_rate": 0.0003103658891620256, "loss": 2.5627, "step": 27907 }, { "epoch": 0.75, "learning_rate": 0.00031030286164697186, "loss": 2.555, "step": 27908 }, { "epoch": 0.75, "learning_rate": 0.0003102398393569404, "loss": 2.393, "step": 27909 }, { "epoch": 0.75, "learning_rate": 0.0003101768222924086, "loss": 2.5227, "step": 27910 }, { "epoch": 0.75, "learning_rate": 0.00031011381045385425, "loss": 2.7006, "step": 27911 }, { "epoch": 0.75, "learning_rate": 0.0003100508038417539, "loss": 2.3017, "step": 27912 }, { "epoch": 0.75, "learning_rate": 0.0003099878024565853, "loss": 2.526, "step": 27913 }, { "epoch": 0.75, "learning_rate": 0.0003099248062988258, "loss": 2.3404, "step": 27914 }, { "epoch": 0.75, "learning_rate": 0.0003098618153689526, "loss": 2.154, "step": 27915 }, { "epoch": 0.75, "learning_rate": 0.0003097988296674432, "loss": 2.454, "step": 27916 }, { "epoch": 0.75, "learning_rate": 0.0003097358491947743, "loss": 2.8156, "step": 27917 }, { "epoch": 0.75, "learning_rate": 0.000309672873951423, "loss": 2.5829, "step": 27918 }, { "epoch": 0.75, "learning_rate": 0.0003096099039378669, "loss": 2.1797, "step": 27919 }, { "epoch": 0.75, "learning_rate": 0.00030954693915458256, "loss": 2.2275, "step": 27920 }, { "epoch": 0.75, "learning_rate": 0.00030948397960204677, "loss": 2.0371, "step": 27921 }, { "epoch": 0.75, "learning_rate": 0.00030942102528073756, "loss": 2.1955, "step": 27922 }, { "epoch": 0.75, "learning_rate": 0.00030935807619113074, "loss": 2.3847, "step": 27923 }, { "epoch": 0.75, "learning_rate": 0.00030929513233370423, "loss": 2.0667, "step": 27924 }, { "epoch": 0.75, "learning_rate": 0.00030923219370893387, "loss": 2.5477, "step": 27925 }, { "epoch": 0.75, "learning_rate": 0.0003091692603172969, "loss": 2.5292, "step": 27926 }, { "epoch": 0.75, "learning_rate": 0.0003091063321592701, "loss": 2.2656, "step": 27927 }, { "epoch": 0.75, "learning_rate": 0.00030904340923533014, "loss": 2.6327, "step": 27928 }, { "epoch": 0.75, "learning_rate": 0.0003089804915459539, "loss": 2.7244, "step": 27929 }, { "epoch": 0.75, "learning_rate": 0.0003089175790916182, "loss": 2.2852, "step": 27930 }, { "epoch": 0.75, "learning_rate": 0.00030885467187279905, "loss": 2.0897, "step": 27931 }, { "epoch": 0.75, "learning_rate": 0.0003087917698899736, "loss": 2.7269, "step": 27932 }, { "epoch": 0.75, "learning_rate": 0.0003087288731436179, "loss": 2.1018, "step": 27933 }, { "epoch": 0.75, "learning_rate": 0.00030866598163420823, "loss": 2.6523, "step": 27934 }, { "epoch": 0.75, "learning_rate": 0.0003086030953622222, "loss": 2.5156, "step": 27935 }, { "epoch": 0.75, "learning_rate": 0.00030854021432813515, "loss": 2.4788, "step": 27936 }, { "epoch": 0.75, "learning_rate": 0.00030847733853242386, "loss": 2.6719, "step": 27937 }, { "epoch": 0.75, "learning_rate": 0.00030841446797556495, "loss": 2.5814, "step": 27938 }, { "epoch": 0.75, "learning_rate": 0.0003083516026580341, "loss": 2.6367, "step": 27939 }, { "epoch": 0.75, "learning_rate": 0.00030828874258030783, "loss": 2.3255, "step": 27940 }, { "epoch": 0.75, "learning_rate": 0.0003082258877428623, "loss": 2.2175, "step": 27941 }, { "epoch": 0.75, "learning_rate": 0.00030816303814617374, "loss": 2.2267, "step": 27942 }, { "epoch": 0.75, "learning_rate": 0.0003081001937907187, "loss": 2.1769, "step": 27943 }, { "epoch": 0.75, "learning_rate": 0.0003080373546769727, "loss": 2.7426, "step": 27944 }, { "epoch": 0.75, "learning_rate": 0.0003079745208054118, "loss": 2.0803, "step": 27945 }, { "epoch": 0.75, "learning_rate": 0.0003079116921765126, "loss": 2.332, "step": 27946 }, { "epoch": 0.75, "learning_rate": 0.00030784886879075, "loss": 2.6711, "step": 27947 }, { "epoch": 0.75, "learning_rate": 0.0003077860506486011, "loss": 2.5455, "step": 27948 }, { "epoch": 0.75, "learning_rate": 0.00030772323775054146, "loss": 2.6508, "step": 27949 }, { "epoch": 0.75, "learning_rate": 0.0003076604300970466, "loss": 2.688, "step": 27950 }, { "epoch": 0.75, "learning_rate": 0.0003075976276885928, "loss": 2.6558, "step": 27951 }, { "epoch": 0.75, "learning_rate": 0.00030753483052565534, "loss": 2.1644, "step": 27952 }, { "epoch": 0.75, "learning_rate": 0.0003074720386087101, "loss": 2.4962, "step": 27953 }, { "epoch": 0.75, "learning_rate": 0.0003074092519382329, "loss": 2.5688, "step": 27954 }, { "epoch": 0.75, "learning_rate": 0.0003073464705146994, "loss": 2.2343, "step": 27955 }, { "epoch": 0.75, "learning_rate": 0.00030728369433858526, "loss": 2.3159, "step": 27956 }, { "epoch": 0.75, "learning_rate": 0.0003072209234103663, "loss": 2.6767, "step": 27957 }, { "epoch": 0.75, "learning_rate": 0.0003071581577305175, "loss": 2.6486, "step": 27958 }, { "epoch": 0.75, "learning_rate": 0.00030709539729951475, "loss": 2.4085, "step": 27959 }, { "epoch": 0.75, "learning_rate": 0.00030703264211783286, "loss": 2.5253, "step": 27960 }, { "epoch": 0.75, "learning_rate": 0.00030696989218594815, "loss": 2.1246, "step": 27961 }, { "epoch": 0.75, "learning_rate": 0.00030690714750433604, "loss": 2.3718, "step": 27962 }, { "epoch": 0.75, "learning_rate": 0.0003068444080734709, "loss": 2.7301, "step": 27963 }, { "epoch": 0.75, "learning_rate": 0.0003067816738938288, "loss": 2.227, "step": 27964 }, { "epoch": 0.75, "learning_rate": 0.00030671894496588504, "loss": 2.4993, "step": 27965 }, { "epoch": 0.75, "learning_rate": 0.00030665622129011426, "loss": 2.6591, "step": 27966 }, { "epoch": 0.75, "learning_rate": 0.00030659350286699205, "loss": 2.3169, "step": 27967 }, { "epoch": 0.75, "learning_rate": 0.00030653078969699357, "loss": 2.5614, "step": 27968 }, { "epoch": 0.75, "learning_rate": 0.0003064680817805937, "loss": 2.4529, "step": 27969 }, { "epoch": 0.75, "learning_rate": 0.000306405379118268, "loss": 2.1778, "step": 27970 }, { "epoch": 0.75, "learning_rate": 0.0003063426817104908, "loss": 2.7823, "step": 27971 }, { "epoch": 0.75, "learning_rate": 0.0003062799895577375, "loss": 2.6676, "step": 27972 }, { "epoch": 0.75, "learning_rate": 0.00030621730266048295, "loss": 2.365, "step": 27973 }, { "epoch": 0.75, "learning_rate": 0.0003061546210192021, "loss": 2.3024, "step": 27974 }, { "epoch": 0.75, "learning_rate": 0.00030609194463437006, "loss": 2.4609, "step": 27975 }, { "epoch": 0.75, "learning_rate": 0.00030602927350646117, "loss": 2.2816, "step": 27976 }, { "epoch": 0.75, "learning_rate": 0.0003059666076359503, "loss": 2.8756, "step": 27977 }, { "epoch": 0.75, "learning_rate": 0.0003059039470233127, "loss": 2.6623, "step": 27978 }, { "epoch": 0.75, "learning_rate": 0.00030584129166902243, "loss": 2.4466, "step": 27979 }, { "epoch": 0.75, "learning_rate": 0.0003057786415735544, "loss": 2.3227, "step": 27980 }, { "epoch": 0.75, "learning_rate": 0.00030571599673738325, "loss": 2.3595, "step": 27981 }, { "epoch": 0.75, "learning_rate": 0.00030565335716098365, "loss": 3.0877, "step": 27982 }, { "epoch": 0.75, "learning_rate": 0.0003055907228448299, "loss": 2.2263, "step": 27983 }, { "epoch": 0.75, "learning_rate": 0.00030552809378939715, "loss": 2.548, "step": 27984 }, { "epoch": 0.75, "learning_rate": 0.0003054654699951591, "loss": 2.5334, "step": 27985 }, { "epoch": 0.75, "learning_rate": 0.0003054028514625904, "loss": 2.1234, "step": 27986 }, { "epoch": 0.75, "learning_rate": 0.0003053402381921656, "loss": 2.5123, "step": 27987 }, { "epoch": 0.75, "learning_rate": 0.00030527763018435897, "loss": 2.5291, "step": 27988 }, { "epoch": 0.75, "learning_rate": 0.000305215027439645, "loss": 2.9177, "step": 27989 }, { "epoch": 0.75, "learning_rate": 0.00030515242995849757, "loss": 2.3426, "step": 27990 }, { "epoch": 0.75, "learning_rate": 0.000305089837741391, "loss": 2.8191, "step": 27991 }, { "epoch": 0.75, "learning_rate": 0.0003050272507888, "loss": 2.3046, "step": 27992 }, { "epoch": 0.75, "learning_rate": 0.0003049646691011979, "loss": 2.9041, "step": 27993 }, { "epoch": 0.75, "learning_rate": 0.0003049020926790592, "loss": 2.5691, "step": 27994 }, { "epoch": 0.75, "learning_rate": 0.0003048395215228581, "loss": 2.722, "step": 27995 }, { "epoch": 0.75, "learning_rate": 0.0003047769556330684, "loss": 2.6308, "step": 27996 }, { "epoch": 0.75, "learning_rate": 0.00030471439501016453, "loss": 2.8396, "step": 27997 }, { "epoch": 0.75, "learning_rate": 0.0003046518396546197, "loss": 2.689, "step": 27998 }, { "epoch": 0.75, "learning_rate": 0.00030458928956690834, "loss": 2.5351, "step": 27999 }, { "epoch": 0.75, "learning_rate": 0.00030452674474750407, "loss": 2.4838, "step": 28000 }, { "epoch": 0.75, "learning_rate": 0.00030446420519688103, "loss": 2.5097, "step": 28001 }, { "epoch": 0.75, "learning_rate": 0.00030440167091551297, "loss": 2.6501, "step": 28002 }, { "epoch": 0.75, "learning_rate": 0.00030433914190387324, "loss": 2.6776, "step": 28003 }, { "epoch": 0.75, "learning_rate": 0.0003042766181624358, "loss": 2.5376, "step": 28004 }, { "epoch": 0.75, "learning_rate": 0.0003042140996916746, "loss": 2.4295, "step": 28005 }, { "epoch": 0.75, "learning_rate": 0.00030415158649206266, "loss": 2.5624, "step": 28006 }, { "epoch": 0.75, "learning_rate": 0.00030408907856407366, "loss": 2.2485, "step": 28007 }, { "epoch": 0.75, "learning_rate": 0.0003040265759081819, "loss": 2.6478, "step": 28008 }, { "epoch": 0.75, "learning_rate": 0.00030396407852486016, "loss": 2.5979, "step": 28009 }, { "epoch": 0.75, "learning_rate": 0.00030390158641458245, "loss": 2.9909, "step": 28010 }, { "epoch": 0.75, "learning_rate": 0.0003038390995778214, "loss": 2.6188, "step": 28011 }, { "epoch": 0.75, "learning_rate": 0.0003037766180150511, "loss": 2.4169, "step": 28012 }, { "epoch": 0.75, "learning_rate": 0.0003037141417267445, "loss": 2.6302, "step": 28013 }, { "epoch": 0.75, "learning_rate": 0.0003036516707133751, "loss": 2.2, "step": 28014 }, { "epoch": 0.75, "learning_rate": 0.0003035892049754162, "loss": 2.7195, "step": 28015 }, { "epoch": 0.75, "learning_rate": 0.00030352674451334115, "loss": 2.3064, "step": 28016 }, { "epoch": 0.75, "learning_rate": 0.0003034642893276228, "loss": 2.722, "step": 28017 }, { "epoch": 0.75, "learning_rate": 0.0003034018394187348, "loss": 2.1666, "step": 28018 }, { "epoch": 0.75, "learning_rate": 0.00030333939478714955, "loss": 2.2117, "step": 28019 }, { "epoch": 0.75, "learning_rate": 0.0003032769554333401, "loss": 2.3211, "step": 28020 }, { "epoch": 0.75, "learning_rate": 0.0003032145213577806, "loss": 2.4359, "step": 28021 }, { "epoch": 0.75, "learning_rate": 0.000303152092560943, "loss": 2.7872, "step": 28022 }, { "epoch": 0.75, "learning_rate": 0.0003030896690433005, "loss": 2.7328, "step": 28023 }, { "epoch": 0.75, "learning_rate": 0.00030302725080532647, "loss": 2.5461, "step": 28024 }, { "epoch": 0.75, "learning_rate": 0.00030296483784749296, "loss": 3.1224, "step": 28025 }, { "epoch": 0.75, "learning_rate": 0.0003029024301702733, "loss": 2.7285, "step": 28026 }, { "epoch": 0.75, "learning_rate": 0.0003028400277741402, "loss": 2.833, "step": 28027 }, { "epoch": 0.75, "learning_rate": 0.0003027776306595664, "loss": 2.4773, "step": 28028 }, { "epoch": 0.75, "learning_rate": 0.0003027152388270249, "loss": 2.6743, "step": 28029 }, { "epoch": 0.75, "learning_rate": 0.0003026528522769878, "loss": 2.7965, "step": 28030 }, { "epoch": 0.75, "learning_rate": 0.0003025904710099281, "loss": 2.185, "step": 28031 }, { "epoch": 0.75, "learning_rate": 0.0003025280950263182, "loss": 2.1334, "step": 28032 }, { "epoch": 0.75, "learning_rate": 0.00030246572432663076, "loss": 2.6068, "step": 28033 }, { "epoch": 0.75, "learning_rate": 0.0003024033589113383, "loss": 2.1067, "step": 28034 }, { "epoch": 0.75, "learning_rate": 0.0003023409987809136, "loss": 2.298, "step": 28035 }, { "epoch": 0.75, "learning_rate": 0.0003022786439358284, "loss": 2.302, "step": 28036 }, { "epoch": 0.75, "learning_rate": 0.00030221629437655585, "loss": 2.1417, "step": 28037 }, { "epoch": 0.75, "learning_rate": 0.0003021539501035675, "loss": 2.1308, "step": 28038 }, { "epoch": 0.75, "learning_rate": 0.0003020916111173361, "loss": 2.4939, "step": 28039 }, { "epoch": 0.75, "learning_rate": 0.00030202927741833385, "loss": 2.7625, "step": 28040 }, { "epoch": 0.75, "learning_rate": 0.00030196694900703314, "loss": 3.1041, "step": 28041 }, { "epoch": 0.75, "learning_rate": 0.0003019046258839059, "loss": 2.6779, "step": 28042 }, { "epoch": 0.75, "learning_rate": 0.0003018423080494247, "loss": 2.7467, "step": 28043 }, { "epoch": 0.75, "learning_rate": 0.0003017799955040611, "loss": 2.7894, "step": 28044 }, { "epoch": 0.75, "learning_rate": 0.0003017176882482875, "loss": 2.459, "step": 28045 }, { "epoch": 0.75, "learning_rate": 0.0003016553862825757, "loss": 2.3047, "step": 28046 }, { "epoch": 0.75, "learning_rate": 0.00030159308960739796, "loss": 2.8191, "step": 28047 }, { "epoch": 0.75, "learning_rate": 0.0003015307982232264, "loss": 2.723, "step": 28048 }, { "epoch": 0.75, "learning_rate": 0.00030146851213053226, "loss": 2.5579, "step": 28049 }, { "epoch": 0.75, "learning_rate": 0.00030140623132978784, "loss": 2.7333, "step": 28050 }, { "epoch": 0.75, "learning_rate": 0.00030134395582146525, "loss": 2.3642, "step": 28051 }, { "epoch": 0.75, "learning_rate": 0.0003012816856060355, "loss": 2.4262, "step": 28052 }, { "epoch": 0.75, "learning_rate": 0.0003012194206839709, "loss": 2.5672, "step": 28053 }, { "epoch": 0.75, "learning_rate": 0.000301157161055743, "loss": 2.3562, "step": 28054 }, { "epoch": 0.75, "learning_rate": 0.0003010949067218235, "loss": 2.6648, "step": 28055 }, { "epoch": 0.75, "learning_rate": 0.0003010326576826844, "loss": 2.7095, "step": 28056 }, { "epoch": 0.75, "learning_rate": 0.00030097041393879656, "loss": 2.6334, "step": 28057 }, { "epoch": 0.75, "learning_rate": 0.00030090817549063186, "loss": 2.0341, "step": 28058 }, { "epoch": 0.75, "learning_rate": 0.0003008459423386619, "loss": 2.341, "step": 28059 }, { "epoch": 0.75, "learning_rate": 0.00030078371448335805, "loss": 2.2877, "step": 28060 }, { "epoch": 0.75, "learning_rate": 0.0003007214919251918, "loss": 2.5493, "step": 28061 }, { "epoch": 0.75, "learning_rate": 0.00030065927466463484, "loss": 2.6, "step": 28062 }, { "epoch": 0.75, "learning_rate": 0.0003005970627021578, "loss": 2.6395, "step": 28063 }, { "epoch": 0.75, "learning_rate": 0.00030053485603823285, "loss": 2.53, "step": 28064 }, { "epoch": 0.75, "learning_rate": 0.0003004726546733303, "loss": 2.2447, "step": 28065 }, { "epoch": 0.75, "learning_rate": 0.0003004104586079215, "loss": 2.6799, "step": 28066 }, { "epoch": 0.75, "learning_rate": 0.0003003482678424787, "loss": 2.3315, "step": 28067 }, { "epoch": 0.75, "learning_rate": 0.000300286082377472, "loss": 2.4484, "step": 28068 }, { "epoch": 0.75, "learning_rate": 0.00030022390221337293, "loss": 2.3287, "step": 28069 }, { "epoch": 0.75, "learning_rate": 0.0003001617273506527, "loss": 2.333, "step": 28070 }, { "epoch": 0.75, "learning_rate": 0.0003000995577897818, "loss": 2.2265, "step": 28071 }, { "epoch": 0.75, "learning_rate": 0.0003000373935312315, "loss": 2.1842, "step": 28072 }, { "epoch": 0.75, "learning_rate": 0.00029997523457547283, "loss": 2.168, "step": 28073 }, { "epoch": 0.75, "learning_rate": 0.00029991308092297656, "loss": 2.6509, "step": 28074 }, { "epoch": 0.75, "learning_rate": 0.00029985093257421403, "loss": 2.6604, "step": 28075 }, { "epoch": 0.75, "learning_rate": 0.00029978878952965525, "loss": 2.6083, "step": 28076 }, { "epoch": 0.75, "learning_rate": 0.00029972665178977146, "loss": 2.5971, "step": 28077 }, { "epoch": 0.75, "learning_rate": 0.0002996645193550337, "loss": 2.7542, "step": 28078 }, { "epoch": 0.75, "learning_rate": 0.0002996023922259116, "loss": 2.6524, "step": 28079 }, { "epoch": 0.75, "learning_rate": 0.0002995402704028772, "loss": 2.4661, "step": 28080 }, { "epoch": 0.75, "learning_rate": 0.0002994781538864003, "loss": 2.5123, "step": 28081 }, { "epoch": 0.75, "learning_rate": 0.00029941604267695154, "loss": 2.5463, "step": 28082 }, { "epoch": 0.75, "learning_rate": 0.000299353936775002, "loss": 2.2438, "step": 28083 }, { "epoch": 0.75, "learning_rate": 0.00029929183618102143, "loss": 2.3575, "step": 28084 }, { "epoch": 0.75, "learning_rate": 0.00029922974089548047, "loss": 2.2611, "step": 28085 }, { "epoch": 0.75, "learning_rate": 0.0002991676509188499, "loss": 2.442, "step": 28086 }, { "epoch": 0.75, "learning_rate": 0.0002991055662515999, "loss": 2.2623, "step": 28087 }, { "epoch": 0.75, "learning_rate": 0.00029904348689420104, "loss": 2.3767, "step": 28088 }, { "epoch": 0.75, "learning_rate": 0.0002989814128471232, "loss": 2.2475, "step": 28089 }, { "epoch": 0.75, "learning_rate": 0.00029891934411083675, "loss": 2.33, "step": 28090 }, { "epoch": 0.75, "learning_rate": 0.0002988572806858123, "loss": 2.206, "step": 28091 }, { "epoch": 0.75, "learning_rate": 0.00029879522257251925, "loss": 2.2389, "step": 28092 }, { "epoch": 0.75, "learning_rate": 0.0002987331697714284, "loss": 2.7778, "step": 28093 }, { "epoch": 0.75, "learning_rate": 0.0002986711222830101, "loss": 2.4958, "step": 28094 }, { "epoch": 0.76, "learning_rate": 0.00029860908010773357, "loss": 2.8166, "step": 28095 }, { "epoch": 0.76, "learning_rate": 0.0002985470432460694, "loss": 1.949, "step": 28096 }, { "epoch": 0.76, "learning_rate": 0.00029848501169848764, "loss": 2.6487, "step": 28097 }, { "epoch": 0.76, "learning_rate": 0.0002984229854654577, "loss": 2.5054, "step": 28098 }, { "epoch": 0.76, "learning_rate": 0.0002983609645474498, "loss": 2.5299, "step": 28099 }, { "epoch": 0.76, "learning_rate": 0.0002982989489449338, "loss": 2.7327, "step": 28100 }, { "epoch": 0.76, "learning_rate": 0.00029823693865837955, "loss": 2.1398, "step": 28101 }, { "epoch": 0.76, "learning_rate": 0.000298174933688257, "loss": 2.5848, "step": 28102 }, { "epoch": 0.76, "learning_rate": 0.00029811293403503547, "loss": 2.5828, "step": 28103 }, { "epoch": 0.76, "learning_rate": 0.00029805093969918474, "loss": 2.7936, "step": 28104 }, { "epoch": 0.76, "learning_rate": 0.0002979889506811747, "loss": 2.3683, "step": 28105 }, { "epoch": 0.76, "learning_rate": 0.0002979269669814748, "loss": 2.655, "step": 28106 }, { "epoch": 0.76, "learning_rate": 0.0002978649886005551, "loss": 2.4085, "step": 28107 }, { "epoch": 0.76, "learning_rate": 0.00029780301553888433, "loss": 2.4521, "step": 28108 }, { "epoch": 0.76, "learning_rate": 0.00029774104779693234, "loss": 2.4052, "step": 28109 }, { "epoch": 0.76, "learning_rate": 0.000297679085375169, "loss": 2.6134, "step": 28110 }, { "epoch": 0.76, "learning_rate": 0.00029761712827406294, "loss": 2.3156, "step": 28111 }, { "epoch": 0.76, "learning_rate": 0.000297555176494084, "loss": 2.3525, "step": 28112 }, { "epoch": 0.76, "learning_rate": 0.0002974932300357015, "loss": 2.2726, "step": 28113 }, { "epoch": 0.76, "learning_rate": 0.00029743128889938463, "loss": 2.832, "step": 28114 }, { "epoch": 0.76, "learning_rate": 0.0002973693530856031, "loss": 2.6447, "step": 28115 }, { "epoch": 0.76, "learning_rate": 0.00029730742259482536, "loss": 2.4449, "step": 28116 }, { "epoch": 0.76, "learning_rate": 0.00029724549742752096, "loss": 2.1222, "step": 28117 }, { "epoch": 0.76, "learning_rate": 0.000297183577584159, "loss": 2.6829, "step": 28118 }, { "epoch": 0.76, "learning_rate": 0.0002971216630652086, "loss": 2.649, "step": 28119 }, { "epoch": 0.76, "learning_rate": 0.0002970597538711388, "loss": 2.4982, "step": 28120 }, { "epoch": 0.76, "learning_rate": 0.00029699785000241905, "loss": 2.1104, "step": 28121 }, { "epoch": 0.76, "learning_rate": 0.0002969359514595176, "loss": 2.4266, "step": 28122 }, { "epoch": 0.76, "learning_rate": 0.0002968740582429039, "loss": 2.8873, "step": 28123 }, { "epoch": 0.76, "learning_rate": 0.0002968121703530463, "loss": 2.6026, "step": 28124 }, { "epoch": 0.76, "learning_rate": 0.00029675028779041403, "loss": 2.8168, "step": 28125 }, { "epoch": 0.76, "learning_rate": 0.00029668841055547593, "loss": 2.1339, "step": 28126 }, { "epoch": 0.76, "learning_rate": 0.0002966265386487006, "loss": 2.2599, "step": 28127 }, { "epoch": 0.76, "learning_rate": 0.00029656467207055684, "loss": 2.1654, "step": 28128 }, { "epoch": 0.76, "learning_rate": 0.00029650281082151364, "loss": 2.2987, "step": 28129 }, { "epoch": 0.76, "learning_rate": 0.00029644095490203914, "loss": 2.8983, "step": 28130 }, { "epoch": 0.76, "learning_rate": 0.00029637910431260217, "loss": 2.6841, "step": 28131 }, { "epoch": 0.76, "learning_rate": 0.00029631725905367135, "loss": 2.5389, "step": 28132 }, { "epoch": 0.76, "learning_rate": 0.0002962554191257151, "loss": 2.4051, "step": 28133 }, { "epoch": 0.76, "learning_rate": 0.0002961935845292023, "loss": 2.3908, "step": 28134 }, { "epoch": 0.76, "learning_rate": 0.0002961317552646008, "loss": 2.7282, "step": 28135 }, { "epoch": 0.76, "learning_rate": 0.00029606993133237926, "loss": 2.4364, "step": 28136 }, { "epoch": 0.76, "learning_rate": 0.0002960081127330064, "loss": 2.2462, "step": 28137 }, { "epoch": 0.76, "learning_rate": 0.00029594629946694983, "loss": 2.4, "step": 28138 }, { "epoch": 0.76, "learning_rate": 0.000295884491534678, "loss": 2.6975, "step": 28139 }, { "epoch": 0.76, "learning_rate": 0.00029582268893666, "loss": 2.5919, "step": 28140 }, { "epoch": 0.76, "learning_rate": 0.0002957608916733631, "loss": 2.6267, "step": 28141 }, { "epoch": 0.76, "learning_rate": 0.000295699099745256, "loss": 2.7476, "step": 28142 }, { "epoch": 0.76, "learning_rate": 0.0002956373131528064, "loss": 2.4851, "step": 28143 }, { "epoch": 0.76, "learning_rate": 0.00029557553189648244, "loss": 2.4627, "step": 28144 }, { "epoch": 0.76, "learning_rate": 0.00029551375597675246, "loss": 3.0665, "step": 28145 }, { "epoch": 0.76, "learning_rate": 0.00029545198539408427, "loss": 2.4712, "step": 28146 }, { "epoch": 0.76, "learning_rate": 0.0002953902201489459, "loss": 2.2763, "step": 28147 }, { "epoch": 0.76, "learning_rate": 0.00029532846024180547, "loss": 2.0961, "step": 28148 }, { "epoch": 0.76, "learning_rate": 0.0002952667056731304, "loss": 3.0535, "step": 28149 }, { "epoch": 0.76, "learning_rate": 0.0002952049564433891, "loss": 2.3212, "step": 28150 }, { "epoch": 0.76, "learning_rate": 0.00029514321255304866, "loss": 2.3255, "step": 28151 }, { "epoch": 0.76, "learning_rate": 0.00029508147400257703, "loss": 2.6861, "step": 28152 }, { "epoch": 0.76, "learning_rate": 0.0002950197407924426, "loss": 2.6557, "step": 28153 }, { "epoch": 0.76, "learning_rate": 0.0002949580129231124, "loss": 2.4687, "step": 28154 }, { "epoch": 0.76, "learning_rate": 0.00029489629039505414, "loss": 2.3721, "step": 28155 }, { "epoch": 0.76, "learning_rate": 0.00029483457320873596, "loss": 2.5835, "step": 28156 }, { "epoch": 0.76, "learning_rate": 0.00029477286136462454, "loss": 2.5699, "step": 28157 }, { "epoch": 0.76, "learning_rate": 0.0002947111548631879, "loss": 1.9551, "step": 28158 }, { "epoch": 0.76, "learning_rate": 0.0002946494537048935, "loss": 2.7014, "step": 28159 }, { "epoch": 0.76, "learning_rate": 0.0002945877578902086, "loss": 2.492, "step": 28160 }, { "epoch": 0.76, "learning_rate": 0.0002945260674196012, "loss": 2.3921, "step": 28161 }, { "epoch": 0.76, "learning_rate": 0.0002944643822935378, "loss": 2.5299, "step": 28162 }, { "epoch": 0.76, "learning_rate": 0.00029440270251248615, "loss": 2.2429, "step": 28163 }, { "epoch": 0.76, "learning_rate": 0.00029434102807691367, "loss": 2.3619, "step": 28164 }, { "epoch": 0.76, "learning_rate": 0.0002942793589872869, "loss": 2.011, "step": 28165 }, { "epoch": 0.76, "learning_rate": 0.00029421769524407405, "loss": 2.4121, "step": 28166 }, { "epoch": 0.76, "learning_rate": 0.0002941560368477415, "loss": 2.3403, "step": 28167 }, { "epoch": 0.76, "learning_rate": 0.0002940943837987566, "loss": 2.383, "step": 28168 }, { "epoch": 0.76, "learning_rate": 0.00029403273609758686, "loss": 2.6298, "step": 28169 }, { "epoch": 0.76, "learning_rate": 0.00029397109374469844, "loss": 2.581, "step": 28170 }, { "epoch": 0.76, "learning_rate": 0.0002939094567405589, "loss": 2.4597, "step": 28171 }, { "epoch": 0.76, "learning_rate": 0.00029384782508563504, "loss": 2.3066, "step": 28172 }, { "epoch": 0.76, "learning_rate": 0.0002937861987803938, "loss": 2.2937, "step": 28173 }, { "epoch": 0.76, "learning_rate": 0.000293724577825302, "loss": 2.7311, "step": 28174 }, { "epoch": 0.76, "learning_rate": 0.00029366296222082687, "loss": 2.1156, "step": 28175 }, { "epoch": 0.76, "learning_rate": 0.00029360135196743463, "loss": 2.4518, "step": 28176 }, { "epoch": 0.76, "learning_rate": 0.0002935397470655925, "loss": 2.254, "step": 28177 }, { "epoch": 0.76, "learning_rate": 0.0002934781475157664, "loss": 2.0241, "step": 28178 }, { "epoch": 0.76, "learning_rate": 0.00029341655331842375, "loss": 2.4121, "step": 28179 }, { "epoch": 0.76, "learning_rate": 0.0002933549644740313, "loss": 2.8619, "step": 28180 }, { "epoch": 0.76, "learning_rate": 0.000293293380983055, "loss": 2.502, "step": 28181 }, { "epoch": 0.76, "learning_rate": 0.0002932318028459617, "loss": 2.6876, "step": 28182 }, { "epoch": 0.76, "learning_rate": 0.0002931702300632182, "loss": 2.1566, "step": 28183 }, { "epoch": 0.76, "learning_rate": 0.0002931086626352905, "loss": 2.5597, "step": 28184 }, { "epoch": 0.76, "learning_rate": 0.00029304710056264496, "loss": 2.556, "step": 28185 }, { "epoch": 0.76, "learning_rate": 0.0002929855438457483, "loss": 2.1669, "step": 28186 }, { "epoch": 0.76, "learning_rate": 0.00029292399248506673, "loss": 2.2627, "step": 28187 }, { "epoch": 0.76, "learning_rate": 0.000292862446481067, "loss": 2.2586, "step": 28188 }, { "epoch": 0.76, "learning_rate": 0.00029280090583421446, "loss": 2.1733, "step": 28189 }, { "epoch": 0.76, "learning_rate": 0.000292739370544976, "loss": 2.7432, "step": 28190 }, { "epoch": 0.76, "learning_rate": 0.0002926778406138175, "loss": 3.1413, "step": 28191 }, { "epoch": 0.76, "learning_rate": 0.0002926163160412053, "loss": 2.2334, "step": 28192 }, { "epoch": 0.76, "learning_rate": 0.0002925547968276057, "loss": 2.252, "step": 28193 }, { "epoch": 0.76, "learning_rate": 0.0002924932829734841, "loss": 2.4696, "step": 28194 }, { "epoch": 0.76, "learning_rate": 0.000292431774479307, "loss": 2.198, "step": 28195 }, { "epoch": 0.76, "learning_rate": 0.0002923702713455406, "loss": 1.9189, "step": 28196 }, { "epoch": 0.76, "learning_rate": 0.0002923087735726501, "loss": 2.703, "step": 28197 }, { "epoch": 0.76, "learning_rate": 0.00029224728116110154, "loss": 2.8907, "step": 28198 }, { "epoch": 0.76, "learning_rate": 0.0002921857941113617, "loss": 2.5189, "step": 28199 }, { "epoch": 0.76, "learning_rate": 0.00029212431242389535, "loss": 2.218, "step": 28200 }, { "epoch": 0.76, "learning_rate": 0.00029206283609916906, "loss": 2.2393, "step": 28201 }, { "epoch": 0.76, "learning_rate": 0.00029200136513764783, "loss": 2.331, "step": 28202 }, { "epoch": 0.76, "learning_rate": 0.0002919398995397976, "loss": 2.8511, "step": 28203 }, { "epoch": 0.76, "learning_rate": 0.00029187843930608416, "loss": 2.7475, "step": 28204 }, { "epoch": 0.76, "learning_rate": 0.00029181698443697305, "loss": 2.481, "step": 28205 }, { "epoch": 0.76, "learning_rate": 0.0002917555349329298, "loss": 2.4961, "step": 28206 }, { "epoch": 0.76, "learning_rate": 0.00029169409079442043, "loss": 2.4893, "step": 28207 }, { "epoch": 0.76, "learning_rate": 0.00029163265202190956, "loss": 2.6599, "step": 28208 }, { "epoch": 0.76, "learning_rate": 0.0002915712186158632, "loss": 2.7531, "step": 28209 }, { "epoch": 0.76, "learning_rate": 0.0002915097905767469, "loss": 2.4765, "step": 28210 }, { "epoch": 0.76, "learning_rate": 0.00029144836790502505, "loss": 2.3706, "step": 28211 }, { "epoch": 0.76, "learning_rate": 0.0002913869506011644, "loss": 2.5135, "step": 28212 }, { "epoch": 0.76, "learning_rate": 0.0002913255386656292, "loss": 1.9863, "step": 28213 }, { "epoch": 0.76, "learning_rate": 0.000291264132098885, "loss": 2.6509, "step": 28214 }, { "epoch": 0.76, "learning_rate": 0.00029120273090139736, "loss": 2.8288, "step": 28215 }, { "epoch": 0.76, "learning_rate": 0.0002911413350736308, "loss": 2.2217, "step": 28216 }, { "epoch": 0.76, "learning_rate": 0.0002910799446160507, "loss": 2.099, "step": 28217 }, { "epoch": 0.76, "learning_rate": 0.00029101855952912224, "loss": 2.6564, "step": 28218 }, { "epoch": 0.76, "learning_rate": 0.0002909571798133104, "loss": 2.6755, "step": 28219 }, { "epoch": 0.76, "learning_rate": 0.00029089580546908054, "loss": 2.1782, "step": 28220 }, { "epoch": 0.76, "learning_rate": 0.000290834436496897, "loss": 3.1204, "step": 28221 }, { "epoch": 0.76, "learning_rate": 0.00029077307289722485, "loss": 2.2169, "step": 28222 }, { "epoch": 0.76, "learning_rate": 0.0002907117146705296, "loss": 2.3856, "step": 28223 }, { "epoch": 0.76, "learning_rate": 0.00029065036181727475, "loss": 2.7865, "step": 28224 }, { "epoch": 0.76, "learning_rate": 0.0002905890143379264, "loss": 2.2576, "step": 28225 }, { "epoch": 0.76, "learning_rate": 0.00029052767223294916, "loss": 2.3258, "step": 28226 }, { "epoch": 0.76, "learning_rate": 0.0002904663355028071, "loss": 2.4686, "step": 28227 }, { "epoch": 0.76, "learning_rate": 0.00029040500414796554, "loss": 2.6163, "step": 28228 }, { "epoch": 0.76, "learning_rate": 0.00029034367816888854, "loss": 2.7227, "step": 28229 }, { "epoch": 0.76, "learning_rate": 0.00029028235756604085, "loss": 2.6221, "step": 28230 }, { "epoch": 0.76, "learning_rate": 0.0002902210423398872, "loss": 2.5792, "step": 28231 }, { "epoch": 0.76, "learning_rate": 0.000290159732490892, "loss": 2.6445, "step": 28232 }, { "epoch": 0.76, "learning_rate": 0.0002900984280195198, "loss": 2.449, "step": 28233 }, { "epoch": 0.76, "learning_rate": 0.00029003712892623524, "loss": 2.0916, "step": 28234 }, { "epoch": 0.76, "learning_rate": 0.00028997583521150216, "loss": 2.5156, "step": 28235 }, { "epoch": 0.76, "learning_rate": 0.00028991454687578554, "loss": 2.654, "step": 28236 }, { "epoch": 0.76, "learning_rate": 0.00028985326391954883, "loss": 2.5243, "step": 28237 }, { "epoch": 0.76, "learning_rate": 0.0002897919863432571, "loss": 2.2182, "step": 28238 }, { "epoch": 0.76, "learning_rate": 0.0002897307141473745, "loss": 2.4449, "step": 28239 }, { "epoch": 0.76, "learning_rate": 0.0002896694473323649, "loss": 2.3111, "step": 28240 }, { "epoch": 0.76, "learning_rate": 0.00028960818589869245, "loss": 2.4821, "step": 28241 }, { "epoch": 0.76, "learning_rate": 0.00028954692984682173, "loss": 2.511, "step": 28242 }, { "epoch": 0.76, "learning_rate": 0.0002894856791772161, "loss": 2.3182, "step": 28243 }, { "epoch": 0.76, "learning_rate": 0.0002894244338903399, "loss": 2.1376, "step": 28244 }, { "epoch": 0.76, "learning_rate": 0.00028936319398665725, "loss": 2.2899, "step": 28245 }, { "epoch": 0.76, "learning_rate": 0.00028930195946663196, "loss": 2.9165, "step": 28246 }, { "epoch": 0.76, "learning_rate": 0.0002892407303307283, "loss": 2.3687, "step": 28247 }, { "epoch": 0.76, "learning_rate": 0.00028917950657940937, "loss": 2.4295, "step": 28248 }, { "epoch": 0.76, "learning_rate": 0.00028911828821313954, "loss": 2.7488, "step": 28249 }, { "epoch": 0.76, "learning_rate": 0.00028905707523238245, "loss": 2.4066, "step": 28250 }, { "epoch": 0.76, "learning_rate": 0.00028899586763760175, "loss": 2.3705, "step": 28251 }, { "epoch": 0.76, "learning_rate": 0.0002889346654292614, "loss": 2.6212, "step": 28252 }, { "epoch": 0.76, "learning_rate": 0.00028887346860782505, "loss": 2.4336, "step": 28253 }, { "epoch": 0.76, "learning_rate": 0.0002888122771737559, "loss": 2.005, "step": 28254 }, { "epoch": 0.76, "learning_rate": 0.0002887510911275182, "loss": 2.3339, "step": 28255 }, { "epoch": 0.76, "learning_rate": 0.0002886899104695747, "loss": 2.3027, "step": 28256 }, { "epoch": 0.76, "learning_rate": 0.00028862873520038926, "loss": 2.7637, "step": 28257 }, { "epoch": 0.76, "learning_rate": 0.0002885675653204253, "loss": 2.4486, "step": 28258 }, { "epoch": 0.76, "learning_rate": 0.00028850640083014637, "loss": 2.6157, "step": 28259 }, { "epoch": 0.76, "learning_rate": 0.00028844524173001564, "loss": 2.5563, "step": 28260 }, { "epoch": 0.76, "learning_rate": 0.00028838408802049685, "loss": 2.6812, "step": 28261 }, { "epoch": 0.76, "learning_rate": 0.0002883229397020528, "loss": 2.5103, "step": 28262 }, { "epoch": 0.76, "learning_rate": 0.00028826179677514683, "loss": 2.3585, "step": 28263 }, { "epoch": 0.76, "learning_rate": 0.0002882006592402423, "loss": 2.1871, "step": 28264 }, { "epoch": 0.76, "learning_rate": 0.00028813952709780223, "loss": 2.6718, "step": 28265 }, { "epoch": 0.76, "learning_rate": 0.00028807840034829026, "loss": 2.6597, "step": 28266 }, { "epoch": 0.76, "learning_rate": 0.00028801727899216867, "loss": 2.397, "step": 28267 }, { "epoch": 0.76, "learning_rate": 0.0002879561630299008, "loss": 2.4494, "step": 28268 }, { "epoch": 0.76, "learning_rate": 0.00028789505246195013, "loss": 2.2817, "step": 28269 }, { "epoch": 0.76, "learning_rate": 0.000287833947288779, "loss": 2.8488, "step": 28270 }, { "epoch": 0.76, "learning_rate": 0.00028777284751085045, "loss": 2.1252, "step": 28271 }, { "epoch": 0.76, "learning_rate": 0.0002877117531286275, "loss": 2.4466, "step": 28272 }, { "epoch": 0.76, "learning_rate": 0.000287650664142573, "loss": 2.6037, "step": 28273 }, { "epoch": 0.76, "learning_rate": 0.00028758958055315, "loss": 2.7554, "step": 28274 }, { "epoch": 0.76, "learning_rate": 0.00028752850236082064, "loss": 2.7094, "step": 28275 }, { "epoch": 0.76, "learning_rate": 0.000287467429566048, "loss": 2.5051, "step": 28276 }, { "epoch": 0.76, "learning_rate": 0.0002874063621692947, "loss": 2.1271, "step": 28277 }, { "epoch": 0.76, "learning_rate": 0.00028734530017102334, "loss": 2.7109, "step": 28278 }, { "epoch": 0.76, "learning_rate": 0.000287284243571697, "loss": 2.4461, "step": 28279 }, { "epoch": 0.76, "learning_rate": 0.0002872231923717774, "loss": 2.4027, "step": 28280 }, { "epoch": 0.76, "learning_rate": 0.00028716214657172756, "loss": 2.7338, "step": 28281 }, { "epoch": 0.76, "learning_rate": 0.00028710110617201015, "loss": 2.5331, "step": 28282 }, { "epoch": 0.76, "learning_rate": 0.00028704007117308697, "loss": 2.4208, "step": 28283 }, { "epoch": 0.76, "learning_rate": 0.00028697904157542044, "loss": 2.4992, "step": 28284 }, { "epoch": 0.76, "learning_rate": 0.0002869180173794738, "loss": 2.5201, "step": 28285 }, { "epoch": 0.76, "learning_rate": 0.00028685699858570847, "loss": 2.2597, "step": 28286 }, { "epoch": 0.76, "learning_rate": 0.00028679598519458705, "loss": 2.476, "step": 28287 }, { "epoch": 0.76, "learning_rate": 0.00028673497720657203, "loss": 2.6506, "step": 28288 }, { "epoch": 0.76, "learning_rate": 0.00028667397462212496, "loss": 2.4899, "step": 28289 }, { "epoch": 0.76, "learning_rate": 0.00028661297744170835, "loss": 2.4469, "step": 28290 }, { "epoch": 0.76, "learning_rate": 0.00028655198566578436, "loss": 2.0305, "step": 28291 }, { "epoch": 0.76, "learning_rate": 0.00028649099929481495, "loss": 2.5238, "step": 28292 }, { "epoch": 0.76, "learning_rate": 0.00028643001832926243, "loss": 2.4292, "step": 28293 }, { "epoch": 0.76, "learning_rate": 0.0002863690427695882, "loss": 2.8245, "step": 28294 }, { "epoch": 0.76, "learning_rate": 0.00028630807261625446, "loss": 2.7897, "step": 28295 }, { "epoch": 0.76, "learning_rate": 0.0002862471078697235, "loss": 2.9753, "step": 28296 }, { "epoch": 0.76, "learning_rate": 0.00028618614853045634, "loss": 2.2425, "step": 28297 }, { "epoch": 0.76, "learning_rate": 0.00028612519459891584, "loss": 2.4777, "step": 28298 }, { "epoch": 0.76, "learning_rate": 0.0002860642460755629, "loss": 2.6063, "step": 28299 }, { "epoch": 0.76, "learning_rate": 0.00028600330296085964, "loss": 2.2141, "step": 28300 }, { "epoch": 0.76, "learning_rate": 0.00028594236525526806, "loss": 2.2299, "step": 28301 }, { "epoch": 0.76, "learning_rate": 0.00028588143295924906, "loss": 2.5707, "step": 28302 }, { "epoch": 0.76, "learning_rate": 0.0002858205060732647, "loss": 2.2985, "step": 28303 }, { "epoch": 0.76, "learning_rate": 0.0002857595845977765, "loss": 2.1999, "step": 28304 }, { "epoch": 0.76, "learning_rate": 0.000285698668533246, "loss": 2.6406, "step": 28305 }, { "epoch": 0.76, "learning_rate": 0.0002856377578801349, "loss": 2.6068, "step": 28306 }, { "epoch": 0.76, "learning_rate": 0.0002855768526389042, "loss": 2.5701, "step": 28307 }, { "epoch": 0.76, "learning_rate": 0.00028551595281001553, "loss": 2.4186, "step": 28308 }, { "epoch": 0.76, "learning_rate": 0.0002854550583939306, "loss": 2.1827, "step": 28309 }, { "epoch": 0.76, "learning_rate": 0.0002853941693911097, "loss": 1.8308, "step": 28310 }, { "epoch": 0.76, "learning_rate": 0.0002853332858020152, "loss": 2.8142, "step": 28311 }, { "epoch": 0.76, "learning_rate": 0.00028527240762710827, "loss": 1.9524, "step": 28312 }, { "epoch": 0.76, "learning_rate": 0.0002852115348668495, "loss": 2.5011, "step": 28313 }, { "epoch": 0.76, "learning_rate": 0.0002851506675217006, "loss": 2.7839, "step": 28314 }, { "epoch": 0.76, "learning_rate": 0.0002850898055921222, "loss": 2.5744, "step": 28315 }, { "epoch": 0.76, "learning_rate": 0.00028502894907857544, "loss": 2.9365, "step": 28316 }, { "epoch": 0.76, "learning_rate": 0.0002849680979815217, "loss": 2.8947, "step": 28317 }, { "epoch": 0.76, "learning_rate": 0.00028490725230142177, "loss": 2.6377, "step": 28318 }, { "epoch": 0.76, "learning_rate": 0.00028484641203873674, "loss": 2.2838, "step": 28319 }, { "epoch": 0.76, "learning_rate": 0.0002847855771939276, "loss": 2.656, "step": 28320 }, { "epoch": 0.76, "learning_rate": 0.0002847247477674548, "loss": 2.6767, "step": 28321 }, { "epoch": 0.76, "learning_rate": 0.00028466392375977944, "loss": 2.0257, "step": 28322 }, { "epoch": 0.76, "learning_rate": 0.00028460310517136237, "loss": 2.7456, "step": 28323 }, { "epoch": 0.76, "learning_rate": 0.0002845422920026642, "loss": 1.8069, "step": 28324 }, { "epoch": 0.76, "learning_rate": 0.000284481484254146, "loss": 2.2687, "step": 28325 }, { "epoch": 0.76, "learning_rate": 0.0002844206819262679, "loss": 2.4244, "step": 28326 }, { "epoch": 0.76, "learning_rate": 0.0002843598850194907, "loss": 2.6958, "step": 28327 }, { "epoch": 0.76, "learning_rate": 0.0002842990935342755, "loss": 2.7511, "step": 28328 }, { "epoch": 0.76, "learning_rate": 0.00028423830747108204, "loss": 2.6493, "step": 28329 }, { "epoch": 0.76, "learning_rate": 0.00028417752683037125, "loss": 2.5716, "step": 28330 }, { "epoch": 0.76, "learning_rate": 0.00028411675161260343, "loss": 2.1529, "step": 28331 }, { "epoch": 0.76, "learning_rate": 0.0002840559818182392, "loss": 2.0163, "step": 28332 }, { "epoch": 0.76, "learning_rate": 0.00028399521744773917, "loss": 2.0627, "step": 28333 }, { "epoch": 0.76, "learning_rate": 0.00028393445850156295, "loss": 2.3197, "step": 28334 }, { "epoch": 0.76, "learning_rate": 0.00028387370498017127, "loss": 2.141, "step": 28335 }, { "epoch": 0.76, "learning_rate": 0.0002838129568840244, "loss": 2.3372, "step": 28336 }, { "epoch": 0.76, "learning_rate": 0.00028375221421358254, "loss": 2.4861, "step": 28337 }, { "epoch": 0.76, "learning_rate": 0.0002836914769693059, "loss": 2.2078, "step": 28338 }, { "epoch": 0.76, "learning_rate": 0.0002836307451516549, "loss": 2.4118, "step": 28339 }, { "epoch": 0.76, "learning_rate": 0.0002835700187610889, "loss": 2.368, "step": 28340 }, { "epoch": 0.76, "learning_rate": 0.0002835092977980687, "loss": 2.4795, "step": 28341 }, { "epoch": 0.76, "learning_rate": 0.0002834485822630536, "loss": 2.0793, "step": 28342 }, { "epoch": 0.76, "learning_rate": 0.000283387872156504, "loss": 2.6806, "step": 28343 }, { "epoch": 0.76, "learning_rate": 0.00028332716747887966, "loss": 2.7984, "step": 28344 }, { "epoch": 0.76, "learning_rate": 0.00028326646823064063, "loss": 2.4669, "step": 28345 }, { "epoch": 0.76, "learning_rate": 0.0002832057744122467, "loss": 2.8623, "step": 28346 }, { "epoch": 0.76, "learning_rate": 0.000283145086024158, "loss": 2.2544, "step": 28347 }, { "epoch": 0.76, "learning_rate": 0.00028308440306683367, "loss": 2.164, "step": 28348 }, { "epoch": 0.76, "learning_rate": 0.00028302372554073375, "loss": 2.385, "step": 28349 }, { "epoch": 0.76, "learning_rate": 0.0002829630534463178, "loss": 2.4884, "step": 28350 }, { "epoch": 0.76, "learning_rate": 0.0002829023867840457, "loss": 2.7769, "step": 28351 }, { "epoch": 0.76, "learning_rate": 0.00028284172555437703, "loss": 2.739, "step": 28352 }, { "epoch": 0.76, "learning_rate": 0.0002827810697577711, "loss": 2.2765, "step": 28353 }, { "epoch": 0.76, "learning_rate": 0.0002827204193946875, "loss": 2.12, "step": 28354 }, { "epoch": 0.76, "learning_rate": 0.000282659774465586, "loss": 2.5002, "step": 28355 }, { "epoch": 0.76, "learning_rate": 0.00028259913497092525, "loss": 2.4642, "step": 28356 }, { "epoch": 0.76, "learning_rate": 0.0002825385009111655, "loss": 2.6323, "step": 28357 }, { "epoch": 0.76, "learning_rate": 0.00028247787228676615, "loss": 2.8016, "step": 28358 }, { "epoch": 0.76, "learning_rate": 0.0002824172490981858, "loss": 2.5667, "step": 28359 }, { "epoch": 0.76, "learning_rate": 0.0002823566313458844, "loss": 2.5626, "step": 28360 }, { "epoch": 0.76, "learning_rate": 0.00028229601903032053, "loss": 2.4971, "step": 28361 }, { "epoch": 0.76, "learning_rate": 0.0002822354121519537, "loss": 2.2501, "step": 28362 }, { "epoch": 0.76, "learning_rate": 0.0002821748107112432, "loss": 2.4981, "step": 28363 }, { "epoch": 0.76, "learning_rate": 0.00028211421470864786, "loss": 2.7899, "step": 28364 }, { "epoch": 0.76, "learning_rate": 0.00028205362414462687, "loss": 2.5047, "step": 28365 }, { "epoch": 0.76, "learning_rate": 0.0002819930390196396, "loss": 2.5397, "step": 28366 }, { "epoch": 0.76, "learning_rate": 0.0002819324593341445, "loss": 2.4965, "step": 28367 }, { "epoch": 0.76, "learning_rate": 0.0002818718850886008, "loss": 2.5408, "step": 28368 }, { "epoch": 0.76, "learning_rate": 0.0002818113162834669, "loss": 2.4957, "step": 28369 }, { "epoch": 0.76, "learning_rate": 0.0002817507529192023, "loss": 2.5604, "step": 28370 }, { "epoch": 0.76, "learning_rate": 0.0002816901949962658, "loss": 2.6147, "step": 28371 }, { "epoch": 0.76, "learning_rate": 0.0002816296425151158, "loss": 2.6712, "step": 28372 }, { "epoch": 0.76, "learning_rate": 0.0002815690954762111, "loss": 2.7836, "step": 28373 }, { "epoch": 0.76, "learning_rate": 0.00028150855388001084, "loss": 2.6103, "step": 28374 }, { "epoch": 0.76, "learning_rate": 0.00028144801772697305, "loss": 2.546, "step": 28375 }, { "epoch": 0.76, "learning_rate": 0.00028138748701755646, "loss": 2.711, "step": 28376 }, { "epoch": 0.76, "learning_rate": 0.00028132696175221995, "loss": 2.6222, "step": 28377 }, { "epoch": 0.76, "learning_rate": 0.0002812664419314218, "loss": 2.0433, "step": 28378 }, { "epoch": 0.76, "learning_rate": 0.00028120592755562094, "loss": 2.0924, "step": 28379 }, { "epoch": 0.76, "learning_rate": 0.0002811454186252752, "loss": 2.128, "step": 28380 }, { "epoch": 0.76, "learning_rate": 0.0002810849151408432, "loss": 2.3824, "step": 28381 }, { "epoch": 0.76, "learning_rate": 0.00028102441710278335, "loss": 2.6021, "step": 28382 }, { "epoch": 0.76, "learning_rate": 0.00028096392451155397, "loss": 2.1579, "step": 28383 }, { "epoch": 0.76, "learning_rate": 0.0002809034373676137, "loss": 2.49, "step": 28384 }, { "epoch": 0.76, "learning_rate": 0.00028084295567142004, "loss": 2.3406, "step": 28385 }, { "epoch": 0.76, "learning_rate": 0.0002807824794234316, "loss": 2.6105, "step": 28386 }, { "epoch": 0.76, "learning_rate": 0.0002807220086241068, "loss": 2.1646, "step": 28387 }, { "epoch": 0.76, "learning_rate": 0.00028066154327390327, "loss": 2.0914, "step": 28388 }, { "epoch": 0.76, "learning_rate": 0.00028060108337327915, "loss": 2.5405, "step": 28389 }, { "epoch": 0.76, "learning_rate": 0.0002805406289226927, "loss": 2.3182, "step": 28390 }, { "epoch": 0.76, "learning_rate": 0.00028048017992260177, "loss": 2.4156, "step": 28391 }, { "epoch": 0.76, "learning_rate": 0.0002804197363734647, "loss": 2.5409, "step": 28392 }, { "epoch": 0.76, "learning_rate": 0.0002803592982757387, "loss": 2.3391, "step": 28393 }, { "epoch": 0.76, "learning_rate": 0.00028029886562988207, "loss": 2.5955, "step": 28394 }, { "epoch": 0.76, "learning_rate": 0.0002802384384363525, "loss": 2.3894, "step": 28395 }, { "epoch": 0.76, "learning_rate": 0.00028017801669560785, "loss": 2.0833, "step": 28396 }, { "epoch": 0.76, "learning_rate": 0.00028011760040810586, "loss": 2.7598, "step": 28397 }, { "epoch": 0.76, "learning_rate": 0.0002800571895743046, "loss": 2.3424, "step": 28398 }, { "epoch": 0.76, "learning_rate": 0.0002799967841946609, "loss": 2.8207, "step": 28399 }, { "epoch": 0.76, "learning_rate": 0.000279936384269633, "loss": 2.1897, "step": 28400 }, { "epoch": 0.76, "learning_rate": 0.00027987598979967854, "loss": 2.5475, "step": 28401 }, { "epoch": 0.76, "learning_rate": 0.0002798156007852545, "loss": 3.139, "step": 28402 }, { "epoch": 0.76, "learning_rate": 0.00027975521722681875, "loss": 2.7273, "step": 28403 }, { "epoch": 0.76, "learning_rate": 0.00027969483912482874, "loss": 2.6264, "step": 28404 }, { "epoch": 0.76, "learning_rate": 0.0002796344664797418, "loss": 2.4544, "step": 28405 }, { "epoch": 0.76, "learning_rate": 0.00027957409929201573, "loss": 2.4403, "step": 28406 }, { "epoch": 0.76, "learning_rate": 0.0002795137375621071, "loss": 2.2376, "step": 28407 }, { "epoch": 0.76, "learning_rate": 0.00027945338129047357, "loss": 2.282, "step": 28408 }, { "epoch": 0.76, "learning_rate": 0.00027939303047757246, "loss": 2.4314, "step": 28409 }, { "epoch": 0.76, "learning_rate": 0.0002793326851238609, "loss": 2.4629, "step": 28410 }, { "epoch": 0.76, "learning_rate": 0.00027927234522979636, "loss": 2.7228, "step": 28411 }, { "epoch": 0.76, "learning_rate": 0.00027921201079583535, "loss": 2.5894, "step": 28412 }, { "epoch": 0.76, "learning_rate": 0.0002791516818224353, "loss": 2.2781, "step": 28413 }, { "epoch": 0.76, "learning_rate": 0.0002790913583100536, "loss": 2.2262, "step": 28414 }, { "epoch": 0.76, "learning_rate": 0.0002790310402591465, "loss": 2.2811, "step": 28415 }, { "epoch": 0.76, "learning_rate": 0.00027897072767017105, "loss": 2.3424, "step": 28416 }, { "epoch": 0.76, "learning_rate": 0.0002789104205435852, "loss": 2.9356, "step": 28417 }, { "epoch": 0.76, "learning_rate": 0.0002788501188798446, "loss": 2.4133, "step": 28418 }, { "epoch": 0.76, "learning_rate": 0.000278789822679407, "loss": 2.1298, "step": 28419 }, { "epoch": 0.76, "learning_rate": 0.00027872953194272844, "loss": 2.2582, "step": 28420 }, { "epoch": 0.76, "learning_rate": 0.0002786692466702659, "loss": 1.7743, "step": 28421 }, { "epoch": 0.76, "learning_rate": 0.00027860896686247627, "loss": 2.3991, "step": 28422 }, { "epoch": 0.76, "learning_rate": 0.00027854869251981606, "loss": 1.9871, "step": 28423 }, { "epoch": 0.76, "learning_rate": 0.00027848842364274206, "loss": 2.6535, "step": 28424 }, { "epoch": 0.76, "learning_rate": 0.00027842816023171104, "loss": 2.4372, "step": 28425 }, { "epoch": 0.76, "learning_rate": 0.0002783679022871789, "loss": 2.5696, "step": 28426 }, { "epoch": 0.76, "learning_rate": 0.000278307649809603, "loss": 2.8324, "step": 28427 }, { "epoch": 0.76, "learning_rate": 0.00027824740279943884, "loss": 2.259, "step": 28428 }, { "epoch": 0.76, "learning_rate": 0.00027818716125714305, "loss": 2.6137, "step": 28429 }, { "epoch": 0.76, "learning_rate": 0.0002781269251831729, "loss": 2.3791, "step": 28430 }, { "epoch": 0.76, "learning_rate": 0.0002780666945779838, "loss": 2.6419, "step": 28431 }, { "epoch": 0.76, "learning_rate": 0.00027800646944203247, "loss": 2.5459, "step": 28432 }, { "epoch": 0.76, "learning_rate": 0.0002779462497757752, "loss": 2.3592, "step": 28433 }, { "epoch": 0.76, "learning_rate": 0.0002778860355796677, "loss": 2.8066, "step": 28434 }, { "epoch": 0.76, "learning_rate": 0.00027782582685416667, "loss": 2.0641, "step": 28435 }, { "epoch": 0.76, "learning_rate": 0.00027776562359972803, "loss": 2.4168, "step": 28436 }, { "epoch": 0.76, "learning_rate": 0.0002777054258168078, "loss": 2.1663, "step": 28437 }, { "epoch": 0.76, "learning_rate": 0.00027764523350586246, "loss": 2.8304, "step": 28438 }, { "epoch": 0.76, "learning_rate": 0.0002775850466673474, "loss": 2.9252, "step": 28439 }, { "epoch": 0.76, "learning_rate": 0.0002775248653017189, "loss": 2.4241, "step": 28440 }, { "epoch": 0.76, "learning_rate": 0.00027746468940943313, "loss": 2.4827, "step": 28441 }, { "epoch": 0.76, "learning_rate": 0.0002774045189909451, "loss": 2.1371, "step": 28442 }, { "epoch": 0.76, "learning_rate": 0.00027734435404671155, "loss": 2.2009, "step": 28443 }, { "epoch": 0.76, "learning_rate": 0.0002772841945771882, "loss": 3.1857, "step": 28444 }, { "epoch": 0.76, "learning_rate": 0.00027722404058283046, "loss": 2.4015, "step": 28445 }, { "epoch": 0.76, "learning_rate": 0.00027716389206409434, "loss": 2.6735, "step": 28446 }, { "epoch": 0.76, "learning_rate": 0.0002771037490214351, "loss": 2.4326, "step": 28447 }, { "epoch": 0.76, "learning_rate": 0.0002770436114553085, "loss": 2.5626, "step": 28448 }, { "epoch": 0.76, "learning_rate": 0.0002769834793661703, "loss": 2.4406, "step": 28449 }, { "epoch": 0.76, "learning_rate": 0.0002769233527544761, "loss": 2.0346, "step": 28450 }, { "epoch": 0.76, "learning_rate": 0.00027686323162068115, "loss": 2.4047, "step": 28451 }, { "epoch": 0.76, "learning_rate": 0.00027680311596524153, "loss": 2.3594, "step": 28452 }, { "epoch": 0.76, "learning_rate": 0.00027674300578861175, "loss": 2.7641, "step": 28453 }, { "epoch": 0.76, "learning_rate": 0.00027668290109124805, "loss": 2.4852, "step": 28454 }, { "epoch": 0.76, "learning_rate": 0.00027662280187360476, "loss": 2.5448, "step": 28455 }, { "epoch": 0.76, "learning_rate": 0.00027656270813613816, "loss": 2.1818, "step": 28456 }, { "epoch": 0.76, "learning_rate": 0.00027650261987930335, "loss": 2.6817, "step": 28457 }, { "epoch": 0.76, "learning_rate": 0.00027644253710355505, "loss": 2.2083, "step": 28458 }, { "epoch": 0.76, "learning_rate": 0.00027638245980934873, "loss": 2.8146, "step": 28459 }, { "epoch": 0.76, "learning_rate": 0.0002763223879971398, "loss": 2.5924, "step": 28460 }, { "epoch": 0.76, "learning_rate": 0.0002762623216673829, "loss": 2.9959, "step": 28461 }, { "epoch": 0.76, "learning_rate": 0.0002762022608205331, "loss": 1.9167, "step": 28462 }, { "epoch": 0.76, "learning_rate": 0.0002761422054570457, "loss": 2.399, "step": 28463 }, { "epoch": 0.76, "learning_rate": 0.0002760821555773755, "loss": 2.2174, "step": 28464 }, { "epoch": 0.76, "learning_rate": 0.00027602211118197775, "loss": 2.2114, "step": 28465 }, { "epoch": 0.76, "learning_rate": 0.00027596207227130676, "loss": 2.6614, "step": 28466 }, { "epoch": 0.77, "learning_rate": 0.00027590203884581764, "loss": 2.7245, "step": 28467 }, { "epoch": 0.77, "learning_rate": 0.00027584201090596514, "loss": 1.7985, "step": 28468 }, { "epoch": 0.77, "learning_rate": 0.00027578198845220426, "loss": 2.8212, "step": 28469 }, { "epoch": 0.77, "learning_rate": 0.00027572197148498944, "loss": 2.5445, "step": 28470 }, { "epoch": 0.77, "learning_rate": 0.00027566196000477583, "loss": 2.5913, "step": 28471 }, { "epoch": 0.77, "learning_rate": 0.0002756019540120175, "loss": 2.3316, "step": 28472 }, { "epoch": 0.77, "learning_rate": 0.00027554195350716935, "loss": 2.8664, "step": 28473 }, { "epoch": 0.77, "learning_rate": 0.0002754819584906857, "loss": 2.4848, "step": 28474 }, { "epoch": 0.77, "learning_rate": 0.0002754219689630212, "loss": 2.7396, "step": 28475 }, { "epoch": 0.77, "learning_rate": 0.00027536198492463014, "loss": 2.2035, "step": 28476 }, { "epoch": 0.77, "learning_rate": 0.00027530200637596736, "loss": 2.6148, "step": 28477 }, { "epoch": 0.77, "learning_rate": 0.0002752420333174869, "loss": 2.0161, "step": 28478 }, { "epoch": 0.77, "learning_rate": 0.00027518206574964353, "loss": 2.3203, "step": 28479 }, { "epoch": 0.77, "learning_rate": 0.0002751221036728909, "loss": 3.0695, "step": 28480 }, { "epoch": 0.77, "learning_rate": 0.00027506214708768374, "loss": 2.8847, "step": 28481 }, { "epoch": 0.77, "learning_rate": 0.00027500219599447607, "loss": 2.3477, "step": 28482 }, { "epoch": 0.77, "learning_rate": 0.0002749422503937221, "loss": 2.2745, "step": 28483 }, { "epoch": 0.77, "learning_rate": 0.0002748823102858764, "loss": 2.4675, "step": 28484 }, { "epoch": 0.77, "learning_rate": 0.00027482237567139236, "loss": 2.4788, "step": 28485 }, { "epoch": 0.77, "learning_rate": 0.00027476244655072425, "loss": 2.3247, "step": 28486 }, { "epoch": 0.77, "learning_rate": 0.0002747025229243266, "loss": 2.3502, "step": 28487 }, { "epoch": 0.77, "learning_rate": 0.00027464260479265266, "loss": 2.6396, "step": 28488 }, { "epoch": 0.77, "learning_rate": 0.0002745826921561566, "loss": 1.8309, "step": 28489 }, { "epoch": 0.77, "learning_rate": 0.0002745227850152924, "loss": 2.4229, "step": 28490 }, { "epoch": 0.77, "learning_rate": 0.00027446288337051395, "loss": 2.4323, "step": 28491 }, { "epoch": 0.77, "learning_rate": 0.0002744029872222752, "loss": 2.4467, "step": 28492 }, { "epoch": 0.77, "learning_rate": 0.0002743430965710294, "loss": 2.3235, "step": 28493 }, { "epoch": 0.77, "learning_rate": 0.00027428321141723057, "loss": 2.3149, "step": 28494 }, { "epoch": 0.77, "learning_rate": 0.0002742233317613324, "loss": 2.4085, "step": 28495 }, { "epoch": 0.77, "learning_rate": 0.0002741634576037885, "loss": 2.8095, "step": 28496 }, { "epoch": 0.77, "learning_rate": 0.0002741035889450528, "loss": 2.3946, "step": 28497 }, { "epoch": 0.77, "learning_rate": 0.00027404372578557825, "loss": 1.885, "step": 28498 }, { "epoch": 0.77, "learning_rate": 0.00027398386812581857, "loss": 2.3412, "step": 28499 }, { "epoch": 0.77, "learning_rate": 0.0002739240159662276, "loss": 2.2173, "step": 28500 }, { "epoch": 0.77, "learning_rate": 0.00027386416930725823, "loss": 2.2265, "step": 28501 }, { "epoch": 0.77, "learning_rate": 0.00027380432814936374, "loss": 2.3993, "step": 28502 }, { "epoch": 0.77, "learning_rate": 0.0002737444924929985, "loss": 2.386, "step": 28503 }, { "epoch": 0.77, "learning_rate": 0.0002736846623386148, "loss": 2.4257, "step": 28504 }, { "epoch": 0.77, "learning_rate": 0.0002736248376866662, "loss": 2.3023, "step": 28505 }, { "epoch": 0.77, "learning_rate": 0.00027356501853760643, "loss": 3.0105, "step": 28506 }, { "epoch": 0.77, "learning_rate": 0.0002735052048918878, "loss": 2.4931, "step": 28507 }, { "epoch": 0.77, "learning_rate": 0.0002734453967499638, "loss": 2.6095, "step": 28508 }, { "epoch": 0.77, "learning_rate": 0.0002733855941122877, "loss": 2.5749, "step": 28509 }, { "epoch": 0.77, "learning_rate": 0.0002733257969793124, "loss": 2.2311, "step": 28510 }, { "epoch": 0.77, "learning_rate": 0.00027326600535149115, "loss": 2.7469, "step": 28511 }, { "epoch": 0.77, "learning_rate": 0.00027320621922927646, "loss": 2.4666, "step": 28512 }, { "epoch": 0.77, "learning_rate": 0.0002731464386131215, "loss": 2.0728, "step": 28513 }, { "epoch": 0.77, "learning_rate": 0.00027308666350347956, "loss": 2.5283, "step": 28514 }, { "epoch": 0.77, "learning_rate": 0.0002730268939008024, "loss": 2.3222, "step": 28515 }, { "epoch": 0.77, "learning_rate": 0.0002729671298055442, "loss": 2.832, "step": 28516 }, { "epoch": 0.77, "learning_rate": 0.00027290737121815666, "loss": 2.2662, "step": 28517 }, { "epoch": 0.77, "learning_rate": 0.00027284761813909286, "loss": 2.7177, "step": 28518 }, { "epoch": 0.77, "learning_rate": 0.00027278787056880593, "loss": 2.6191, "step": 28519 }, { "epoch": 0.77, "learning_rate": 0.00027272812850774776, "loss": 2.4726, "step": 28520 }, { "epoch": 0.77, "learning_rate": 0.00027266839195637117, "loss": 2.5717, "step": 28521 }, { "epoch": 0.77, "learning_rate": 0.0002726086609151288, "loss": 2.4043, "step": 28522 }, { "epoch": 0.77, "learning_rate": 0.0002725489353844732, "loss": 2.329, "step": 28523 }, { "epoch": 0.77, "learning_rate": 0.00027248921536485713, "loss": 1.8519, "step": 28524 }, { "epoch": 0.77, "learning_rate": 0.0002724295008567325, "loss": 2.4073, "step": 28525 }, { "epoch": 0.77, "learning_rate": 0.0002723697918605518, "loss": 2.1315, "step": 28526 }, { "epoch": 0.77, "learning_rate": 0.0002723100883767674, "loss": 2.5579, "step": 28527 }, { "epoch": 0.77, "learning_rate": 0.00027225039040583177, "loss": 2.7043, "step": 28528 }, { "epoch": 0.77, "learning_rate": 0.0002721906979481971, "loss": 2.4601, "step": 28529 }, { "epoch": 0.77, "learning_rate": 0.0002721310110043158, "loss": 2.3445, "step": 28530 }, { "epoch": 0.77, "learning_rate": 0.00027207132957463953, "loss": 2.2047, "step": 28531 }, { "epoch": 0.77, "learning_rate": 0.0002720116536596211, "loss": 2.5149, "step": 28532 }, { "epoch": 0.77, "learning_rate": 0.0002719519832597118, "loss": 2.652, "step": 28533 }, { "epoch": 0.77, "learning_rate": 0.0002718923183753642, "loss": 2.7154, "step": 28534 }, { "epoch": 0.77, "learning_rate": 0.00027183265900703027, "loss": 2.9445, "step": 28535 }, { "epoch": 0.77, "learning_rate": 0.0002717730051551618, "loss": 2.2179, "step": 28536 }, { "epoch": 0.77, "learning_rate": 0.00027171335682021094, "loss": 3.0128, "step": 28537 }, { "epoch": 0.77, "learning_rate": 0.0002716537140026298, "loss": 2.6453, "step": 28538 }, { "epoch": 0.77, "learning_rate": 0.00027159407670286964, "loss": 2.3352, "step": 28539 }, { "epoch": 0.77, "learning_rate": 0.0002715344449213824, "loss": 2.3479, "step": 28540 }, { "epoch": 0.77, "learning_rate": 0.00027147481865862, "loss": 2.185, "step": 28541 }, { "epoch": 0.77, "learning_rate": 0.00027141519791503424, "loss": 2.5348, "step": 28542 }, { "epoch": 0.77, "learning_rate": 0.00027135558269107685, "loss": 2.5191, "step": 28543 }, { "epoch": 0.77, "learning_rate": 0.000271295972987199, "loss": 2.4793, "step": 28544 }, { "epoch": 0.77, "learning_rate": 0.0002712363688038526, "loss": 2.0893, "step": 28545 }, { "epoch": 0.77, "learning_rate": 0.00027117677014148957, "loss": 2.8067, "step": 28546 }, { "epoch": 0.77, "learning_rate": 0.0002711171770005606, "loss": 2.466, "step": 28547 }, { "epoch": 0.77, "learning_rate": 0.0002710575893815174, "loss": 2.4331, "step": 28548 }, { "epoch": 0.77, "learning_rate": 0.00027099800728481207, "loss": 2.6269, "step": 28549 }, { "epoch": 0.77, "learning_rate": 0.0002709384307108953, "loss": 2.6353, "step": 28550 }, { "epoch": 0.77, "learning_rate": 0.0002708788596602189, "loss": 2.2619, "step": 28551 }, { "epoch": 0.77, "learning_rate": 0.0002708192941332336, "loss": 2.3989, "step": 28552 }, { "epoch": 0.77, "learning_rate": 0.0002707597341303909, "loss": 2.726, "step": 28553 }, { "epoch": 0.77, "learning_rate": 0.0002707001796521422, "loss": 2.6628, "step": 28554 }, { "epoch": 0.77, "learning_rate": 0.0002706406306989384, "loss": 2.341, "step": 28555 }, { "epoch": 0.77, "learning_rate": 0.00027058108727123087, "loss": 2.4888, "step": 28556 }, { "epoch": 0.77, "learning_rate": 0.00027052154936947094, "loss": 2.5459, "step": 28557 }, { "epoch": 0.77, "learning_rate": 0.000270462016994109, "loss": 2.2051, "step": 28558 }, { "epoch": 0.77, "learning_rate": 0.0002704024901455967, "loss": 2.6625, "step": 28559 }, { "epoch": 0.77, "learning_rate": 0.00027034296882438445, "loss": 2.2243, "step": 28560 }, { "epoch": 0.77, "learning_rate": 0.00027028345303092307, "loss": 2.2839, "step": 28561 }, { "epoch": 0.77, "learning_rate": 0.0002702239427656644, "loss": 2.6411, "step": 28562 }, { "epoch": 0.77, "learning_rate": 0.0002701644380290583, "loss": 2.3396, "step": 28563 }, { "epoch": 0.77, "learning_rate": 0.00027010493882155605, "loss": 3.2028, "step": 28564 }, { "epoch": 0.77, "learning_rate": 0.0002700454451436085, "loss": 2.7158, "step": 28565 }, { "epoch": 0.77, "learning_rate": 0.00026998595699566586, "loss": 1.9675, "step": 28566 }, { "epoch": 0.77, "learning_rate": 0.0002699264743781792, "loss": 2.4344, "step": 28567 }, { "epoch": 0.77, "learning_rate": 0.0002698669972915989, "loss": 2.3128, "step": 28568 }, { "epoch": 0.77, "learning_rate": 0.00026980752573637577, "loss": 2.6857, "step": 28569 }, { "epoch": 0.77, "learning_rate": 0.0002697480597129606, "loss": 2.5203, "step": 28570 }, { "epoch": 0.77, "learning_rate": 0.0002696885992218032, "loss": 2.5922, "step": 28571 }, { "epoch": 0.77, "learning_rate": 0.00026962914426335437, "loss": 2.5798, "step": 28572 }, { "epoch": 0.77, "learning_rate": 0.00026956969483806506, "loss": 2.0065, "step": 28573 }, { "epoch": 0.77, "learning_rate": 0.00026951025094638437, "loss": 2.2551, "step": 28574 }, { "epoch": 0.77, "learning_rate": 0.00026945081258876403, "loss": 1.7487, "step": 28575 }, { "epoch": 0.77, "learning_rate": 0.00026939137976565356, "loss": 2.3243, "step": 28576 }, { "epoch": 0.77, "learning_rate": 0.0002693319524775032, "loss": 2.318, "step": 28577 }, { "epoch": 0.77, "learning_rate": 0.00026927253072476376, "loss": 2.1714, "step": 28578 }, { "epoch": 0.77, "learning_rate": 0.00026921311450788465, "loss": 2.9321, "step": 28579 }, { "epoch": 0.77, "learning_rate": 0.0002691537038273163, "loss": 2.5928, "step": 28580 }, { "epoch": 0.77, "learning_rate": 0.00026909429868350886, "loss": 2.3888, "step": 28581 }, { "epoch": 0.77, "learning_rate": 0.00026903489907691234, "loss": 1.9696, "step": 28582 }, { "epoch": 0.77, "learning_rate": 0.00026897550500797675, "loss": 2.5392, "step": 28583 }, { "epoch": 0.77, "learning_rate": 0.0002689161164771523, "loss": 2.4655, "step": 28584 }, { "epoch": 0.77, "learning_rate": 0.0002688567334848885, "loss": 2.28, "step": 28585 }, { "epoch": 0.77, "learning_rate": 0.00026879735603163547, "loss": 2.5678, "step": 28586 }, { "epoch": 0.77, "learning_rate": 0.00026873798411784246, "loss": 1.7069, "step": 28587 }, { "epoch": 0.77, "learning_rate": 0.00026867861774395994, "loss": 2.6122, "step": 28588 }, { "epoch": 0.77, "learning_rate": 0.00026861925691043785, "loss": 2.6153, "step": 28589 }, { "epoch": 0.77, "learning_rate": 0.0002685599016177253, "loss": 2.7542, "step": 28590 }, { "epoch": 0.77, "learning_rate": 0.000268500551866272, "loss": 2.3702, "step": 28591 }, { "epoch": 0.77, "learning_rate": 0.000268441207656528, "loss": 2.4687, "step": 28592 }, { "epoch": 0.77, "learning_rate": 0.0002683818689889425, "loss": 2.6371, "step": 28593 }, { "epoch": 0.77, "learning_rate": 0.00026832253586396505, "loss": 2.1195, "step": 28594 }, { "epoch": 0.77, "learning_rate": 0.0002682632082820453, "loss": 2.6489, "step": 28595 }, { "epoch": 0.77, "learning_rate": 0.0002682038862436326, "loss": 2.5357, "step": 28596 }, { "epoch": 0.77, "learning_rate": 0.00026814456974917677, "loss": 2.5084, "step": 28597 }, { "epoch": 0.77, "learning_rate": 0.0002680852587991266, "loss": 2.6773, "step": 28598 }, { "epoch": 0.77, "learning_rate": 0.00026802595339393153, "loss": 2.2715, "step": 28599 }, { "epoch": 0.77, "learning_rate": 0.00026796665353404103, "loss": 2.3615, "step": 28600 }, { "epoch": 0.77, "learning_rate": 0.00026790735921990426, "loss": 2.5951, "step": 28601 }, { "epoch": 0.77, "learning_rate": 0.0002678480704519708, "loss": 2.8284, "step": 28602 }, { "epoch": 0.77, "learning_rate": 0.0002677887872306891, "loss": 2.7378, "step": 28603 }, { "epoch": 0.77, "learning_rate": 0.0002677295095565088, "loss": 2.8663, "step": 28604 }, { "epoch": 0.77, "learning_rate": 0.00026767023742987894, "loss": 2.594, "step": 28605 }, { "epoch": 0.77, "learning_rate": 0.0002676109708512482, "loss": 2.2853, "step": 28606 }, { "epoch": 0.77, "learning_rate": 0.0002675517098210658, "loss": 2.4177, "step": 28607 }, { "epoch": 0.77, "learning_rate": 0.0002674924543397806, "loss": 2.0415, "step": 28608 }, { "epoch": 0.77, "learning_rate": 0.0002674332044078418, "loss": 2.7765, "step": 28609 }, { "epoch": 0.77, "learning_rate": 0.00026737396002569826, "loss": 2.4863, "step": 28610 }, { "epoch": 0.77, "learning_rate": 0.0002673147211937984, "loss": 2.5336, "step": 28611 }, { "epoch": 0.77, "learning_rate": 0.0002672554879125911, "loss": 2.6151, "step": 28612 }, { "epoch": 0.77, "learning_rate": 0.0002671962601825253, "loss": 2.6433, "step": 28613 }, { "epoch": 0.77, "learning_rate": 0.00026713703800404953, "loss": 2.6917, "step": 28614 }, { "epoch": 0.77, "learning_rate": 0.00026707782137761263, "loss": 2.7455, "step": 28615 }, { "epoch": 0.77, "learning_rate": 0.00026701861030366334, "loss": 2.2416, "step": 28616 }, { "epoch": 0.77, "learning_rate": 0.00026695940478264977, "loss": 2.5801, "step": 28617 }, { "epoch": 0.77, "learning_rate": 0.0002669002048150208, "loss": 2.6312, "step": 28618 }, { "epoch": 0.77, "learning_rate": 0.000266841010401225, "loss": 2.461, "step": 28619 }, { "epoch": 0.77, "learning_rate": 0.00026678182154171026, "loss": 2.6592, "step": 28620 }, { "epoch": 0.77, "learning_rate": 0.00026672263823692544, "loss": 2.6268, "step": 28621 }, { "epoch": 0.77, "learning_rate": 0.00026666346048731884, "loss": 2.6053, "step": 28622 }, { "epoch": 0.77, "learning_rate": 0.00026660428829333873, "loss": 2.759, "step": 28623 }, { "epoch": 0.77, "learning_rate": 0.00026654512165543364, "loss": 2.4265, "step": 28624 }, { "epoch": 0.77, "learning_rate": 0.0002664859605740513, "loss": 2.3083, "step": 28625 }, { "epoch": 0.77, "learning_rate": 0.00026642680504964023, "loss": 2.2675, "step": 28626 }, { "epoch": 0.77, "learning_rate": 0.0002663676550826486, "loss": 2.066, "step": 28627 }, { "epoch": 0.77, "learning_rate": 0.00026630851067352434, "loss": 2.389, "step": 28628 }, { "epoch": 0.77, "learning_rate": 0.00026624937182271593, "loss": 2.4807, "step": 28629 }, { "epoch": 0.77, "learning_rate": 0.0002661902385306708, "loss": 2.1615, "step": 28630 }, { "epoch": 0.77, "learning_rate": 0.00026613111079783734, "loss": 2.2434, "step": 28631 }, { "epoch": 0.77, "learning_rate": 0.0002660719886246635, "loss": 2.0834, "step": 28632 }, { "epoch": 0.77, "learning_rate": 0.000266012872011597, "loss": 2.3357, "step": 28633 }, { "epoch": 0.77, "learning_rate": 0.0002659537609590853, "loss": 2.3704, "step": 28634 }, { "epoch": 0.77, "learning_rate": 0.0002658946554675773, "loss": 1.9384, "step": 28635 }, { "epoch": 0.77, "learning_rate": 0.0002658355555375198, "loss": 2.1036, "step": 28636 }, { "epoch": 0.77, "learning_rate": 0.0002657764611693612, "loss": 2.1526, "step": 28637 }, { "epoch": 0.77, "learning_rate": 0.00026571737236354853, "loss": 2.7062, "step": 28638 }, { "epoch": 0.77, "learning_rate": 0.0002656582891205299, "loss": 2.2846, "step": 28639 }, { "epoch": 0.77, "learning_rate": 0.0002655992114407527, "loss": 2.621, "step": 28640 }, { "epoch": 0.77, "learning_rate": 0.0002655401393246646, "loss": 2.3354, "step": 28641 }, { "epoch": 0.77, "learning_rate": 0.00026548107277271307, "loss": 2.8656, "step": 28642 }, { "epoch": 0.77, "learning_rate": 0.0002654220117853459, "loss": 2.1866, "step": 28643 }, { "epoch": 0.77, "learning_rate": 0.0002653629563630099, "loss": 2.0819, "step": 28644 }, { "epoch": 0.77, "learning_rate": 0.00026530390650615323, "loss": 2.7545, "step": 28645 }, { "epoch": 0.77, "learning_rate": 0.0002652448622152224, "loss": 2.5583, "step": 28646 }, { "epoch": 0.77, "learning_rate": 0.0002651858234906649, "loss": 2.3558, "step": 28647 }, { "epoch": 0.77, "learning_rate": 0.00026512679033292874, "loss": 2.2084, "step": 28648 }, { "epoch": 0.77, "learning_rate": 0.00026506776274246035, "loss": 2.385, "step": 28649 }, { "epoch": 0.77, "learning_rate": 0.00026500874071970726, "loss": 2.6092, "step": 28650 }, { "epoch": 0.77, "learning_rate": 0.0002649497242651169, "loss": 2.2531, "step": 28651 }, { "epoch": 0.77, "learning_rate": 0.0002648907133791356, "loss": 2.2475, "step": 28652 }, { "epoch": 0.77, "learning_rate": 0.0002648317080622108, "loss": 2.8095, "step": 28653 }, { "epoch": 0.77, "learning_rate": 0.0002647727083147896, "loss": 2.1252, "step": 28654 }, { "epoch": 0.77, "learning_rate": 0.000264713714137319, "loss": 2.7086, "step": 28655 }, { "epoch": 0.77, "learning_rate": 0.00026465472553024603, "loss": 2.5043, "step": 28656 }, { "epoch": 0.77, "learning_rate": 0.0002645957424940172, "loss": 2.466, "step": 28657 }, { "epoch": 0.77, "learning_rate": 0.0002645367650290794, "loss": 2.3887, "step": 28658 }, { "epoch": 0.77, "learning_rate": 0.00026447779313588005, "loss": 2.5715, "step": 28659 }, { "epoch": 0.77, "learning_rate": 0.0002644188268148647, "loss": 2.3977, "step": 28660 }, { "epoch": 0.77, "learning_rate": 0.0002643598660664812, "loss": 1.7894, "step": 28661 }, { "epoch": 0.77, "learning_rate": 0.00026430091089117605, "loss": 2.6285, "step": 28662 }, { "epoch": 0.77, "learning_rate": 0.0002642419612893954, "loss": 2.4527, "step": 28663 }, { "epoch": 0.77, "learning_rate": 0.00026418301726158645, "loss": 2.0809, "step": 28664 }, { "epoch": 0.77, "learning_rate": 0.0002641240788081951, "loss": 2.3471, "step": 28665 }, { "epoch": 0.77, "learning_rate": 0.0002640651459296681, "loss": 2.5403, "step": 28666 }, { "epoch": 0.77, "learning_rate": 0.000264006218626452, "loss": 2.2514, "step": 28667 }, { "epoch": 0.77, "learning_rate": 0.00026394729689899335, "loss": 2.1179, "step": 28668 }, { "epoch": 0.77, "learning_rate": 0.00026388838074773823, "loss": 2.3417, "step": 28669 }, { "epoch": 0.77, "learning_rate": 0.00026382947017313343, "loss": 2.4871, "step": 28670 }, { "epoch": 0.77, "learning_rate": 0.0002637705651756247, "loss": 2.3431, "step": 28671 }, { "epoch": 0.77, "learning_rate": 0.00026371166575565885, "loss": 2.3195, "step": 28672 }, { "epoch": 0.77, "learning_rate": 0.0002636527719136812, "loss": 2.4689, "step": 28673 }, { "epoch": 0.77, "learning_rate": 0.0002635938836501387, "loss": 2.628, "step": 28674 }, { "epoch": 0.77, "learning_rate": 0.00026353500096547766, "loss": 2.6178, "step": 28675 }, { "epoch": 0.77, "learning_rate": 0.0002634761238601435, "loss": 2.8164, "step": 28676 }, { "epoch": 0.77, "learning_rate": 0.0002634172523345826, "loss": 2.3667, "step": 28677 }, { "epoch": 0.77, "learning_rate": 0.000263358386389241, "loss": 3.0041, "step": 28678 }, { "epoch": 0.77, "learning_rate": 0.00026329952602456444, "loss": 2.8417, "step": 28679 }, { "epoch": 0.77, "learning_rate": 0.0002632406712409989, "loss": 2.2612, "step": 28680 }, { "epoch": 0.77, "learning_rate": 0.00026318182203899034, "loss": 2.6016, "step": 28681 }, { "epoch": 0.77, "learning_rate": 0.0002631229784189846, "loss": 2.31, "step": 28682 }, { "epoch": 0.77, "learning_rate": 0.0002630641403814277, "loss": 2.1921, "step": 28683 }, { "epoch": 0.77, "learning_rate": 0.0002630053079267648, "loss": 2.2789, "step": 28684 }, { "epoch": 0.77, "learning_rate": 0.00026294648105544197, "loss": 2.9093, "step": 28685 }, { "epoch": 0.77, "learning_rate": 0.00026288765976790476, "loss": 2.2746, "step": 28686 }, { "epoch": 0.77, "learning_rate": 0.0002628288440645988, "loss": 2.9689, "step": 28687 }, { "epoch": 0.77, "learning_rate": 0.00026277003394597023, "loss": 2.409, "step": 28688 }, { "epoch": 0.77, "learning_rate": 0.00026271122941246363, "loss": 2.335, "step": 28689 }, { "epoch": 0.77, "learning_rate": 0.000262652430464525, "loss": 2.6411, "step": 28690 }, { "epoch": 0.77, "learning_rate": 0.0002625936371026, "loss": 2.4709, "step": 28691 }, { "epoch": 0.77, "learning_rate": 0.00026253484932713345, "loss": 2.8195, "step": 28692 }, { "epoch": 0.77, "learning_rate": 0.00026247606713857073, "loss": 2.2565, "step": 28693 }, { "epoch": 0.77, "learning_rate": 0.0002624172905373582, "loss": 2.573, "step": 28694 }, { "epoch": 0.77, "learning_rate": 0.00026235851952393995, "loss": 2.3814, "step": 28695 }, { "epoch": 0.77, "learning_rate": 0.0002622997540987617, "loss": 2.8294, "step": 28696 }, { "epoch": 0.77, "learning_rate": 0.000262240994262269, "loss": 2.5752, "step": 28697 }, { "epoch": 0.77, "learning_rate": 0.0002621822400149063, "loss": 2.6559, "step": 28698 }, { "epoch": 0.77, "learning_rate": 0.000262123491357119, "loss": 2.1325, "step": 28699 }, { "epoch": 0.77, "learning_rate": 0.00026206474828935225, "loss": 3.046, "step": 28700 }, { "epoch": 0.77, "learning_rate": 0.000262006010812051, "loss": 2.151, "step": 28701 }, { "epoch": 0.77, "learning_rate": 0.0002619472789256606, "loss": 2.5484, "step": 28702 }, { "epoch": 0.77, "learning_rate": 0.0002618885526306254, "loss": 2.4279, "step": 28703 }, { "epoch": 0.77, "learning_rate": 0.0002618298319273905, "loss": 2.6209, "step": 28704 }, { "epoch": 0.77, "learning_rate": 0.0002617711168164012, "loss": 2.4351, "step": 28705 }, { "epoch": 0.77, "learning_rate": 0.0002617124072981012, "loss": 2.4099, "step": 28706 }, { "epoch": 0.77, "learning_rate": 0.0002616537033729367, "loss": 2.6537, "step": 28707 }, { "epoch": 0.77, "learning_rate": 0.0002615950050413515, "loss": 2.3706, "step": 28708 }, { "epoch": 0.77, "learning_rate": 0.0002615363123037904, "loss": 2.3608, "step": 28709 }, { "epoch": 0.77, "learning_rate": 0.0002614776251606985, "loss": 2.6582, "step": 28710 }, { "epoch": 0.77, "learning_rate": 0.00026141894361251985, "loss": 2.7152, "step": 28711 }, { "epoch": 0.77, "learning_rate": 0.00026136026765969923, "loss": 2.6297, "step": 28712 }, { "epoch": 0.77, "learning_rate": 0.0002613015973026811, "loss": 2.4248, "step": 28713 }, { "epoch": 0.77, "learning_rate": 0.00026124293254191003, "loss": 2.1687, "step": 28714 }, { "epoch": 0.77, "learning_rate": 0.0002611842733778307, "loss": 2.2208, "step": 28715 }, { "epoch": 0.77, "learning_rate": 0.000261125619810887, "loss": 2.457, "step": 28716 }, { "epoch": 0.77, "learning_rate": 0.0002610669718415234, "loss": 2.8249, "step": 28717 }, { "epoch": 0.77, "learning_rate": 0.0002610083294701847, "loss": 2.1664, "step": 28718 }, { "epoch": 0.77, "learning_rate": 0.0002609496926973142, "loss": 2.5202, "step": 28719 }, { "epoch": 0.77, "learning_rate": 0.00026089106152335685, "loss": 2.8456, "step": 28720 }, { "epoch": 0.77, "learning_rate": 0.00026083243594875703, "loss": 2.9315, "step": 28721 }, { "epoch": 0.77, "learning_rate": 0.00026077381597395833, "loss": 2.6651, "step": 28722 }, { "epoch": 0.77, "learning_rate": 0.0002607152015994053, "loss": 2.1381, "step": 28723 }, { "epoch": 0.77, "learning_rate": 0.00026065659282554143, "loss": 1.9305, "step": 28724 }, { "epoch": 0.77, "learning_rate": 0.00026059798965281103, "loss": 2.0833, "step": 28725 }, { "epoch": 0.77, "learning_rate": 0.000260539392081658, "loss": 2.6493, "step": 28726 }, { "epoch": 0.77, "learning_rate": 0.0002604808001125264, "loss": 1.9957, "step": 28727 }, { "epoch": 0.77, "learning_rate": 0.00026042221374585994, "loss": 3.028, "step": 28728 }, { "epoch": 0.77, "learning_rate": 0.000260363632982103, "loss": 2.5769, "step": 28729 }, { "epoch": 0.77, "learning_rate": 0.00026030505782169856, "loss": 2.3259, "step": 28730 }, { "epoch": 0.77, "learning_rate": 0.0002602464882650908, "loss": 2.4272, "step": 28731 }, { "epoch": 0.77, "learning_rate": 0.0002601879243127234, "loss": 2.5898, "step": 28732 }, { "epoch": 0.77, "learning_rate": 0.00026012936596504, "loss": 2.0252, "step": 28733 }, { "epoch": 0.77, "learning_rate": 0.0002600708132224845, "loss": 2.4477, "step": 28734 }, { "epoch": 0.77, "learning_rate": 0.0002600122660855, "loss": 2.0998, "step": 28735 }, { "epoch": 0.77, "learning_rate": 0.00025995372455453025, "loss": 2.7342, "step": 28736 }, { "epoch": 0.77, "learning_rate": 0.00025989518863001905, "loss": 2.5305, "step": 28737 }, { "epoch": 0.77, "learning_rate": 0.0002598366583124093, "loss": 2.4974, "step": 28738 }, { "epoch": 0.77, "learning_rate": 0.00025977813360214476, "loss": 2.3459, "step": 28739 }, { "epoch": 0.77, "learning_rate": 0.00025971961449966865, "loss": 2.2256, "step": 28740 }, { "epoch": 0.77, "learning_rate": 0.0002596611010054244, "loss": 2.3512, "step": 28741 }, { "epoch": 0.77, "learning_rate": 0.0002596025931198557, "loss": 2.5608, "step": 28742 }, { "epoch": 0.77, "learning_rate": 0.0002595440908434049, "loss": 2.163, "step": 28743 }, { "epoch": 0.77, "learning_rate": 0.0002594855941765158, "loss": 2.1043, "step": 28744 }, { "epoch": 0.77, "learning_rate": 0.0002594271031196315, "loss": 2.2119, "step": 28745 }, { "epoch": 0.77, "learning_rate": 0.000259368617673195, "loss": 2.2921, "step": 28746 }, { "epoch": 0.77, "learning_rate": 0.00025931013783764945, "loss": 2.417, "step": 28747 }, { "epoch": 0.77, "learning_rate": 0.00025925166361343813, "loss": 2.4809, "step": 28748 }, { "epoch": 0.77, "learning_rate": 0.0002591931950010035, "loss": 2.2775, "step": 28749 }, { "epoch": 0.77, "learning_rate": 0.0002591347320007891, "loss": 2.425, "step": 28750 }, { "epoch": 0.77, "learning_rate": 0.0002590762746132371, "loss": 2.1507, "step": 28751 }, { "epoch": 0.77, "learning_rate": 0.0002590178228387909, "loss": 2.2284, "step": 28752 }, { "epoch": 0.77, "learning_rate": 0.00025895937667789326, "loss": 2.318, "step": 28753 }, { "epoch": 0.77, "learning_rate": 0.00025890093613098675, "loss": 2.98, "step": 28754 }, { "epoch": 0.77, "learning_rate": 0.0002588425011985144, "loss": 2.1981, "step": 28755 }, { "epoch": 0.77, "learning_rate": 0.0002587840718809189, "loss": 2.15, "step": 28756 }, { "epoch": 0.77, "learning_rate": 0.0002587256481786425, "loss": 2.3835, "step": 28757 }, { "epoch": 0.77, "learning_rate": 0.0002586672300921281, "loss": 2.4812, "step": 28758 }, { "epoch": 0.77, "learning_rate": 0.0002586088176218182, "loss": 2.1707, "step": 28759 }, { "epoch": 0.77, "learning_rate": 0.00025855041076815546, "loss": 2.4613, "step": 28760 }, { "epoch": 0.77, "learning_rate": 0.00025849200953158237, "loss": 2.679, "step": 28761 }, { "epoch": 0.77, "learning_rate": 0.00025843361391254105, "loss": 2.2088, "step": 28762 }, { "epoch": 0.77, "learning_rate": 0.00025837522391147403, "loss": 2.6272, "step": 28763 }, { "epoch": 0.77, "learning_rate": 0.00025831683952882414, "loss": 2.3491, "step": 28764 }, { "epoch": 0.77, "learning_rate": 0.0002582584607650329, "loss": 2.6957, "step": 28765 }, { "epoch": 0.77, "learning_rate": 0.0002582000876205426, "loss": 2.6233, "step": 28766 }, { "epoch": 0.77, "learning_rate": 0.0002581417200957965, "loss": 2.7062, "step": 28767 }, { "epoch": 0.77, "learning_rate": 0.0002580833581912357, "loss": 2.7233, "step": 28768 }, { "epoch": 0.77, "learning_rate": 0.00025802500190730314, "loss": 2.9548, "step": 28769 }, { "epoch": 0.77, "learning_rate": 0.0002579666512444402, "loss": 2.9276, "step": 28770 }, { "epoch": 0.77, "learning_rate": 0.00025790830620308914, "loss": 2.2585, "step": 28771 }, { "epoch": 0.77, "learning_rate": 0.0002578499667836922, "loss": 2.8761, "step": 28772 }, { "epoch": 0.77, "learning_rate": 0.00025779163298669116, "loss": 2.2286, "step": 28773 }, { "epoch": 0.77, "learning_rate": 0.000257733304812528, "loss": 2.0296, "step": 28774 }, { "epoch": 0.77, "learning_rate": 0.00025767498226164496, "loss": 2.4676, "step": 28775 }, { "epoch": 0.77, "learning_rate": 0.00025761666533448326, "loss": 2.595, "step": 28776 }, { "epoch": 0.77, "learning_rate": 0.0002575583540314853, "loss": 2.5646, "step": 28777 }, { "epoch": 0.77, "learning_rate": 0.00025750004835309217, "loss": 2.7111, "step": 28778 }, { "epoch": 0.77, "learning_rate": 0.00025744174829974554, "loss": 2.537, "step": 28779 }, { "epoch": 0.77, "learning_rate": 0.00025738345387188823, "loss": 2.7389, "step": 28780 }, { "epoch": 0.77, "learning_rate": 0.0002573251650699606, "loss": 2.5776, "step": 28781 }, { "epoch": 0.77, "learning_rate": 0.00025726688189440497, "loss": 2.5436, "step": 28782 }, { "epoch": 0.77, "learning_rate": 0.00025720860434566285, "loss": 2.6988, "step": 28783 }, { "epoch": 0.77, "learning_rate": 0.0002571503324241752, "loss": 2.4211, "step": 28784 }, { "epoch": 0.77, "learning_rate": 0.00025709206613038394, "loss": 2.6322, "step": 28785 }, { "epoch": 0.77, "learning_rate": 0.0002570338054647302, "loss": 1.8878, "step": 28786 }, { "epoch": 0.77, "learning_rate": 0.00025697555042765566, "loss": 2.3792, "step": 28787 }, { "epoch": 0.77, "learning_rate": 0.0002569173010196018, "loss": 2.7776, "step": 28788 }, { "epoch": 0.77, "learning_rate": 0.0002568590572410092, "loss": 2.354, "step": 28789 }, { "epoch": 0.77, "learning_rate": 0.0002568008190923197, "loss": 2.6628, "step": 28790 }, { "epoch": 0.77, "learning_rate": 0.0002567425865739744, "loss": 2.4861, "step": 28791 }, { "epoch": 0.77, "learning_rate": 0.00025668435968641403, "loss": 2.2025, "step": 28792 }, { "epoch": 0.77, "learning_rate": 0.00025662613843008053, "loss": 2.6696, "step": 28793 }, { "epoch": 0.77, "learning_rate": 0.0002565679228054142, "loss": 2.7744, "step": 28794 }, { "epoch": 0.77, "learning_rate": 0.0002565097128128564, "loss": 2.3013, "step": 28795 }, { "epoch": 0.77, "learning_rate": 0.0002564515084528484, "loss": 2.1854, "step": 28796 }, { "epoch": 0.77, "learning_rate": 0.00025639330972583043, "loss": 2.8591, "step": 28797 }, { "epoch": 0.77, "learning_rate": 0.00025633511663224385, "loss": 2.6127, "step": 28798 }, { "epoch": 0.77, "learning_rate": 0.00025627692917252955, "loss": 2.5962, "step": 28799 }, { "epoch": 0.77, "learning_rate": 0.00025621874734712825, "loss": 2.5598, "step": 28800 }, { "epoch": 0.77, "learning_rate": 0.00025616057115648096, "loss": 2.3994, "step": 28801 }, { "epoch": 0.77, "learning_rate": 0.00025610240060102796, "loss": 2.3228, "step": 28802 }, { "epoch": 0.77, "learning_rate": 0.00025604423568121015, "loss": 2.1237, "step": 28803 }, { "epoch": 0.77, "learning_rate": 0.00025598607639746863, "loss": 2.7619, "step": 28804 }, { "epoch": 0.77, "learning_rate": 0.0002559279227502428, "loss": 2.1088, "step": 28805 }, { "epoch": 0.77, "learning_rate": 0.0002558697747399744, "loss": 2.5471, "step": 28806 }, { "epoch": 0.77, "learning_rate": 0.0002558116323671038, "loss": 2.549, "step": 28807 }, { "epoch": 0.77, "learning_rate": 0.000255753495632071, "loss": 2.5074, "step": 28808 }, { "epoch": 0.77, "learning_rate": 0.0002556953645353166, "loss": 2.2864, "step": 28809 }, { "epoch": 0.77, "learning_rate": 0.0002556372390772813, "loss": 2.3324, "step": 28810 }, { "epoch": 0.77, "learning_rate": 0.00025557911925840494, "loss": 2.4629, "step": 28811 }, { "epoch": 0.77, "learning_rate": 0.0002555210050791281, "loss": 1.8842, "step": 28812 }, { "epoch": 0.77, "learning_rate": 0.0002554628965398911, "loss": 2.4424, "step": 28813 }, { "epoch": 0.77, "learning_rate": 0.000255404793641134, "loss": 2.5872, "step": 28814 }, { "epoch": 0.77, "learning_rate": 0.0002553466963832973, "loss": 2.6185, "step": 28815 }, { "epoch": 0.77, "learning_rate": 0.0002552886047668207, "loss": 2.4259, "step": 28816 }, { "epoch": 0.77, "learning_rate": 0.00025523051879214445, "loss": 2.3543, "step": 28817 }, { "epoch": 0.77, "learning_rate": 0.0002551724384597086, "loss": 2.1383, "step": 28818 }, { "epoch": 0.77, "learning_rate": 0.0002551143637699532, "loss": 2.2366, "step": 28819 }, { "epoch": 0.77, "learning_rate": 0.0002550562947233186, "loss": 2.4507, "step": 28820 }, { "epoch": 0.77, "learning_rate": 0.0002549982313202439, "loss": 2.5954, "step": 28821 }, { "epoch": 0.77, "learning_rate": 0.0002549401735611695, "loss": 2.5623, "step": 28822 }, { "epoch": 0.77, "learning_rate": 0.00025488212144653545, "loss": 2.0445, "step": 28823 }, { "epoch": 0.77, "learning_rate": 0.0002548240749767808, "loss": 2.6666, "step": 28824 }, { "epoch": 0.77, "learning_rate": 0.0002547660341523459, "loss": 2.5894, "step": 28825 }, { "epoch": 0.77, "learning_rate": 0.00025470799897367024, "loss": 2.333, "step": 28826 }, { "epoch": 0.77, "learning_rate": 0.0002546499694411936, "loss": 2.3005, "step": 28827 }, { "epoch": 0.77, "learning_rate": 0.0002545919455553557, "loss": 2.6048, "step": 28828 }, { "epoch": 0.77, "learning_rate": 0.0002545339273165956, "loss": 2.5376, "step": 28829 }, { "epoch": 0.77, "learning_rate": 0.00025447591472535334, "loss": 2.583, "step": 28830 }, { "epoch": 0.77, "learning_rate": 0.0002544179077820682, "loss": 2.8544, "step": 28831 }, { "epoch": 0.77, "learning_rate": 0.00025435990648717976, "loss": 2.18, "step": 28832 }, { "epoch": 0.77, "learning_rate": 0.0002543019108411273, "loss": 2.3409, "step": 28833 }, { "epoch": 0.77, "learning_rate": 0.00025424392084435056, "loss": 2.3482, "step": 28834 }, { "epoch": 0.77, "learning_rate": 0.0002541859364972883, "loss": 2.8477, "step": 28835 }, { "epoch": 0.77, "learning_rate": 0.00025412795780038023, "loss": 2.5671, "step": 28836 }, { "epoch": 0.77, "learning_rate": 0.0002540699847540652, "loss": 2.2562, "step": 28837 }, { "epoch": 0.77, "learning_rate": 0.00025401201735878256, "loss": 2.9297, "step": 28838 }, { "epoch": 0.78, "learning_rate": 0.0002539540556149714, "loss": 2.6003, "step": 28839 }, { "epoch": 0.78, "learning_rate": 0.00025389609952307114, "loss": 2.6528, "step": 28840 }, { "epoch": 0.78, "learning_rate": 0.00025383814908352053, "loss": 2.3477, "step": 28841 }, { "epoch": 0.78, "learning_rate": 0.000253780204296759, "loss": 3.3899, "step": 28842 }, { "epoch": 0.78, "learning_rate": 0.00025372226516322494, "loss": 2.5397, "step": 28843 }, { "epoch": 0.78, "learning_rate": 0.00025366433168335755, "loss": 2.4509, "step": 28844 }, { "epoch": 0.78, "learning_rate": 0.00025360640385759583, "loss": 2.5321, "step": 28845 }, { "epoch": 0.78, "learning_rate": 0.0002535484816863786, "loss": 2.7226, "step": 28846 }, { "epoch": 0.78, "learning_rate": 0.0002534905651701448, "loss": 2.5628, "step": 28847 }, { "epoch": 0.78, "learning_rate": 0.00025343265430933273, "loss": 2.3912, "step": 28848 }, { "epoch": 0.78, "learning_rate": 0.0002533747491043814, "loss": 2.632, "step": 28849 }, { "epoch": 0.78, "learning_rate": 0.00025331684955572976, "loss": 2.3537, "step": 28850 }, { "epoch": 0.78, "learning_rate": 0.00025325895566381595, "loss": 2.87, "step": 28851 }, { "epoch": 0.78, "learning_rate": 0.0002532010674290784, "loss": 2.4534, "step": 28852 }, { "epoch": 0.78, "learning_rate": 0.00025314318485195677, "loss": 1.9863, "step": 28853 }, { "epoch": 0.78, "learning_rate": 0.0002530853079328884, "loss": 1.8354, "step": 28854 }, { "epoch": 0.78, "learning_rate": 0.00025302743667231253, "loss": 2.3133, "step": 28855 }, { "epoch": 0.78, "learning_rate": 0.00025296957107066696, "loss": 2.3386, "step": 28856 }, { "epoch": 0.78, "learning_rate": 0.0002529117111283905, "loss": 2.6697, "step": 28857 }, { "epoch": 0.78, "learning_rate": 0.00025285385684592124, "loss": 2.589, "step": 28858 }, { "epoch": 0.78, "learning_rate": 0.0002527960082236975, "loss": 2.7942, "step": 28859 }, { "epoch": 0.78, "learning_rate": 0.00025273816526215776, "loss": 3.0172, "step": 28860 }, { "epoch": 0.78, "learning_rate": 0.00025268032796174037, "loss": 2.8602, "step": 28861 }, { "epoch": 0.78, "learning_rate": 0.0002526224963228828, "loss": 2.4432, "step": 28862 }, { "epoch": 0.78, "learning_rate": 0.0002525646703460239, "loss": 3.0165, "step": 28863 }, { "epoch": 0.78, "learning_rate": 0.000252506850031601, "loss": 1.9532, "step": 28864 }, { "epoch": 0.78, "learning_rate": 0.0002524490353800527, "loss": 2.7727, "step": 28865 }, { "epoch": 0.78, "learning_rate": 0.0002523912263918172, "loss": 2.7196, "step": 28866 }, { "epoch": 0.78, "learning_rate": 0.00025233342306733175, "loss": 2.2069, "step": 28867 }, { "epoch": 0.78, "learning_rate": 0.00025227562540703475, "loss": 2.3602, "step": 28868 }, { "epoch": 0.78, "learning_rate": 0.00025221783341136406, "loss": 2.6881, "step": 28869 }, { "epoch": 0.78, "learning_rate": 0.00025216004708075723, "loss": 2.7756, "step": 28870 }, { "epoch": 0.78, "learning_rate": 0.00025210226641565216, "loss": 2.634, "step": 28871 }, { "epoch": 0.78, "learning_rate": 0.00025204449141648654, "loss": 2.2154, "step": 28872 }, { "epoch": 0.78, "learning_rate": 0.0002519867220836981, "loss": 2.7363, "step": 28873 }, { "epoch": 0.78, "learning_rate": 0.0002519289584177249, "loss": 2.1534, "step": 28874 }, { "epoch": 0.78, "learning_rate": 0.0002518712004190039, "loss": 2.4172, "step": 28875 }, { "epoch": 0.78, "learning_rate": 0.0002518134480879728, "loss": 2.5398, "step": 28876 }, { "epoch": 0.78, "learning_rate": 0.00025175570142506933, "loss": 2.252, "step": 28877 }, { "epoch": 0.78, "learning_rate": 0.0002516979604307309, "loss": 2.8013, "step": 28878 }, { "epoch": 0.78, "learning_rate": 0.00025164022510539496, "loss": 2.702, "step": 28879 }, { "epoch": 0.78, "learning_rate": 0.00025158249544949917, "loss": 2.454, "step": 28880 }, { "epoch": 0.78, "learning_rate": 0.00025152477146348027, "loss": 2.7156, "step": 28881 }, { "epoch": 0.78, "learning_rate": 0.0002514670531477762, "loss": 2.6392, "step": 28882 }, { "epoch": 0.78, "learning_rate": 0.0002514093405028236, "loss": 2.3326, "step": 28883 }, { "epoch": 0.78, "learning_rate": 0.00025135163352905997, "loss": 2.4939, "step": 28884 }, { "epoch": 0.78, "learning_rate": 0.00025129393222692254, "loss": 2.4632, "step": 28885 }, { "epoch": 0.78, "learning_rate": 0.00025123623659684845, "loss": 2.2533, "step": 28886 }, { "epoch": 0.78, "learning_rate": 0.00025117854663927477, "loss": 2.6476, "step": 28887 }, { "epoch": 0.78, "learning_rate": 0.00025112086235463884, "loss": 2.3771, "step": 28888 }, { "epoch": 0.78, "learning_rate": 0.000251063183743377, "loss": 2.4003, "step": 28889 }, { "epoch": 0.78, "learning_rate": 0.0002510055108059267, "loss": 2.5455, "step": 28890 }, { "epoch": 0.78, "learning_rate": 0.0002509478435427246, "loss": 2.4949, "step": 28891 }, { "epoch": 0.78, "learning_rate": 0.00025089018195420786, "loss": 2.5459, "step": 28892 }, { "epoch": 0.78, "learning_rate": 0.00025083252604081343, "loss": 2.4508, "step": 28893 }, { "epoch": 0.78, "learning_rate": 0.00025077487580297755, "loss": 2.4502, "step": 28894 }, { "epoch": 0.78, "learning_rate": 0.0002507172312411372, "loss": 2.2718, "step": 28895 }, { "epoch": 0.78, "learning_rate": 0.00025065959235572944, "loss": 2.6225, "step": 28896 }, { "epoch": 0.78, "learning_rate": 0.0002506019591471904, "loss": 2.2893, "step": 28897 }, { "epoch": 0.78, "learning_rate": 0.0002505443316159569, "loss": 2.9379, "step": 28898 }, { "epoch": 0.78, "learning_rate": 0.00025048670976246556, "loss": 2.3353, "step": 28899 }, { "epoch": 0.78, "learning_rate": 0.00025042909358715293, "loss": 2.4369, "step": 28900 }, { "epoch": 0.78, "learning_rate": 0.00025037148309045576, "loss": 2.2926, "step": 28901 }, { "epoch": 0.78, "learning_rate": 0.00025031387827280995, "loss": 1.8746, "step": 28902 }, { "epoch": 0.78, "learning_rate": 0.0002502562791346521, "loss": 2.2729, "step": 28903 }, { "epoch": 0.78, "learning_rate": 0.00025019868567641867, "loss": 2.2954, "step": 28904 }, { "epoch": 0.78, "learning_rate": 0.000250141097898546, "loss": 2.5075, "step": 28905 }, { "epoch": 0.78, "learning_rate": 0.0002500835158014705, "loss": 2.6854, "step": 28906 }, { "epoch": 0.78, "learning_rate": 0.000250025939385628, "loss": 2.2388, "step": 28907 }, { "epoch": 0.78, "learning_rate": 0.0002499683686514549, "loss": 2.7575, "step": 28908 }, { "epoch": 0.78, "learning_rate": 0.00024991080359938755, "loss": 2.6354, "step": 28909 }, { "epoch": 0.78, "learning_rate": 0.00024985324422986167, "loss": 2.5517, "step": 28910 }, { "epoch": 0.78, "learning_rate": 0.0002497956905433131, "loss": 2.1288, "step": 28911 }, { "epoch": 0.78, "learning_rate": 0.0002497381425401789, "loss": 2.7376, "step": 28912 }, { "epoch": 0.78, "learning_rate": 0.0002496806002208941, "loss": 2.869, "step": 28913 }, { "epoch": 0.78, "learning_rate": 0.00024962306358589494, "loss": 2.4904, "step": 28914 }, { "epoch": 0.78, "learning_rate": 0.00024956553263561756, "loss": 2.198, "step": 28915 }, { "epoch": 0.78, "learning_rate": 0.0002495080073704973, "loss": 2.5724, "step": 28916 }, { "epoch": 0.78, "learning_rate": 0.0002494504877909701, "loss": 2.3852, "step": 28917 }, { "epoch": 0.78, "learning_rate": 0.00024939297389747197, "loss": 2.7091, "step": 28918 }, { "epoch": 0.78, "learning_rate": 0.0002493354656904383, "loss": 1.9494, "step": 28919 }, { "epoch": 0.78, "learning_rate": 0.0002492779631703054, "loss": 1.7892, "step": 28920 }, { "epoch": 0.78, "learning_rate": 0.0002492204663375081, "loss": 2.3046, "step": 28921 }, { "epoch": 0.78, "learning_rate": 0.0002491629751924822, "loss": 2.1499, "step": 28922 }, { "epoch": 0.78, "learning_rate": 0.0002491054897356637, "loss": 2.0552, "step": 28923 }, { "epoch": 0.78, "learning_rate": 0.0002490480099674872, "loss": 2.611, "step": 28924 }, { "epoch": 0.78, "learning_rate": 0.00024899053588838937, "loss": 2.5174, "step": 28925 }, { "epoch": 0.78, "learning_rate": 0.0002489330674988046, "loss": 2.8288, "step": 28926 }, { "epoch": 0.78, "learning_rate": 0.0002488756047991686, "loss": 2.411, "step": 28927 }, { "epoch": 0.78, "learning_rate": 0.00024881814778991707, "loss": 2.7051, "step": 28928 }, { "epoch": 0.78, "learning_rate": 0.0002487606964714847, "loss": 2.5625, "step": 28929 }, { "epoch": 0.78, "learning_rate": 0.000248703250844307, "loss": 2.2496, "step": 28930 }, { "epoch": 0.78, "learning_rate": 0.0002486458109088191, "loss": 2.2652, "step": 28931 }, { "epoch": 0.78, "learning_rate": 0.0002485883766654562, "loss": 2.4193, "step": 28932 }, { "epoch": 0.78, "learning_rate": 0.0002485309481146537, "loss": 2.8006, "step": 28933 }, { "epoch": 0.78, "learning_rate": 0.0002484735252568461, "loss": 2.3154, "step": 28934 }, { "epoch": 0.78, "learning_rate": 0.00024841610809246873, "loss": 2.3683, "step": 28935 }, { "epoch": 0.78, "learning_rate": 0.00024835869662195685, "loss": 3.0722, "step": 28936 }, { "epoch": 0.78, "learning_rate": 0.0002483012908457445, "loss": 2.4686, "step": 28937 }, { "epoch": 0.78, "learning_rate": 0.00024824389076426746, "loss": 2.7582, "step": 28938 }, { "epoch": 0.78, "learning_rate": 0.00024818649637796067, "loss": 2.6003, "step": 28939 }, { "epoch": 0.78, "learning_rate": 0.0002481291076872583, "loss": 2.2728, "step": 28940 }, { "epoch": 0.78, "learning_rate": 0.00024807172469259553, "loss": 2.5299, "step": 28941 }, { "epoch": 0.78, "learning_rate": 0.00024801434739440677, "loss": 2.6734, "step": 28942 }, { "epoch": 0.78, "learning_rate": 0.0002479569757931268, "loss": 2.4615, "step": 28943 }, { "epoch": 0.78, "learning_rate": 0.00024789960988919036, "loss": 2.8806, "step": 28944 }, { "epoch": 0.78, "learning_rate": 0.000247842249683032, "loss": 2.2486, "step": 28945 }, { "epoch": 0.78, "learning_rate": 0.00024778489517508626, "loss": 2.6093, "step": 28946 }, { "epoch": 0.78, "learning_rate": 0.0002477275463657881, "loss": 2.2966, "step": 28947 }, { "epoch": 0.78, "learning_rate": 0.0002476702032555711, "loss": 2.6768, "step": 28948 }, { "epoch": 0.78, "learning_rate": 0.00024761286584487055, "loss": 2.6562, "step": 28949 }, { "epoch": 0.78, "learning_rate": 0.0002475555341341197, "loss": 2.4324, "step": 28950 }, { "epoch": 0.78, "learning_rate": 0.000247498208123754, "loss": 2.4355, "step": 28951 }, { "epoch": 0.78, "learning_rate": 0.0002474408878142076, "loss": 2.4197, "step": 28952 }, { "epoch": 0.78, "learning_rate": 0.0002473835732059142, "loss": 2.7278, "step": 28953 }, { "epoch": 0.78, "learning_rate": 0.00024732626429930827, "loss": 1.9069, "step": 28954 }, { "epoch": 0.78, "learning_rate": 0.0002472689610948242, "loss": 2.3562, "step": 28955 }, { "epoch": 0.78, "learning_rate": 0.0002472116635928958, "loss": 2.7159, "step": 28956 }, { "epoch": 0.78, "learning_rate": 0.0002471543717939572, "loss": 2.5262, "step": 28957 }, { "epoch": 0.78, "learning_rate": 0.00024709708569844237, "loss": 2.164, "step": 28958 }, { "epoch": 0.78, "learning_rate": 0.0002470398053067855, "loss": 2.5366, "step": 28959 }, { "epoch": 0.78, "learning_rate": 0.00024698253061942077, "loss": 2.4261, "step": 28960 }, { "epoch": 0.78, "learning_rate": 0.0002469252616367814, "loss": 2.2794, "step": 28961 }, { "epoch": 0.78, "learning_rate": 0.00024686799835930165, "loss": 2.5698, "step": 28962 }, { "epoch": 0.78, "learning_rate": 0.0002468107407874153, "loss": 2.6848, "step": 28963 }, { "epoch": 0.78, "learning_rate": 0.00024675348892155613, "loss": 2.1649, "step": 28964 }, { "epoch": 0.78, "learning_rate": 0.00024669624276215784, "loss": 2.0711, "step": 28965 }, { "epoch": 0.78, "learning_rate": 0.0002466390023096544, "loss": 2.7309, "step": 28966 }, { "epoch": 0.78, "learning_rate": 0.00024658176756447894, "loss": 2.379, "step": 28967 }, { "epoch": 0.78, "learning_rate": 0.0002465245385270656, "loss": 2.5073, "step": 28968 }, { "epoch": 0.78, "learning_rate": 0.00024646731519784737, "loss": 2.6752, "step": 28969 }, { "epoch": 0.78, "learning_rate": 0.000246410097577258, "loss": 2.2955, "step": 28970 }, { "epoch": 0.78, "learning_rate": 0.000246352885665731, "loss": 2.627, "step": 28971 }, { "epoch": 0.78, "learning_rate": 0.0002462956794636998, "loss": 2.6364, "step": 28972 }, { "epoch": 0.78, "learning_rate": 0.0002462384789715978, "loss": 2.5529, "step": 28973 }, { "epoch": 0.78, "learning_rate": 0.00024618128418985865, "loss": 2.449, "step": 28974 }, { "epoch": 0.78, "learning_rate": 0.000246124095118915, "loss": 2.5587, "step": 28975 }, { "epoch": 0.78, "learning_rate": 0.0002460669117592004, "loss": 2.3281, "step": 28976 }, { "epoch": 0.78, "learning_rate": 0.000246009734111148, "loss": 2.5425, "step": 28977 }, { "epoch": 0.78, "learning_rate": 0.00024595256217519124, "loss": 2.5568, "step": 28978 }, { "epoch": 0.78, "learning_rate": 0.00024589539595176323, "loss": 2.5558, "step": 28979 }, { "epoch": 0.78, "learning_rate": 0.0002458382354412967, "loss": 2.56, "step": 28980 }, { "epoch": 0.78, "learning_rate": 0.0002457810806442248, "loss": 2.5003, "step": 28981 }, { "epoch": 0.78, "learning_rate": 0.00024572393156098085, "loss": 2.646, "step": 28982 }, { "epoch": 0.78, "learning_rate": 0.0002456667881919973, "loss": 2.3351, "step": 28983 }, { "epoch": 0.78, "learning_rate": 0.00024560965053770724, "loss": 2.1684, "step": 28984 }, { "epoch": 0.78, "learning_rate": 0.00024555251859854357, "loss": 2.2814, "step": 28985 }, { "epoch": 0.78, "learning_rate": 0.0002454953923749392, "loss": 2.8711, "step": 28986 }, { "epoch": 0.78, "learning_rate": 0.00024543827186732716, "loss": 2.3506, "step": 28987 }, { "epoch": 0.78, "learning_rate": 0.0002453811570761395, "loss": 2.3106, "step": 28988 }, { "epoch": 0.78, "learning_rate": 0.0002453240480018094, "loss": 2.6787, "step": 28989 }, { "epoch": 0.78, "learning_rate": 0.00024526694464476926, "loss": 2.05, "step": 28990 }, { "epoch": 0.78, "learning_rate": 0.0002452098470054519, "loss": 2.4621, "step": 28991 }, { "epoch": 0.78, "learning_rate": 0.0002451527550842898, "loss": 2.9305, "step": 28992 }, { "epoch": 0.78, "learning_rate": 0.0002450956688817158, "loss": 1.887, "step": 28993 }, { "epoch": 0.78, "learning_rate": 0.0002450385883981616, "loss": 2.3056, "step": 28994 }, { "epoch": 0.78, "learning_rate": 0.00024498151363406054, "loss": 2.4275, "step": 28995 }, { "epoch": 0.78, "learning_rate": 0.0002449244445898441, "loss": 2.7256, "step": 28996 }, { "epoch": 0.78, "learning_rate": 0.0002448673812659449, "loss": 2.2659, "step": 28997 }, { "epoch": 0.78, "learning_rate": 0.0002448103236627959, "loss": 2.1072, "step": 28998 }, { "epoch": 0.78, "learning_rate": 0.00024475327178082864, "loss": 2.6347, "step": 28999 }, { "epoch": 0.78, "learning_rate": 0.00024469622562047557, "loss": 2.6663, "step": 29000 }, { "epoch": 0.78, "learning_rate": 0.0002446391851821692, "loss": 2.866, "step": 29001 }, { "epoch": 0.78, "learning_rate": 0.0002445821504663409, "loss": 2.53, "step": 29002 }, { "epoch": 0.78, "learning_rate": 0.00024452512147342333, "loss": 2.5116, "step": 29003 }, { "epoch": 0.78, "learning_rate": 0.0002444680982038482, "loss": 2.5568, "step": 29004 }, { "epoch": 0.78, "learning_rate": 0.00024441108065804783, "loss": 1.9564, "step": 29005 }, { "epoch": 0.78, "learning_rate": 0.0002443540688364543, "loss": 2.6788, "step": 29006 }, { "epoch": 0.78, "learning_rate": 0.0002442970627394988, "loss": 2.4657, "step": 29007 }, { "epoch": 0.78, "learning_rate": 0.00024424006236761374, "loss": 2.3984, "step": 29008 }, { "epoch": 0.78, "learning_rate": 0.0002441830677212312, "loss": 2.5223, "step": 29009 }, { "epoch": 0.78, "learning_rate": 0.00024412607880078198, "loss": 2.6252, "step": 29010 }, { "epoch": 0.78, "learning_rate": 0.0002440690956066991, "loss": 2.5562, "step": 29011 }, { "epoch": 0.78, "learning_rate": 0.00024401211813941326, "loss": 2.5304, "step": 29012 }, { "epoch": 0.78, "learning_rate": 0.00024395514639935644, "loss": 2.3862, "step": 29013 }, { "epoch": 0.78, "learning_rate": 0.00024389818038696054, "loss": 2.4965, "step": 29014 }, { "epoch": 0.78, "learning_rate": 0.00024384122010265652, "loss": 2.621, "step": 29015 }, { "epoch": 0.78, "learning_rate": 0.00024378426554687638, "loss": 2.2109, "step": 29016 }, { "epoch": 0.78, "learning_rate": 0.00024372731672005134, "loss": 2.2399, "step": 29017 }, { "epoch": 0.78, "learning_rate": 0.0002436703736226129, "loss": 2.5626, "step": 29018 }, { "epoch": 0.78, "learning_rate": 0.00024361343625499288, "loss": 2.744, "step": 29019 }, { "epoch": 0.78, "learning_rate": 0.0002435565046176219, "loss": 3.0467, "step": 29020 }, { "epoch": 0.78, "learning_rate": 0.00024349957871093155, "loss": 2.4352, "step": 29021 }, { "epoch": 0.78, "learning_rate": 0.00024344265853535352, "loss": 2.3863, "step": 29022 }, { "epoch": 0.78, "learning_rate": 0.0002433857440913181, "loss": 2.3208, "step": 29023 }, { "epoch": 0.78, "learning_rate": 0.0002433288353792572, "loss": 2.3353, "step": 29024 }, { "epoch": 0.78, "learning_rate": 0.0002432719323996021, "loss": 2.422, "step": 29025 }, { "epoch": 0.78, "learning_rate": 0.0002432150351527832, "loss": 2.3178, "step": 29026 }, { "epoch": 0.78, "learning_rate": 0.00024315814363923196, "loss": 2.6911, "step": 29027 }, { "epoch": 0.78, "learning_rate": 0.00024310125785937954, "loss": 2.4164, "step": 29028 }, { "epoch": 0.78, "learning_rate": 0.0002430443778136564, "loss": 2.4275, "step": 29029 }, { "epoch": 0.78, "learning_rate": 0.00024298750350249378, "loss": 2.6076, "step": 29030 }, { "epoch": 0.78, "learning_rate": 0.0002429306349263225, "loss": 2.6674, "step": 29031 }, { "epoch": 0.78, "learning_rate": 0.00024287377208557338, "loss": 2.3543, "step": 29032 }, { "epoch": 0.78, "learning_rate": 0.00024281691498067738, "loss": 2.2872, "step": 29033 }, { "epoch": 0.78, "learning_rate": 0.00024276006361206482, "loss": 2.7984, "step": 29034 }, { "epoch": 0.78, "learning_rate": 0.0002427032179801667, "loss": 2.6167, "step": 29035 }, { "epoch": 0.78, "learning_rate": 0.00024264637808541357, "loss": 2.3196, "step": 29036 }, { "epoch": 0.78, "learning_rate": 0.00024258954392823606, "loss": 2.6264, "step": 29037 }, { "epoch": 0.78, "learning_rate": 0.00024253271550906508, "loss": 2.1297, "step": 29038 }, { "epoch": 0.78, "learning_rate": 0.0002424758928283305, "loss": 2.1246, "step": 29039 }, { "epoch": 0.78, "learning_rate": 0.00024241907588646317, "loss": 2.288, "step": 29040 }, { "epoch": 0.78, "learning_rate": 0.00024236226468389365, "loss": 1.9011, "step": 29041 }, { "epoch": 0.78, "learning_rate": 0.00024230545922105195, "loss": 2.8536, "step": 29042 }, { "epoch": 0.78, "learning_rate": 0.00024224865949836838, "loss": 2.7501, "step": 29043 }, { "epoch": 0.78, "learning_rate": 0.00024219186551627405, "loss": 2.4185, "step": 29044 }, { "epoch": 0.78, "learning_rate": 0.00024213507727519835, "loss": 2.1245, "step": 29045 }, { "epoch": 0.78, "learning_rate": 0.00024207829477557207, "loss": 2.0932, "step": 29046 }, { "epoch": 0.78, "learning_rate": 0.0002420215180178249, "loss": 2.6648, "step": 29047 }, { "epoch": 0.78, "learning_rate": 0.00024196474700238714, "loss": 2.8066, "step": 29048 }, { "epoch": 0.78, "learning_rate": 0.00024190798172968897, "loss": 2.3473, "step": 29049 }, { "epoch": 0.78, "learning_rate": 0.00024185122220016044, "loss": 2.3089, "step": 29050 }, { "epoch": 0.78, "learning_rate": 0.00024179446841423135, "loss": 2.2895, "step": 29051 }, { "epoch": 0.78, "learning_rate": 0.0002417377203723322, "loss": 2.5554, "step": 29052 }, { "epoch": 0.78, "learning_rate": 0.00024168097807489232, "loss": 2.4506, "step": 29053 }, { "epoch": 0.78, "learning_rate": 0.00024162424152234196, "loss": 2.188, "step": 29054 }, { "epoch": 0.78, "learning_rate": 0.00024156751071511051, "loss": 2.4583, "step": 29055 }, { "epoch": 0.78, "learning_rate": 0.00024151078565362761, "loss": 2.4852, "step": 29056 }, { "epoch": 0.78, "learning_rate": 0.00024145406633832413, "loss": 2.5449, "step": 29057 }, { "epoch": 0.78, "learning_rate": 0.0002413973527696286, "loss": 2.2114, "step": 29058 }, { "epoch": 0.78, "learning_rate": 0.00024134064494797113, "loss": 2.5018, "step": 29059 }, { "epoch": 0.78, "learning_rate": 0.00024128394287378164, "loss": 2.6673, "step": 29060 }, { "epoch": 0.78, "learning_rate": 0.00024122724654748908, "loss": 2.3351, "step": 29061 }, { "epoch": 0.78, "learning_rate": 0.0002411705559695232, "loss": 2.3996, "step": 29062 }, { "epoch": 0.78, "learning_rate": 0.00024111387114031358, "loss": 2.4775, "step": 29063 }, { "epoch": 0.78, "learning_rate": 0.00024105719206028953, "loss": 3.2807, "step": 29064 }, { "epoch": 0.78, "learning_rate": 0.00024100051872988083, "loss": 2.2618, "step": 29065 }, { "epoch": 0.78, "learning_rate": 0.0002409438511495161, "loss": 2.4997, "step": 29066 }, { "epoch": 0.78, "learning_rate": 0.00024088718931962518, "loss": 2.7759, "step": 29067 }, { "epoch": 0.78, "learning_rate": 0.00024083053324063742, "loss": 2.1266, "step": 29068 }, { "epoch": 0.78, "learning_rate": 0.0002407738829129813, "loss": 2.6054, "step": 29069 }, { "epoch": 0.78, "learning_rate": 0.00024071723833708682, "loss": 2.4554, "step": 29070 }, { "epoch": 0.78, "learning_rate": 0.00024066059951338294, "loss": 2.4419, "step": 29071 }, { "epoch": 0.78, "learning_rate": 0.00024060396644229844, "loss": 2.5375, "step": 29072 }, { "epoch": 0.78, "learning_rate": 0.00024054733912426274, "loss": 2.3476, "step": 29073 }, { "epoch": 0.78, "learning_rate": 0.00024049071755970441, "loss": 3.0338, "step": 29074 }, { "epoch": 0.78, "learning_rate": 0.00024043410174905255, "loss": 1.9989, "step": 29075 }, { "epoch": 0.78, "learning_rate": 0.00024037749169273615, "loss": 2.4604, "step": 29076 }, { "epoch": 0.78, "learning_rate": 0.00024032088739118408, "loss": 1.9089, "step": 29077 }, { "epoch": 0.78, "learning_rate": 0.0002402642888448251, "loss": 2.5234, "step": 29078 }, { "epoch": 0.78, "learning_rate": 0.00024020769605408843, "loss": 2.6102, "step": 29079 }, { "epoch": 0.78, "learning_rate": 0.00024015110901940207, "loss": 2.5558, "step": 29080 }, { "epoch": 0.78, "learning_rate": 0.00024009452774119533, "loss": 2.8934, "step": 29081 }, { "epoch": 0.78, "learning_rate": 0.000240037952219896, "loss": 2.601, "step": 29082 }, { "epoch": 0.78, "learning_rate": 0.0002399813824559336, "loss": 2.5745, "step": 29083 }, { "epoch": 0.78, "learning_rate": 0.00023992481844973667, "loss": 2.5336, "step": 29084 }, { "epoch": 0.78, "learning_rate": 0.00023986826020173303, "loss": 2.3694, "step": 29085 }, { "epoch": 0.78, "learning_rate": 0.00023981170771235173, "loss": 2.4357, "step": 29086 }, { "epoch": 0.78, "learning_rate": 0.00023975516098202122, "loss": 2.1496, "step": 29087 }, { "epoch": 0.78, "learning_rate": 0.00023969862001116938, "loss": 2.8543, "step": 29088 }, { "epoch": 0.78, "learning_rate": 0.00023964208480022487, "loss": 2.5873, "step": 29089 }, { "epoch": 0.78, "learning_rate": 0.00023958555534961602, "loss": 2.3202, "step": 29090 }, { "epoch": 0.78, "learning_rate": 0.000239529031659771, "loss": 2.8254, "step": 29091 }, { "epoch": 0.78, "learning_rate": 0.00023947251373111845, "loss": 2.5555, "step": 29092 }, { "epoch": 0.78, "learning_rate": 0.00023941600156408583, "loss": 2.2354, "step": 29093 }, { "epoch": 0.78, "learning_rate": 0.0002393594951591016, "loss": 2.651, "step": 29094 }, { "epoch": 0.78, "learning_rate": 0.00023930299451659377, "loss": 2.2989, "step": 29095 }, { "epoch": 0.78, "learning_rate": 0.00023924649963699053, "loss": 2.4887, "step": 29096 }, { "epoch": 0.78, "learning_rate": 0.00023919001052072008, "loss": 2.5514, "step": 29097 }, { "epoch": 0.78, "learning_rate": 0.0002391335271682099, "loss": 2.1377, "step": 29098 }, { "epoch": 0.78, "learning_rate": 0.00023907704957988797, "loss": 2.7698, "step": 29099 }, { "epoch": 0.78, "learning_rate": 0.00023902057775618258, "loss": 2.5637, "step": 29100 }, { "epoch": 0.78, "learning_rate": 0.00023896411169752098, "loss": 2.4237, "step": 29101 }, { "epoch": 0.78, "learning_rate": 0.00023890765140433112, "loss": 2.2406, "step": 29102 }, { "epoch": 0.78, "learning_rate": 0.00023885119687704092, "loss": 2.2927, "step": 29103 }, { "epoch": 0.78, "learning_rate": 0.00023879474811607792, "loss": 2.4393, "step": 29104 }, { "epoch": 0.78, "learning_rate": 0.00023873830512186989, "loss": 2.7223, "step": 29105 }, { "epoch": 0.78, "learning_rate": 0.0002386818678948446, "loss": 2.4979, "step": 29106 }, { "epoch": 0.78, "learning_rate": 0.00023862543643542912, "loss": 2.5209, "step": 29107 }, { "epoch": 0.78, "learning_rate": 0.00023856901074405113, "loss": 2.5112, "step": 29108 }, { "epoch": 0.78, "learning_rate": 0.00023851259082113818, "loss": 2.191, "step": 29109 }, { "epoch": 0.78, "learning_rate": 0.00023845617666711782, "loss": 2.2298, "step": 29110 }, { "epoch": 0.78, "learning_rate": 0.0002383997682824175, "loss": 2.5963, "step": 29111 }, { "epoch": 0.78, "learning_rate": 0.00023834336566746418, "loss": 2.6865, "step": 29112 }, { "epoch": 0.78, "learning_rate": 0.00023828696882268518, "loss": 2.4097, "step": 29113 }, { "epoch": 0.78, "learning_rate": 0.00023823057774850832, "loss": 2.7887, "step": 29114 }, { "epoch": 0.78, "learning_rate": 0.0002381741924453602, "loss": 2.6563, "step": 29115 }, { "epoch": 0.78, "learning_rate": 0.00023811781291366809, "loss": 2.4778, "step": 29116 }, { "epoch": 0.78, "learning_rate": 0.00023806143915385924, "loss": 2.7798, "step": 29117 }, { "epoch": 0.78, "learning_rate": 0.0002380050711663607, "loss": 2.7821, "step": 29118 }, { "epoch": 0.78, "learning_rate": 0.00023794870895159982, "loss": 2.584, "step": 29119 }, { "epoch": 0.78, "learning_rate": 0.00023789235251000295, "loss": 2.2518, "step": 29120 }, { "epoch": 0.78, "learning_rate": 0.0002378360018419974, "loss": 2.4047, "step": 29121 }, { "epoch": 0.78, "learning_rate": 0.00023777965694801007, "loss": 2.5238, "step": 29122 }, { "epoch": 0.78, "learning_rate": 0.0002377233178284677, "loss": 2.3458, "step": 29123 }, { "epoch": 0.78, "learning_rate": 0.00023766698448379753, "loss": 2.772, "step": 29124 }, { "epoch": 0.78, "learning_rate": 0.00023761065691442574, "loss": 2.2955, "step": 29125 }, { "epoch": 0.78, "learning_rate": 0.00023755433512077928, "loss": 2.6851, "step": 29126 }, { "epoch": 0.78, "learning_rate": 0.00023749801910328517, "loss": 2.3432, "step": 29127 }, { "epoch": 0.78, "learning_rate": 0.00023744170886236938, "loss": 2.5184, "step": 29128 }, { "epoch": 0.78, "learning_rate": 0.00023738540439845868, "loss": 2.8806, "step": 29129 }, { "epoch": 0.78, "learning_rate": 0.0002373291057119803, "loss": 2.4069, "step": 29130 }, { "epoch": 0.78, "learning_rate": 0.00023727281280336, "loss": 2.7265, "step": 29131 }, { "epoch": 0.78, "learning_rate": 0.00023721652567302488, "loss": 2.7269, "step": 29132 }, { "epoch": 0.78, "learning_rate": 0.0002371602443214006, "loss": 2.2443, "step": 29133 }, { "epoch": 0.78, "learning_rate": 0.00023710396874891394, "loss": 2.6889, "step": 29134 }, { "epoch": 0.78, "learning_rate": 0.0002370476989559912, "loss": 1.9206, "step": 29135 }, { "epoch": 0.78, "learning_rate": 0.00023699143494305874, "loss": 2.5505, "step": 29136 }, { "epoch": 0.78, "learning_rate": 0.00023693517671054276, "loss": 2.514, "step": 29137 }, { "epoch": 0.78, "learning_rate": 0.00023687892425886981, "loss": 2.5991, "step": 29138 }, { "epoch": 0.78, "learning_rate": 0.00023682267758846532, "loss": 2.6574, "step": 29139 }, { "epoch": 0.78, "learning_rate": 0.00023676643669975572, "loss": 2.4753, "step": 29140 }, { "epoch": 0.78, "learning_rate": 0.0002367102015931676, "loss": 2.2279, "step": 29141 }, { "epoch": 0.78, "learning_rate": 0.00023665397226912578, "loss": 2.1568, "step": 29142 }, { "epoch": 0.78, "learning_rate": 0.00023659774872805762, "loss": 2.745, "step": 29143 }, { "epoch": 0.78, "learning_rate": 0.0002365415309703882, "loss": 2.4911, "step": 29144 }, { "epoch": 0.78, "learning_rate": 0.00023648531899654357, "loss": 2.3873, "step": 29145 }, { "epoch": 0.78, "learning_rate": 0.00023642911280695, "loss": 2.6815, "step": 29146 }, { "epoch": 0.78, "learning_rate": 0.00023637291240203274, "loss": 2.7115, "step": 29147 }, { "epoch": 0.78, "learning_rate": 0.00023631671778221765, "loss": 2.3623, "step": 29148 }, { "epoch": 0.78, "learning_rate": 0.00023626052894793059, "loss": 2.5455, "step": 29149 }, { "epoch": 0.78, "learning_rate": 0.00023620434589959727, "loss": 1.9768, "step": 29150 }, { "epoch": 0.78, "learning_rate": 0.00023614816863764355, "loss": 3.004, "step": 29151 }, { "epoch": 0.78, "learning_rate": 0.0002360919971624944, "loss": 3.0082, "step": 29152 }, { "epoch": 0.78, "learning_rate": 0.00023603583147457574, "loss": 2.6252, "step": 29153 }, { "epoch": 0.78, "learning_rate": 0.00023597967157431332, "loss": 2.3945, "step": 29154 }, { "epoch": 0.78, "learning_rate": 0.00023592351746213182, "loss": 2.5776, "step": 29155 }, { "epoch": 0.78, "learning_rate": 0.0002358673691384573, "loss": 2.4756, "step": 29156 }, { "epoch": 0.78, "learning_rate": 0.00023581122660371533, "loss": 2.2053, "step": 29157 }, { "epoch": 0.78, "learning_rate": 0.0002357550898583306, "loss": 2.6792, "step": 29158 }, { "epoch": 0.78, "learning_rate": 0.00023569895890272895, "loss": 2.4549, "step": 29159 }, { "epoch": 0.78, "learning_rate": 0.00023564283373733508, "loss": 2.5759, "step": 29160 }, { "epoch": 0.78, "learning_rate": 0.0002355867143625744, "loss": 2.7896, "step": 29161 }, { "epoch": 0.78, "learning_rate": 0.00023553060077887222, "loss": 2.2975, "step": 29162 }, { "epoch": 0.78, "learning_rate": 0.00023547449298665346, "loss": 2.5566, "step": 29163 }, { "epoch": 0.78, "learning_rate": 0.00023541839098634322, "loss": 2.7692, "step": 29164 }, { "epoch": 0.78, "learning_rate": 0.0002353622947783669, "loss": 2.3787, "step": 29165 }, { "epoch": 0.78, "learning_rate": 0.00023530620436314876, "loss": 2.3739, "step": 29166 }, { "epoch": 0.78, "learning_rate": 0.00023525011974111443, "loss": 2.1329, "step": 29167 }, { "epoch": 0.78, "learning_rate": 0.00023519404091268794, "loss": 2.6744, "step": 29168 }, { "epoch": 0.78, "learning_rate": 0.00023513796787829488, "loss": 2.5539, "step": 29169 }, { "epoch": 0.78, "learning_rate": 0.00023508190063836022, "loss": 2.5102, "step": 29170 }, { "epoch": 0.78, "learning_rate": 0.0002350258391933079, "loss": 2.7788, "step": 29171 }, { "epoch": 0.78, "learning_rate": 0.00023496978354356314, "loss": 2.1922, "step": 29172 }, { "epoch": 0.78, "learning_rate": 0.00023491373368955082, "loss": 2.0303, "step": 29173 }, { "epoch": 0.78, "learning_rate": 0.00023485768963169495, "loss": 2.335, "step": 29174 }, { "epoch": 0.78, "learning_rate": 0.00023480165137042041, "loss": 2.6694, "step": 29175 }, { "epoch": 0.78, "learning_rate": 0.00023474561890615188, "loss": 2.8589, "step": 29176 }, { "epoch": 0.78, "learning_rate": 0.00023468959223931364, "loss": 2.4547, "step": 29177 }, { "epoch": 0.78, "learning_rate": 0.00023463357137033049, "loss": 2.5959, "step": 29178 }, { "epoch": 0.78, "learning_rate": 0.0002345775562996263, "loss": 2.3369, "step": 29179 }, { "epoch": 0.78, "learning_rate": 0.00023452154702762563, "loss": 2.4738, "step": 29180 }, { "epoch": 0.78, "learning_rate": 0.0002344655435547529, "loss": 2.3122, "step": 29181 }, { "epoch": 0.78, "learning_rate": 0.00023440954588143238, "loss": 2.3298, "step": 29182 }, { "epoch": 0.78, "learning_rate": 0.00023435355400808834, "loss": 2.5473, "step": 29183 }, { "epoch": 0.78, "learning_rate": 0.00023429756793514513, "loss": 2.5475, "step": 29184 }, { "epoch": 0.78, "learning_rate": 0.00023424158766302628, "loss": 2.8217, "step": 29185 }, { "epoch": 0.78, "learning_rate": 0.0002341856131921566, "loss": 2.5897, "step": 29186 }, { "epoch": 0.78, "learning_rate": 0.0002341296445229595, "loss": 2.2203, "step": 29187 }, { "epoch": 0.78, "learning_rate": 0.0002340736816558593, "loss": 2.5721, "step": 29188 }, { "epoch": 0.78, "learning_rate": 0.0002340177245912799, "loss": 2.7725, "step": 29189 }, { "epoch": 0.78, "learning_rate": 0.00023396177332964542, "loss": 2.5249, "step": 29190 }, { "epoch": 0.78, "learning_rate": 0.00023390582787137949, "loss": 2.1203, "step": 29191 }, { "epoch": 0.78, "learning_rate": 0.00023384988821690633, "loss": 2.3187, "step": 29192 }, { "epoch": 0.78, "learning_rate": 0.00023379395436664907, "loss": 3.0286, "step": 29193 }, { "epoch": 0.78, "learning_rate": 0.00023373802632103201, "loss": 2.3132, "step": 29194 }, { "epoch": 0.78, "learning_rate": 0.00023368210408047853, "loss": 2.3849, "step": 29195 }, { "epoch": 0.78, "learning_rate": 0.00023362618764541244, "loss": 2.1974, "step": 29196 }, { "epoch": 0.78, "learning_rate": 0.00023357027701625767, "loss": 2.7563, "step": 29197 }, { "epoch": 0.78, "learning_rate": 0.0002335143721934372, "loss": 2.9302, "step": 29198 }, { "epoch": 0.78, "learning_rate": 0.00023345847317737478, "loss": 2.5211, "step": 29199 }, { "epoch": 0.78, "learning_rate": 0.00023340257996849411, "loss": 2.7067, "step": 29200 }, { "epoch": 0.78, "learning_rate": 0.00023334669256721796, "loss": 2.669, "step": 29201 }, { "epoch": 0.78, "learning_rate": 0.00023329081097397077, "loss": 2.9845, "step": 29202 }, { "epoch": 0.78, "learning_rate": 0.00023323493518917504, "loss": 2.1745, "step": 29203 }, { "epoch": 0.78, "learning_rate": 0.0002331790652132544, "loss": 2.655, "step": 29204 }, { "epoch": 0.78, "learning_rate": 0.00023312320104663232, "loss": 2.598, "step": 29205 }, { "epoch": 0.78, "learning_rate": 0.0002330673426897314, "loss": 2.7064, "step": 29206 }, { "epoch": 0.78, "learning_rate": 0.0002330114901429753, "loss": 2.3018, "step": 29207 }, { "epoch": 0.78, "learning_rate": 0.00023295564340678688, "loss": 2.4786, "step": 29208 }, { "epoch": 0.78, "learning_rate": 0.0002328998024815895, "loss": 2.5628, "step": 29209 }, { "epoch": 0.78, "learning_rate": 0.00023284396736780632, "loss": 2.4611, "step": 29210 }, { "epoch": 0.79, "learning_rate": 0.00023278813806585974, "loss": 2.9346, "step": 29211 }, { "epoch": 0.79, "learning_rate": 0.00023273231457617317, "loss": 2.2741, "step": 29212 }, { "epoch": 0.79, "learning_rate": 0.0002326764968991696, "loss": 2.9822, "step": 29213 }, { "epoch": 0.79, "learning_rate": 0.00023262068503527122, "loss": 2.2788, "step": 29214 }, { "epoch": 0.79, "learning_rate": 0.00023256487898490154, "loss": 2.3667, "step": 29215 }, { "epoch": 0.79, "learning_rate": 0.00023250907874848348, "loss": 2.6034, "step": 29216 }, { "epoch": 0.79, "learning_rate": 0.00023245328432643908, "loss": 2.6253, "step": 29217 }, { "epoch": 0.79, "learning_rate": 0.00023239749571919144, "loss": 2.9973, "step": 29218 }, { "epoch": 0.79, "learning_rate": 0.00023234171292716333, "loss": 2.7164, "step": 29219 }, { "epoch": 0.79, "learning_rate": 0.00023228593595077697, "loss": 2.0909, "step": 29220 }, { "epoch": 0.79, "learning_rate": 0.00023223016479045512, "loss": 2.5722, "step": 29221 }, { "epoch": 0.79, "learning_rate": 0.00023217439944662023, "loss": 2.251, "step": 29222 }, { "epoch": 0.79, "learning_rate": 0.00023211863991969472, "loss": 2.5248, "step": 29223 }, { "epoch": 0.79, "learning_rate": 0.0002320628862101015, "loss": 2.4042, "step": 29224 }, { "epoch": 0.79, "learning_rate": 0.00023200713831826226, "loss": 2.6778, "step": 29225 }, { "epoch": 0.79, "learning_rate": 0.0002319513962445997, "loss": 2.3112, "step": 29226 }, { "epoch": 0.79, "learning_rate": 0.00023189565998953598, "loss": 2.4462, "step": 29227 }, { "epoch": 0.79, "learning_rate": 0.0002318399295534934, "loss": 2.3296, "step": 29228 }, { "epoch": 0.79, "learning_rate": 0.00023178420493689446, "loss": 2.6513, "step": 29229 }, { "epoch": 0.79, "learning_rate": 0.00023172848614016073, "loss": 2.9332, "step": 29230 }, { "epoch": 0.79, "learning_rate": 0.0002316727731637147, "loss": 2.4712, "step": 29231 }, { "epoch": 0.79, "learning_rate": 0.00023161706600797872, "loss": 2.7074, "step": 29232 }, { "epoch": 0.79, "learning_rate": 0.00023156136467337407, "loss": 2.7242, "step": 29233 }, { "epoch": 0.79, "learning_rate": 0.00023150566916032322, "loss": 2.2225, "step": 29234 }, { "epoch": 0.79, "learning_rate": 0.00023144997946924795, "loss": 2.6046, "step": 29235 }, { "epoch": 0.79, "learning_rate": 0.00023139429560057023, "loss": 2.4335, "step": 29236 }, { "epoch": 0.79, "learning_rate": 0.0002313386175547123, "loss": 2.8513, "step": 29237 }, { "epoch": 0.79, "learning_rate": 0.00023128294533209526, "loss": 2.4413, "step": 29238 }, { "epoch": 0.79, "learning_rate": 0.0002312272789331411, "loss": 2.4625, "step": 29239 }, { "epoch": 0.79, "learning_rate": 0.00023117161835827172, "loss": 2.2845, "step": 29240 }, { "epoch": 0.79, "learning_rate": 0.00023111596360790866, "loss": 2.1283, "step": 29241 }, { "epoch": 0.79, "learning_rate": 0.00023106031468247357, "loss": 2.448, "step": 29242 }, { "epoch": 0.79, "learning_rate": 0.00023100467158238848, "loss": 2.4056, "step": 29243 }, { "epoch": 0.79, "learning_rate": 0.00023094903430807414, "loss": 2.5626, "step": 29244 }, { "epoch": 0.79, "learning_rate": 0.00023089340285995265, "loss": 2.5979, "step": 29245 }, { "epoch": 0.79, "learning_rate": 0.000230837777238445, "loss": 2.649, "step": 29246 }, { "epoch": 0.79, "learning_rate": 0.0002307821574439729, "loss": 2.7482, "step": 29247 }, { "epoch": 0.79, "learning_rate": 0.00023072654347695766, "loss": 2.3581, "step": 29248 }, { "epoch": 0.79, "learning_rate": 0.00023067093533782047, "loss": 2.9098, "step": 29249 }, { "epoch": 0.79, "learning_rate": 0.0002306153330269828, "loss": 2.5618, "step": 29250 }, { "epoch": 0.79, "learning_rate": 0.00023055973654486606, "loss": 2.5828, "step": 29251 }, { "epoch": 0.79, "learning_rate": 0.00023050414589189094, "loss": 2.3238, "step": 29252 }, { "epoch": 0.79, "learning_rate": 0.00023044856106847888, "loss": 2.1829, "step": 29253 }, { "epoch": 0.79, "learning_rate": 0.0002303929820750509, "loss": 2.9052, "step": 29254 }, { "epoch": 0.79, "learning_rate": 0.00023033740891202805, "loss": 2.4873, "step": 29255 }, { "epoch": 0.79, "learning_rate": 0.0002302818415798318, "loss": 2.5941, "step": 29256 }, { "epoch": 0.79, "learning_rate": 0.00023022628007888225, "loss": 2.1877, "step": 29257 }, { "epoch": 0.79, "learning_rate": 0.00023017072440960085, "loss": 2.7905, "step": 29258 }, { "epoch": 0.79, "learning_rate": 0.00023011517457240872, "loss": 2.8101, "step": 29259 }, { "epoch": 0.79, "learning_rate": 0.00023005963056772617, "loss": 3.0749, "step": 29260 }, { "epoch": 0.79, "learning_rate": 0.00023000409239597375, "loss": 2.3247, "step": 29261 }, { "epoch": 0.79, "learning_rate": 0.00022994856005757337, "loss": 2.5584, "step": 29262 }, { "epoch": 0.79, "learning_rate": 0.00022989303355294466, "loss": 2.17, "step": 29263 }, { "epoch": 0.79, "learning_rate": 0.000229837512882509, "loss": 2.4825, "step": 29264 }, { "epoch": 0.79, "learning_rate": 0.0002297819980466863, "loss": 2.4402, "step": 29265 }, { "epoch": 0.79, "learning_rate": 0.00022972648904589756, "loss": 2.1999, "step": 29266 }, { "epoch": 0.79, "learning_rate": 0.00022967098588056313, "loss": 2.4353, "step": 29267 }, { "epoch": 0.79, "learning_rate": 0.0002296154885511037, "loss": 2.513, "step": 29268 }, { "epoch": 0.79, "learning_rate": 0.0002295599970579395, "loss": 2.3028, "step": 29269 }, { "epoch": 0.79, "learning_rate": 0.0002295045114014913, "loss": 2.7645, "step": 29270 }, { "epoch": 0.79, "learning_rate": 0.000229449031582179, "loss": 2.6234, "step": 29271 }, { "epoch": 0.79, "learning_rate": 0.00022939355760042324, "loss": 2.4203, "step": 29272 }, { "epoch": 0.79, "learning_rate": 0.0002293380894566439, "loss": 2.4347, "step": 29273 }, { "epoch": 0.79, "learning_rate": 0.00022928262715126113, "loss": 2.6365, "step": 29274 }, { "epoch": 0.79, "learning_rate": 0.0002292271706846959, "loss": 2.4914, "step": 29275 }, { "epoch": 0.79, "learning_rate": 0.00022917172005736754, "loss": 2.6166, "step": 29276 }, { "epoch": 0.79, "learning_rate": 0.00022911627526969646, "loss": 2.7578, "step": 29277 }, { "epoch": 0.79, "learning_rate": 0.00022906083632210294, "loss": 2.875, "step": 29278 }, { "epoch": 0.79, "learning_rate": 0.0002290054032150064, "loss": 2.3975, "step": 29279 }, { "epoch": 0.79, "learning_rate": 0.00022894997594882706, "loss": 2.1037, "step": 29280 }, { "epoch": 0.79, "learning_rate": 0.00022889455452398488, "loss": 2.5907, "step": 29281 }, { "epoch": 0.79, "learning_rate": 0.0002288391389408997, "loss": 2.5445, "step": 29282 }, { "epoch": 0.79, "learning_rate": 0.00022878372919999158, "loss": 2.6897, "step": 29283 }, { "epoch": 0.79, "learning_rate": 0.00022872832530167986, "loss": 2.2659, "step": 29284 }, { "epoch": 0.79, "learning_rate": 0.00022867292724638432, "loss": 2.4352, "step": 29285 }, { "epoch": 0.79, "learning_rate": 0.0002286175350345252, "loss": 2.5469, "step": 29286 }, { "epoch": 0.79, "learning_rate": 0.00022856214866652104, "loss": 2.5453, "step": 29287 }, { "epoch": 0.79, "learning_rate": 0.00022850676814279247, "loss": 1.9073, "step": 29288 }, { "epoch": 0.79, "learning_rate": 0.00022845139346375898, "loss": 1.9789, "step": 29289 }, { "epoch": 0.79, "learning_rate": 0.00022839602462983944, "loss": 2.5512, "step": 29290 }, { "epoch": 0.79, "learning_rate": 0.00022834066164145405, "loss": 2.8594, "step": 29291 }, { "epoch": 0.79, "learning_rate": 0.0002282853044990215, "loss": 2.6337, "step": 29292 }, { "epoch": 0.79, "learning_rate": 0.00022822995320296148, "loss": 2.4818, "step": 29293 }, { "epoch": 0.79, "learning_rate": 0.00022817460775369347, "loss": 2.256, "step": 29294 }, { "epoch": 0.79, "learning_rate": 0.00022811926815163652, "loss": 2.611, "step": 29295 }, { "epoch": 0.79, "learning_rate": 0.00022806393439721008, "loss": 2.7601, "step": 29296 }, { "epoch": 0.79, "learning_rate": 0.00022800860649083355, "loss": 2.5888, "step": 29297 }, { "epoch": 0.79, "learning_rate": 0.0002279532844329254, "loss": 1.9324, "step": 29298 }, { "epoch": 0.79, "learning_rate": 0.00022789796822390553, "loss": 2.3, "step": 29299 }, { "epoch": 0.79, "learning_rate": 0.00022784265786419201, "loss": 2.4547, "step": 29300 }, { "epoch": 0.79, "learning_rate": 0.00022778735335420475, "loss": 2.515, "step": 29301 }, { "epoch": 0.79, "learning_rate": 0.00022773205469436275, "loss": 2.3263, "step": 29302 }, { "epoch": 0.79, "learning_rate": 0.00022767676188508435, "loss": 2.8183, "step": 29303 }, { "epoch": 0.79, "learning_rate": 0.00022762147492678874, "loss": 2.3666, "step": 29304 }, { "epoch": 0.79, "learning_rate": 0.00022756619381989496, "loss": 2.4936, "step": 29305 }, { "epoch": 0.79, "learning_rate": 0.00022751091856482142, "loss": 2.3874, "step": 29306 }, { "epoch": 0.79, "learning_rate": 0.0002274556491619869, "loss": 2.2889, "step": 29307 }, { "epoch": 0.79, "learning_rate": 0.0002274003856118104, "loss": 2.3196, "step": 29308 }, { "epoch": 0.79, "learning_rate": 0.0002273451279147104, "loss": 2.4296, "step": 29309 }, { "epoch": 0.79, "learning_rate": 0.00022728987607110586, "loss": 2.3344, "step": 29310 }, { "epoch": 0.79, "learning_rate": 0.00022723463008141476, "loss": 2.4742, "step": 29311 }, { "epoch": 0.79, "learning_rate": 0.00022717938994605604, "loss": 2.5189, "step": 29312 }, { "epoch": 0.79, "learning_rate": 0.00022712415566544797, "loss": 2.7121, "step": 29313 }, { "epoch": 0.79, "learning_rate": 0.00022706892724000928, "loss": 2.5434, "step": 29314 }, { "epoch": 0.79, "learning_rate": 0.00022701370467015836, "loss": 2.8329, "step": 29315 }, { "epoch": 0.79, "learning_rate": 0.00022695848795631314, "loss": 2.3165, "step": 29316 }, { "epoch": 0.79, "learning_rate": 0.00022690327709889226, "loss": 2.0275, "step": 29317 }, { "epoch": 0.79, "learning_rate": 0.00022684807209831414, "loss": 2.3738, "step": 29318 }, { "epoch": 0.79, "learning_rate": 0.0002267928729549966, "loss": 2.3143, "step": 29319 }, { "epoch": 0.79, "learning_rate": 0.00022673767966935798, "loss": 2.7881, "step": 29320 }, { "epoch": 0.79, "learning_rate": 0.00022668249224181648, "loss": 2.0178, "step": 29321 }, { "epoch": 0.79, "learning_rate": 0.0002266273106727901, "loss": 2.5107, "step": 29322 }, { "epoch": 0.79, "learning_rate": 0.00022657213496269702, "loss": 2.9616, "step": 29323 }, { "epoch": 0.79, "learning_rate": 0.0002265169651119554, "loss": 2.684, "step": 29324 }, { "epoch": 0.79, "learning_rate": 0.0002264618011209827, "loss": 2.8547, "step": 29325 }, { "epoch": 0.79, "learning_rate": 0.0002264066429901971, "loss": 2.2624, "step": 29326 }, { "epoch": 0.79, "learning_rate": 0.00022635149072001648, "loss": 2.6579, "step": 29327 }, { "epoch": 0.79, "learning_rate": 0.00022629634431085865, "loss": 2.4683, "step": 29328 }, { "epoch": 0.79, "learning_rate": 0.0002262412037631416, "loss": 2.5728, "step": 29329 }, { "epoch": 0.79, "learning_rate": 0.00022618606907728268, "loss": 2.7648, "step": 29330 }, { "epoch": 0.79, "learning_rate": 0.00022613094025369975, "loss": 2.232, "step": 29331 }, { "epoch": 0.79, "learning_rate": 0.0002260758172928107, "loss": 2.2227, "step": 29332 }, { "epoch": 0.79, "learning_rate": 0.00022602070019503263, "loss": 2.5348, "step": 29333 }, { "epoch": 0.79, "learning_rate": 0.00022596558896078334, "loss": 2.4534, "step": 29334 }, { "epoch": 0.79, "learning_rate": 0.0002259104835904804, "loss": 2.3565, "step": 29335 }, { "epoch": 0.79, "learning_rate": 0.0002258553840845412, "loss": 2.6753, "step": 29336 }, { "epoch": 0.79, "learning_rate": 0.00022580029044338347, "loss": 2.0855, "step": 29337 }, { "epoch": 0.79, "learning_rate": 0.00022574520266742404, "loss": 2.4285, "step": 29338 }, { "epoch": 0.79, "learning_rate": 0.00022569012075708062, "loss": 2.5591, "step": 29339 }, { "epoch": 0.79, "learning_rate": 0.0002256350447127703, "loss": 2.5454, "step": 29340 }, { "epoch": 0.79, "learning_rate": 0.00022557997453491054, "loss": 2.5151, "step": 29341 }, { "epoch": 0.79, "learning_rate": 0.00022552491022391862, "loss": 2.4272, "step": 29342 }, { "epoch": 0.79, "learning_rate": 0.0002254698517802114, "loss": 2.3876, "step": 29343 }, { "epoch": 0.79, "learning_rate": 0.00022541479920420594, "loss": 2.0366, "step": 29344 }, { "epoch": 0.79, "learning_rate": 0.0002253597524963198, "loss": 2.345, "step": 29345 }, { "epoch": 0.79, "learning_rate": 0.00022530471165696942, "loss": 2.6865, "step": 29346 }, { "epoch": 0.79, "learning_rate": 0.0002252496766865718, "loss": 2.6056, "step": 29347 }, { "epoch": 0.79, "learning_rate": 0.00022519464758554464, "loss": 2.0121, "step": 29348 }, { "epoch": 0.79, "learning_rate": 0.00022513962435430403, "loss": 2.9334, "step": 29349 }, { "epoch": 0.79, "learning_rate": 0.00022508460699326738, "loss": 2.2818, "step": 29350 }, { "epoch": 0.79, "learning_rate": 0.00022502959550285096, "loss": 1.8982, "step": 29351 }, { "epoch": 0.79, "learning_rate": 0.00022497458988347176, "loss": 2.5376, "step": 29352 }, { "epoch": 0.79, "learning_rate": 0.0002249195901355464, "loss": 2.6331, "step": 29353 }, { "epoch": 0.79, "learning_rate": 0.00022486459625949173, "loss": 2.5834, "step": 29354 }, { "epoch": 0.79, "learning_rate": 0.00022480960825572427, "loss": 2.2379, "step": 29355 }, { "epoch": 0.79, "learning_rate": 0.000224754626124661, "loss": 2.7881, "step": 29356 }, { "epoch": 0.79, "learning_rate": 0.00022469964986671776, "loss": 2.317, "step": 29357 }, { "epoch": 0.79, "learning_rate": 0.0002246446794823116, "loss": 2.362, "step": 29358 }, { "epoch": 0.79, "learning_rate": 0.0002245897149718582, "loss": 2.8079, "step": 29359 }, { "epoch": 0.79, "learning_rate": 0.0002245347563357747, "loss": 2.3332, "step": 29360 }, { "epoch": 0.79, "learning_rate": 0.0002244798035744776, "loss": 2.2538, "step": 29361 }, { "epoch": 0.79, "learning_rate": 0.00022442485668838254, "loss": 2.2139, "step": 29362 }, { "epoch": 0.79, "learning_rate": 0.0002243699156779062, "loss": 2.562, "step": 29363 }, { "epoch": 0.79, "learning_rate": 0.0002243149805434649, "loss": 2.8757, "step": 29364 }, { "epoch": 0.79, "learning_rate": 0.00022426005128547432, "loss": 2.8449, "step": 29365 }, { "epoch": 0.79, "learning_rate": 0.00022420512790435098, "loss": 2.5238, "step": 29366 }, { "epoch": 0.79, "learning_rate": 0.00022415021040051087, "loss": 2.6514, "step": 29367 }, { "epoch": 0.79, "learning_rate": 0.00022409529877437007, "loss": 2.4842, "step": 29368 }, { "epoch": 0.79, "learning_rate": 0.00022404039302634482, "loss": 2.5578, "step": 29369 }, { "epoch": 0.79, "learning_rate": 0.00022398549315685046, "loss": 2.6858, "step": 29370 }, { "epoch": 0.79, "learning_rate": 0.00022393059916630344, "loss": 2.5229, "step": 29371 }, { "epoch": 0.79, "learning_rate": 0.00022387571105511928, "loss": 2.7727, "step": 29372 }, { "epoch": 0.79, "learning_rate": 0.00022382082882371412, "loss": 2.5037, "step": 29373 }, { "epoch": 0.79, "learning_rate": 0.00022376595247250352, "loss": 2.5066, "step": 29374 }, { "epoch": 0.79, "learning_rate": 0.00022371108200190359, "loss": 2.3477, "step": 29375 }, { "epoch": 0.79, "learning_rate": 0.00022365621741232943, "loss": 2.3512, "step": 29376 }, { "epoch": 0.79, "learning_rate": 0.00022360135870419718, "loss": 2.6415, "step": 29377 }, { "epoch": 0.79, "learning_rate": 0.00022354650587792202, "loss": 3.3671, "step": 29378 }, { "epoch": 0.79, "learning_rate": 0.00022349165893391975, "loss": 1.9675, "step": 29379 }, { "epoch": 0.79, "learning_rate": 0.00022343681787260583, "loss": 2.7157, "step": 29380 }, { "epoch": 0.79, "learning_rate": 0.0002233819826943957, "loss": 2.4554, "step": 29381 }, { "epoch": 0.79, "learning_rate": 0.00022332715339970477, "loss": 2.7627, "step": 29382 }, { "epoch": 0.79, "learning_rate": 0.00022327232998894887, "loss": 2.136, "step": 29383 }, { "epoch": 0.79, "learning_rate": 0.00022321751246254262, "loss": 2.9043, "step": 29384 }, { "epoch": 0.79, "learning_rate": 0.0002231627008209016, "loss": 2.624, "step": 29385 }, { "epoch": 0.79, "learning_rate": 0.00022310789506444108, "loss": 2.7092, "step": 29386 }, { "epoch": 0.79, "learning_rate": 0.0002230530951935762, "loss": 2.759, "step": 29387 }, { "epoch": 0.79, "learning_rate": 0.00022299830120872246, "loss": 2.4555, "step": 29388 }, { "epoch": 0.79, "learning_rate": 0.00022294351311029448, "loss": 2.5574, "step": 29389 }, { "epoch": 0.79, "learning_rate": 0.0002228887308987074, "loss": 2.2721, "step": 29390 }, { "epoch": 0.79, "learning_rate": 0.0002228339545743767, "loss": 2.8979, "step": 29391 }, { "epoch": 0.79, "learning_rate": 0.0002227791841377168, "loss": 2.7433, "step": 29392 }, { "epoch": 0.79, "learning_rate": 0.0002227244195891428, "loss": 2.5526, "step": 29393 }, { "epoch": 0.79, "learning_rate": 0.0002226696609290696, "loss": 2.3594, "step": 29394 }, { "epoch": 0.79, "learning_rate": 0.00022261490815791206, "loss": 2.2127, "step": 29395 }, { "epoch": 0.79, "learning_rate": 0.00022256016127608535, "loss": 2.5327, "step": 29396 }, { "epoch": 0.79, "learning_rate": 0.00022250542028400355, "loss": 2.6475, "step": 29397 }, { "epoch": 0.79, "learning_rate": 0.00022245068518208166, "loss": 2.8952, "step": 29398 }, { "epoch": 0.79, "learning_rate": 0.00022239595597073436, "loss": 2.4085, "step": 29399 }, { "epoch": 0.79, "learning_rate": 0.00022234123265037632, "loss": 2.307, "step": 29400 }, { "epoch": 0.79, "learning_rate": 0.00022228651522142206, "loss": 2.7889, "step": 29401 }, { "epoch": 0.79, "learning_rate": 0.00022223180368428642, "loss": 2.4591, "step": 29402 }, { "epoch": 0.79, "learning_rate": 0.00022217709803938325, "loss": 2.207, "step": 29403 }, { "epoch": 0.79, "learning_rate": 0.00022212239828712753, "loss": 2.7185, "step": 29404 }, { "epoch": 0.79, "learning_rate": 0.00022206770442793333, "loss": 3.0241, "step": 29405 }, { "epoch": 0.79, "learning_rate": 0.00022201301646221472, "loss": 2.7856, "step": 29406 }, { "epoch": 0.79, "learning_rate": 0.00022195833439038703, "loss": 2.1498, "step": 29407 }, { "epoch": 0.79, "learning_rate": 0.00022190365821286363, "loss": 2.4277, "step": 29408 }, { "epoch": 0.79, "learning_rate": 0.00022184898793005904, "loss": 2.2066, "step": 29409 }, { "epoch": 0.79, "learning_rate": 0.0002217943235423876, "loss": 2.2861, "step": 29410 }, { "epoch": 0.79, "learning_rate": 0.0002217396650502629, "loss": 2.7186, "step": 29411 }, { "epoch": 0.79, "learning_rate": 0.00022168501245409944, "loss": 2.5209, "step": 29412 }, { "epoch": 0.79, "learning_rate": 0.00022163036575431117, "loss": 2.8079, "step": 29413 }, { "epoch": 0.79, "learning_rate": 0.00022157572495131207, "loss": 2.1396, "step": 29414 }, { "epoch": 0.79, "learning_rate": 0.00022152109004551645, "loss": 2.2809, "step": 29415 }, { "epoch": 0.79, "learning_rate": 0.0002214664610373376, "loss": 2.6471, "step": 29416 }, { "epoch": 0.79, "learning_rate": 0.00022141183792718955, "loss": 2.7422, "step": 29417 }, { "epoch": 0.79, "learning_rate": 0.00022135722071548648, "loss": 2.3182, "step": 29418 }, { "epoch": 0.79, "learning_rate": 0.00022130260940264146, "loss": 2.4604, "step": 29419 }, { "epoch": 0.79, "learning_rate": 0.0002212480039890692, "loss": 2.5726, "step": 29420 }, { "epoch": 0.79, "learning_rate": 0.00022119340447518244, "loss": 2.7877, "step": 29421 }, { "epoch": 0.79, "learning_rate": 0.00022113881086139532, "loss": 2.5366, "step": 29422 }, { "epoch": 0.79, "learning_rate": 0.00022108422314812148, "loss": 2.3554, "step": 29423 }, { "epoch": 0.79, "learning_rate": 0.0002210296413357742, "loss": 2.4419, "step": 29424 }, { "epoch": 0.79, "learning_rate": 0.00022097506542476697, "loss": 2.4674, "step": 29425 }, { "epoch": 0.79, "learning_rate": 0.0002209204954155134, "loss": 2.5454, "step": 29426 }, { "epoch": 0.79, "learning_rate": 0.0002208659313084269, "loss": 2.66, "step": 29427 }, { "epoch": 0.79, "learning_rate": 0.0002208113731039211, "loss": 2.2226, "step": 29428 }, { "epoch": 0.79, "learning_rate": 0.00022075682080240866, "loss": 2.274, "step": 29429 }, { "epoch": 0.79, "learning_rate": 0.00022070227440430324, "loss": 2.4307, "step": 29430 }, { "epoch": 0.79, "learning_rate": 0.00022064773391001835, "loss": 2.6337, "step": 29431 }, { "epoch": 0.79, "learning_rate": 0.00022059319931996648, "loss": 2.1793, "step": 29432 }, { "epoch": 0.79, "learning_rate": 0.00022053867063456133, "loss": 2.8458, "step": 29433 }, { "epoch": 0.79, "learning_rate": 0.0002204841478542161, "loss": 2.9013, "step": 29434 }, { "epoch": 0.79, "learning_rate": 0.00022042963097934344, "loss": 2.6983, "step": 29435 }, { "epoch": 0.79, "learning_rate": 0.00022037512001035642, "loss": 2.3299, "step": 29436 }, { "epoch": 0.79, "learning_rate": 0.00022032061494766842, "loss": 2.2922, "step": 29437 }, { "epoch": 0.79, "learning_rate": 0.00022026611579169177, "loss": 2.3057, "step": 29438 }, { "epoch": 0.79, "learning_rate": 0.00022021162254283965, "loss": 2.0502, "step": 29439 }, { "epoch": 0.79, "learning_rate": 0.0002201571352015248, "loss": 2.6914, "step": 29440 }, { "epoch": 0.79, "learning_rate": 0.0002201026537681602, "loss": 2.0283, "step": 29441 }, { "epoch": 0.79, "learning_rate": 0.0002200481782431586, "loss": 2.0769, "step": 29442 }, { "epoch": 0.79, "learning_rate": 0.00021999370862693237, "loss": 2.7036, "step": 29443 }, { "epoch": 0.79, "learning_rate": 0.00021993924491989426, "loss": 2.4203, "step": 29444 }, { "epoch": 0.79, "learning_rate": 0.00021988478712245708, "loss": 2.3642, "step": 29445 }, { "epoch": 0.79, "learning_rate": 0.00021983033523503327, "loss": 2.7148, "step": 29446 }, { "epoch": 0.79, "learning_rate": 0.0002197758892580356, "loss": 2.1353, "step": 29447 }, { "epoch": 0.79, "learning_rate": 0.00021972144919187598, "loss": 1.9487, "step": 29448 }, { "epoch": 0.79, "learning_rate": 0.00021966701503696716, "loss": 2.7396, "step": 29449 }, { "epoch": 0.79, "learning_rate": 0.00021961258679372187, "loss": 2.5752, "step": 29450 }, { "epoch": 0.79, "learning_rate": 0.00021955816446255183, "loss": 2.3351, "step": 29451 }, { "epoch": 0.79, "learning_rate": 0.0002195037480438695, "loss": 2.5915, "step": 29452 }, { "epoch": 0.79, "learning_rate": 0.00021944933753808738, "loss": 2.4938, "step": 29453 }, { "epoch": 0.79, "learning_rate": 0.00021939493294561741, "loss": 2.1072, "step": 29454 }, { "epoch": 0.79, "learning_rate": 0.00021934053426687217, "loss": 2.6821, "step": 29455 }, { "epoch": 0.79, "learning_rate": 0.00021928614150226324, "loss": 2.2106, "step": 29456 }, { "epoch": 0.79, "learning_rate": 0.0002192317546522029, "loss": 2.3283, "step": 29457 }, { "epoch": 0.79, "learning_rate": 0.00021917737371710322, "loss": 2.5599, "step": 29458 }, { "epoch": 0.79, "learning_rate": 0.00021912299869737616, "loss": 2.575, "step": 29459 }, { "epoch": 0.79, "learning_rate": 0.00021906862959343365, "loss": 2.4247, "step": 29460 }, { "epoch": 0.79, "learning_rate": 0.00021901426640568778, "loss": 2.39, "step": 29461 }, { "epoch": 0.79, "learning_rate": 0.00021895990913455, "loss": 2.4766, "step": 29462 }, { "epoch": 0.79, "learning_rate": 0.00021890555778043263, "loss": 2.3902, "step": 29463 }, { "epoch": 0.79, "learning_rate": 0.00021885121234374672, "loss": 2.3485, "step": 29464 }, { "epoch": 0.79, "learning_rate": 0.00021879687282490447, "loss": 2.2675, "step": 29465 }, { "epoch": 0.79, "learning_rate": 0.00021874253922431742, "loss": 2.7854, "step": 29466 }, { "epoch": 0.79, "learning_rate": 0.00021868821154239716, "loss": 2.6979, "step": 29467 }, { "epoch": 0.79, "learning_rate": 0.00021863388977955535, "loss": 2.5747, "step": 29468 }, { "epoch": 0.79, "learning_rate": 0.00021857957393620376, "loss": 2.6483, "step": 29469 }, { "epoch": 0.79, "learning_rate": 0.0002185252640127534, "loss": 2.5682, "step": 29470 }, { "epoch": 0.79, "learning_rate": 0.00021847096000961587, "loss": 2.6668, "step": 29471 }, { "epoch": 0.79, "learning_rate": 0.00021841666192720267, "loss": 2.274, "step": 29472 }, { "epoch": 0.79, "learning_rate": 0.00021836236976592504, "loss": 2.978, "step": 29473 }, { "epoch": 0.79, "learning_rate": 0.00021830808352619468, "loss": 2.3209, "step": 29474 }, { "epoch": 0.79, "learning_rate": 0.00021825380320842226, "loss": 2.3282, "step": 29475 }, { "epoch": 0.79, "learning_rate": 0.0002181995288130192, "loss": 2.3659, "step": 29476 }, { "epoch": 0.79, "learning_rate": 0.00021814526034039705, "loss": 2.7686, "step": 29477 }, { "epoch": 0.79, "learning_rate": 0.0002180909977909664, "loss": 2.6034, "step": 29478 }, { "epoch": 0.79, "learning_rate": 0.00021803674116513817, "loss": 2.4304, "step": 29479 }, { "epoch": 0.79, "learning_rate": 0.00021798249046332441, "loss": 1.9737, "step": 29480 }, { "epoch": 0.79, "learning_rate": 0.00021792824568593526, "loss": 2.3696, "step": 29481 }, { "epoch": 0.79, "learning_rate": 0.0002178740068333821, "loss": 2.7032, "step": 29482 }, { "epoch": 0.79, "learning_rate": 0.00021781977390607544, "loss": 2.2043, "step": 29483 }, { "epoch": 0.79, "learning_rate": 0.00021776554690442618, "loss": 2.2849, "step": 29484 }, { "epoch": 0.79, "learning_rate": 0.00021771132582884545, "loss": 2.5534, "step": 29485 }, { "epoch": 0.79, "learning_rate": 0.0002176571106797437, "loss": 1.9194, "step": 29486 }, { "epoch": 0.79, "learning_rate": 0.00021760290145753192, "loss": 2.2696, "step": 29487 }, { "epoch": 0.79, "learning_rate": 0.0002175486981626209, "loss": 2.8285, "step": 29488 }, { "epoch": 0.79, "learning_rate": 0.00021749450079542088, "loss": 2.381, "step": 29489 }, { "epoch": 0.79, "learning_rate": 0.00021744030935634285, "loss": 2.2387, "step": 29490 }, { "epoch": 0.79, "learning_rate": 0.0002173861238457968, "loss": 1.995, "step": 29491 }, { "epoch": 0.79, "learning_rate": 0.00021733194426419334, "loss": 2.6666, "step": 29492 }, { "epoch": 0.79, "learning_rate": 0.00021727777061194366, "loss": 2.4063, "step": 29493 }, { "epoch": 0.79, "learning_rate": 0.0002172236028894573, "loss": 2.3173, "step": 29494 }, { "epoch": 0.79, "learning_rate": 0.0002171694410971451, "loss": 2.46, "step": 29495 }, { "epoch": 0.79, "learning_rate": 0.00021711528523541746, "loss": 2.3592, "step": 29496 }, { "epoch": 0.79, "learning_rate": 0.00021706113530468418, "loss": 2.7396, "step": 29497 }, { "epoch": 0.79, "learning_rate": 0.00021700699130535584, "loss": 2.9709, "step": 29498 }, { "epoch": 0.79, "learning_rate": 0.00021695285323784254, "loss": 2.6045, "step": 29499 }, { "epoch": 0.79, "learning_rate": 0.0002168987211025544, "loss": 2.3229, "step": 29500 }, { "epoch": 0.79, "learning_rate": 0.00021684459489990172, "loss": 2.2672, "step": 29501 }, { "epoch": 0.79, "learning_rate": 0.00021679047463029423, "loss": 2.4532, "step": 29502 }, { "epoch": 0.79, "learning_rate": 0.00021673636029414202, "loss": 2.09, "step": 29503 }, { "epoch": 0.79, "learning_rate": 0.0002166822518918553, "loss": 2.2825, "step": 29504 }, { "epoch": 0.79, "learning_rate": 0.00021662814942384346, "loss": 2.5189, "step": 29505 }, { "epoch": 0.79, "learning_rate": 0.00021657405289051714, "loss": 2.6936, "step": 29506 }, { "epoch": 0.79, "learning_rate": 0.00021651996229228544, "loss": 2.941, "step": 29507 }, { "epoch": 0.79, "learning_rate": 0.00021646587762955838, "loss": 2.821, "step": 29508 }, { "epoch": 0.79, "learning_rate": 0.00021641179890274608, "loss": 2.789, "step": 29509 }, { "epoch": 0.79, "learning_rate": 0.00021635772611225767, "loss": 2.4484, "step": 29510 }, { "epoch": 0.79, "learning_rate": 0.00021630365925850303, "loss": 2.4636, "step": 29511 }, { "epoch": 0.79, "learning_rate": 0.0002162495983418916, "loss": 2.092, "step": 29512 }, { "epoch": 0.79, "learning_rate": 0.00021619554336283332, "loss": 2.4446, "step": 29513 }, { "epoch": 0.79, "learning_rate": 0.00021614149432173734, "loss": 2.2788, "step": 29514 }, { "epoch": 0.79, "learning_rate": 0.00021608745121901352, "loss": 2.2344, "step": 29515 }, { "epoch": 0.79, "learning_rate": 0.00021603341405507083, "loss": 2.5341, "step": 29516 }, { "epoch": 0.79, "learning_rate": 0.00021597938283031903, "loss": 2.4724, "step": 29517 }, { "epoch": 0.79, "learning_rate": 0.00021592535754516674, "loss": 2.4086, "step": 29518 }, { "epoch": 0.79, "learning_rate": 0.00021587133820002402, "loss": 2.291, "step": 29519 }, { "epoch": 0.79, "learning_rate": 0.00021581732479530015, "loss": 2.03, "step": 29520 }, { "epoch": 0.79, "learning_rate": 0.00021576331733140375, "loss": 2.3913, "step": 29521 }, { "epoch": 0.79, "learning_rate": 0.0002157093158087442, "loss": 2.3974, "step": 29522 }, { "epoch": 0.79, "learning_rate": 0.00021565532022773092, "loss": 2.6192, "step": 29523 }, { "epoch": 0.79, "learning_rate": 0.00021560133058877253, "loss": 2.205, "step": 29524 }, { "epoch": 0.79, "learning_rate": 0.00021554734689227818, "loss": 2.5621, "step": 29525 }, { "epoch": 0.79, "learning_rate": 0.0002154933691386569, "loss": 2.2583, "step": 29526 }, { "epoch": 0.79, "learning_rate": 0.0002154393973283175, "loss": 2.3808, "step": 29527 }, { "epoch": 0.79, "learning_rate": 0.00021538543146166933, "loss": 2.5184, "step": 29528 }, { "epoch": 0.79, "learning_rate": 0.00021533147153912058, "loss": 2.1843, "step": 29529 }, { "epoch": 0.79, "learning_rate": 0.00021527751756108028, "loss": 2.6212, "step": 29530 }, { "epoch": 0.79, "learning_rate": 0.0002152235695279573, "loss": 2.4718, "step": 29531 }, { "epoch": 0.79, "learning_rate": 0.0002151696274401601, "loss": 2.3909, "step": 29532 }, { "epoch": 0.79, "learning_rate": 0.00021511569129809783, "loss": 2.1548, "step": 29533 }, { "epoch": 0.79, "learning_rate": 0.00021506176110217858, "loss": 2.394, "step": 29534 }, { "epoch": 0.79, "learning_rate": 0.000215007836852811, "loss": 2.5346, "step": 29535 }, { "epoch": 0.79, "learning_rate": 0.0002149539185504039, "loss": 2.488, "step": 29536 }, { "epoch": 0.79, "learning_rate": 0.00021490000619536542, "loss": 2.5294, "step": 29537 }, { "epoch": 0.79, "learning_rate": 0.00021484609978810387, "loss": 2.4415, "step": 29538 }, { "epoch": 0.79, "learning_rate": 0.00021479219932902838, "loss": 2.5465, "step": 29539 }, { "epoch": 0.79, "learning_rate": 0.0002147383048185465, "loss": 2.3665, "step": 29540 }, { "epoch": 0.79, "learning_rate": 0.00021468441625706715, "loss": 2.3209, "step": 29541 }, { "epoch": 0.79, "learning_rate": 0.00021463053364499795, "loss": 2.3614, "step": 29542 }, { "epoch": 0.79, "learning_rate": 0.00021457665698274743, "loss": 2.2814, "step": 29543 }, { "epoch": 0.79, "learning_rate": 0.00021452278627072374, "loss": 2.5828, "step": 29544 }, { "epoch": 0.79, "learning_rate": 0.00021446892150933506, "loss": 2.7786, "step": 29545 }, { "epoch": 0.79, "learning_rate": 0.00021441506269898936, "loss": 2.6378, "step": 29546 }, { "epoch": 0.79, "learning_rate": 0.0002143612098400949, "loss": 2.4438, "step": 29547 }, { "epoch": 0.79, "learning_rate": 0.00021430736293305918, "loss": 2.3712, "step": 29548 }, { "epoch": 0.79, "learning_rate": 0.0002142535219782905, "loss": 2.8202, "step": 29549 }, { "epoch": 0.79, "learning_rate": 0.00021419968697619697, "loss": 2.2421, "step": 29550 }, { "epoch": 0.79, "learning_rate": 0.00021414585792718543, "loss": 2.5817, "step": 29551 }, { "epoch": 0.79, "learning_rate": 0.00021409203483166496, "loss": 2.2645, "step": 29552 }, { "epoch": 0.79, "learning_rate": 0.0002140382176900425, "loss": 2.6505, "step": 29553 }, { "epoch": 0.79, "learning_rate": 0.000213984406502726, "loss": 2.2345, "step": 29554 }, { "epoch": 0.79, "learning_rate": 0.00021393060127012332, "loss": 2.3753, "step": 29555 }, { "epoch": 0.79, "learning_rate": 0.0002138768019926416, "loss": 2.6912, "step": 29556 }, { "epoch": 0.79, "learning_rate": 0.0002138230086706887, "loss": 2.2435, "step": 29557 }, { "epoch": 0.79, "learning_rate": 0.00021376922130467214, "loss": 2.5744, "step": 29558 }, { "epoch": 0.79, "learning_rate": 0.00021371543989499942, "loss": 2.145, "step": 29559 }, { "epoch": 0.79, "learning_rate": 0.00021366166444207813, "loss": 2.4633, "step": 29560 }, { "epoch": 0.79, "learning_rate": 0.00021360789494631526, "loss": 2.3579, "step": 29561 }, { "epoch": 0.79, "learning_rate": 0.0002135541314081185, "loss": 2.5864, "step": 29562 }, { "epoch": 0.79, "learning_rate": 0.00021350037382789522, "loss": 2.3477, "step": 29563 }, { "epoch": 0.79, "learning_rate": 0.00021344662220605193, "loss": 2.5762, "step": 29564 }, { "epoch": 0.79, "learning_rate": 0.00021339287654299665, "loss": 2.6169, "step": 29565 }, { "epoch": 0.79, "learning_rate": 0.00021333913683913665, "loss": 1.9534, "step": 29566 }, { "epoch": 0.79, "learning_rate": 0.00021328540309487843, "loss": 2.4848, "step": 29567 }, { "epoch": 0.79, "learning_rate": 0.00021323167531062958, "loss": 2.4139, "step": 29568 }, { "epoch": 0.79, "learning_rate": 0.0002131779534867966, "loss": 2.6384, "step": 29569 }, { "epoch": 0.79, "learning_rate": 0.00021312423762378686, "loss": 2.5266, "step": 29570 }, { "epoch": 0.79, "learning_rate": 0.0002130705277220071, "loss": 2.364, "step": 29571 }, { "epoch": 0.79, "learning_rate": 0.00021301682378186437, "loss": 2.7329, "step": 29572 }, { "epoch": 0.79, "learning_rate": 0.00021296312580376553, "loss": 2.0766, "step": 29573 }, { "epoch": 0.79, "learning_rate": 0.00021290943378811768, "loss": 2.5222, "step": 29574 }, { "epoch": 0.79, "learning_rate": 0.00021285574773532678, "loss": 2.7881, "step": 29575 }, { "epoch": 0.79, "learning_rate": 0.00021280206764580045, "loss": 2.2988, "step": 29576 }, { "epoch": 0.79, "learning_rate": 0.00021274839351994424, "loss": 2.6955, "step": 29577 }, { "epoch": 0.79, "learning_rate": 0.00021269472535816582, "loss": 2.2013, "step": 29578 }, { "epoch": 0.79, "learning_rate": 0.00021264106316087162, "loss": 2.4977, "step": 29579 }, { "epoch": 0.79, "learning_rate": 0.00021258740692846779, "loss": 2.0156, "step": 29580 }, { "epoch": 0.79, "learning_rate": 0.00021253375666136087, "loss": 2.4839, "step": 29581 }, { "epoch": 0.79, "learning_rate": 0.0002124801123599578, "loss": 2.2353, "step": 29582 }, { "epoch": 0.8, "learning_rate": 0.0002124264740246642, "loss": 2.3981, "step": 29583 }, { "epoch": 0.8, "learning_rate": 0.0002123728416558869, "loss": 2.7627, "step": 29584 }, { "epoch": 0.8, "learning_rate": 0.0002123192152540322, "loss": 2.4687, "step": 29585 }, { "epoch": 0.8, "learning_rate": 0.00021226559481950626, "loss": 2.9471, "step": 29586 }, { "epoch": 0.8, "learning_rate": 0.0002122119803527155, "loss": 2.1422, "step": 29587 }, { "epoch": 0.8, "learning_rate": 0.0002121583718540657, "loss": 2.5408, "step": 29588 }, { "epoch": 0.8, "learning_rate": 0.00021210476932396338, "loss": 2.7221, "step": 29589 }, { "epoch": 0.8, "learning_rate": 0.00021205117276281427, "loss": 2.565, "step": 29590 }, { "epoch": 0.8, "learning_rate": 0.00021199758217102472, "loss": 2.5097, "step": 29591 }, { "epoch": 0.8, "learning_rate": 0.00021194399754900062, "loss": 2.0275, "step": 29592 }, { "epoch": 0.8, "learning_rate": 0.0002118904188971481, "loss": 1.7922, "step": 29593 }, { "epoch": 0.8, "learning_rate": 0.00021183684621587262, "loss": 2.5022, "step": 29594 }, { "epoch": 0.8, "learning_rate": 0.00021178327950558052, "loss": 2.7315, "step": 29595 }, { "epoch": 0.8, "learning_rate": 0.00021172971876667724, "loss": 2.6304, "step": 29596 }, { "epoch": 0.8, "learning_rate": 0.00021167616399956856, "loss": 2.2802, "step": 29597 }, { "epoch": 0.8, "learning_rate": 0.00021162261520466031, "loss": 2.5068, "step": 29598 }, { "epoch": 0.8, "learning_rate": 0.00021156907238235824, "loss": 2.3648, "step": 29599 }, { "epoch": 0.8, "learning_rate": 0.0002115155355330679, "loss": 2.3564, "step": 29600 }, { "epoch": 0.8, "learning_rate": 0.0002114620046571951, "loss": 2.869, "step": 29601 }, { "epoch": 0.8, "learning_rate": 0.000211408479755145, "loss": 2.4886, "step": 29602 }, { "epoch": 0.8, "learning_rate": 0.0002113549608273232, "loss": 2.5076, "step": 29603 }, { "epoch": 0.8, "learning_rate": 0.0002113014478741353, "loss": 2.5161, "step": 29604 }, { "epoch": 0.8, "learning_rate": 0.00021124794089598652, "loss": 2.6585, "step": 29605 }, { "epoch": 0.8, "learning_rate": 0.00021119443989328269, "loss": 2.3557, "step": 29606 }, { "epoch": 0.8, "learning_rate": 0.00021114094486642844, "loss": 2.1674, "step": 29607 }, { "epoch": 0.8, "learning_rate": 0.00021108745581582933, "loss": 2.1519, "step": 29608 }, { "epoch": 0.8, "learning_rate": 0.00021103397274189095, "loss": 2.9001, "step": 29609 }, { "epoch": 0.8, "learning_rate": 0.00021098049564501786, "loss": 2.6038, "step": 29610 }, { "epoch": 0.8, "learning_rate": 0.00021092702452561542, "loss": 2.1719, "step": 29611 }, { "epoch": 0.8, "learning_rate": 0.0002108735593840888, "loss": 2.1798, "step": 29612 }, { "epoch": 0.8, "learning_rate": 0.0002108201002208431, "loss": 2.3074, "step": 29613 }, { "epoch": 0.8, "learning_rate": 0.00021076664703628334, "loss": 2.7202, "step": 29614 }, { "epoch": 0.8, "learning_rate": 0.00021071319983081415, "loss": 2.178, "step": 29615 }, { "epoch": 0.8, "learning_rate": 0.00021065975860484065, "loss": 2.4971, "step": 29616 }, { "epoch": 0.8, "learning_rate": 0.00021060632335876772, "loss": 2.6727, "step": 29617 }, { "epoch": 0.8, "learning_rate": 0.00021055289409300016, "loss": 2.5928, "step": 29618 }, { "epoch": 0.8, "learning_rate": 0.00021049947080794296, "loss": 2.6627, "step": 29619 }, { "epoch": 0.8, "learning_rate": 0.00021044605350400037, "loss": 1.9658, "step": 29620 }, { "epoch": 0.8, "learning_rate": 0.00021039264218157728, "loss": 2.7249, "step": 29621 }, { "epoch": 0.8, "learning_rate": 0.00021033923684107868, "loss": 2.1844, "step": 29622 }, { "epoch": 0.8, "learning_rate": 0.00021028583748290865, "loss": 2.5092, "step": 29623 }, { "epoch": 0.8, "learning_rate": 0.00021023244410747156, "loss": 2.2647, "step": 29624 }, { "epoch": 0.8, "learning_rate": 0.0002101790567151728, "loss": 2.6425, "step": 29625 }, { "epoch": 0.8, "learning_rate": 0.000210125675306416, "loss": 2.3119, "step": 29626 }, { "epoch": 0.8, "learning_rate": 0.00021007229988160604, "loss": 2.5173, "step": 29627 }, { "epoch": 0.8, "learning_rate": 0.00021001893044114716, "loss": 2.4388, "step": 29628 }, { "epoch": 0.8, "learning_rate": 0.00020996556698544357, "loss": 2.3602, "step": 29629 }, { "epoch": 0.8, "learning_rate": 0.0002099122095148994, "loss": 2.2515, "step": 29630 }, { "epoch": 0.8, "learning_rate": 0.00020985885802991922, "loss": 2.5482, "step": 29631 }, { "epoch": 0.8, "learning_rate": 0.00020980551253090707, "loss": 2.2711, "step": 29632 }, { "epoch": 0.8, "learning_rate": 0.0002097521730182673, "loss": 2.7171, "step": 29633 }, { "epoch": 0.8, "learning_rate": 0.00020969883949240354, "loss": 2.5731, "step": 29634 }, { "epoch": 0.8, "learning_rate": 0.00020964551195372006, "loss": 2.584, "step": 29635 }, { "epoch": 0.8, "learning_rate": 0.00020959219040262111, "loss": 1.9223, "step": 29636 }, { "epoch": 0.8, "learning_rate": 0.00020953887483950983, "loss": 2.7447, "step": 29637 }, { "epoch": 0.8, "learning_rate": 0.00020948556526479133, "loss": 2.5779, "step": 29638 }, { "epoch": 0.8, "learning_rate": 0.00020943226167886863, "loss": 2.999, "step": 29639 }, { "epoch": 0.8, "learning_rate": 0.00020937896408214574, "loss": 2.2432, "step": 29640 }, { "epoch": 0.8, "learning_rate": 0.00020932567247502676, "loss": 2.8326, "step": 29641 }, { "epoch": 0.8, "learning_rate": 0.00020927238685791483, "loss": 2.7205, "step": 29642 }, { "epoch": 0.8, "learning_rate": 0.00020921910723121394, "loss": 2.2203, "step": 29643 }, { "epoch": 0.8, "learning_rate": 0.0002091658335953277, "loss": 2.1477, "step": 29644 }, { "epoch": 0.8, "learning_rate": 0.00020911256595065975, "loss": 2.7103, "step": 29645 }, { "epoch": 0.8, "learning_rate": 0.00020905930429761376, "loss": 3.0056, "step": 29646 }, { "epoch": 0.8, "learning_rate": 0.0002090060486365929, "loss": 2.3584, "step": 29647 }, { "epoch": 0.8, "learning_rate": 0.0002089527989680008, "loss": 2.5426, "step": 29648 }, { "epoch": 0.8, "learning_rate": 0.00020889955529224114, "loss": 2.3141, "step": 29649 }, { "epoch": 0.8, "learning_rate": 0.00020884631760971652, "loss": 2.4774, "step": 29650 }, { "epoch": 0.8, "learning_rate": 0.0002087930859208309, "loss": 2.3601, "step": 29651 }, { "epoch": 0.8, "learning_rate": 0.0002087398602259878, "loss": 2.5363, "step": 29652 }, { "epoch": 0.8, "learning_rate": 0.0002086866405255897, "loss": 2.6328, "step": 29653 }, { "epoch": 0.8, "learning_rate": 0.0002086334268200404, "loss": 2.052, "step": 29654 }, { "epoch": 0.8, "learning_rate": 0.00020858021910974257, "loss": 2.4357, "step": 29655 }, { "epoch": 0.8, "learning_rate": 0.00020852701739509938, "loss": 2.5171, "step": 29656 }, { "epoch": 0.8, "learning_rate": 0.0002084738216765142, "loss": 2.5608, "step": 29657 }, { "epoch": 0.8, "learning_rate": 0.00020842063195438966, "loss": 2.5368, "step": 29658 }, { "epoch": 0.8, "learning_rate": 0.00020836744822912902, "loss": 2.236, "step": 29659 }, { "epoch": 0.8, "learning_rate": 0.00020831427050113527, "loss": 2.5023, "step": 29660 }, { "epoch": 0.8, "learning_rate": 0.0002082610987708108, "loss": 2.423, "step": 29661 }, { "epoch": 0.8, "learning_rate": 0.00020820793303855868, "loss": 2.6409, "step": 29662 }, { "epoch": 0.8, "learning_rate": 0.00020815477330478173, "loss": 2.3944, "step": 29663 }, { "epoch": 0.8, "learning_rate": 0.0002081016195698826, "loss": 2.2742, "step": 29664 }, { "epoch": 0.8, "learning_rate": 0.00020804847183426435, "loss": 2.7346, "step": 29665 }, { "epoch": 0.8, "learning_rate": 0.00020799533009832906, "loss": 2.1876, "step": 29666 }, { "epoch": 0.8, "learning_rate": 0.00020794219436247942, "loss": 2.4484, "step": 29667 }, { "epoch": 0.8, "learning_rate": 0.00020788906462711844, "loss": 2.2925, "step": 29668 }, { "epoch": 0.8, "learning_rate": 0.00020783594089264802, "loss": 2.7653, "step": 29669 }, { "epoch": 0.8, "learning_rate": 0.00020778282315947095, "loss": 2.6579, "step": 29670 }, { "epoch": 0.8, "learning_rate": 0.00020772971142798947, "loss": 2.3743, "step": 29671 }, { "epoch": 0.8, "learning_rate": 0.00020767660569860613, "loss": 2.0149, "step": 29672 }, { "epoch": 0.8, "learning_rate": 0.0002076235059717234, "loss": 2.5424, "step": 29673 }, { "epoch": 0.8, "learning_rate": 0.0002075704122477431, "loss": 3.0272, "step": 29674 }, { "epoch": 0.8, "learning_rate": 0.00020751732452706763, "loss": 2.7398, "step": 29675 }, { "epoch": 0.8, "learning_rate": 0.00020746424281009923, "loss": 2.3203, "step": 29676 }, { "epoch": 0.8, "learning_rate": 0.00020741116709724005, "loss": 2.5857, "step": 29677 }, { "epoch": 0.8, "learning_rate": 0.00020735809738889221, "loss": 2.2083, "step": 29678 }, { "epoch": 0.8, "learning_rate": 0.00020730503368545796, "loss": 2.5635, "step": 29679 }, { "epoch": 0.8, "learning_rate": 0.0002072519759873388, "loss": 2.6634, "step": 29680 }, { "epoch": 0.8, "learning_rate": 0.00020719892429493713, "loss": 2.5417, "step": 29681 }, { "epoch": 0.8, "learning_rate": 0.00020714587860865441, "loss": 2.5986, "step": 29682 }, { "epoch": 0.8, "learning_rate": 0.00020709283892889286, "loss": 2.5725, "step": 29683 }, { "epoch": 0.8, "learning_rate": 0.00020703980525605415, "loss": 2.2459, "step": 29684 }, { "epoch": 0.8, "learning_rate": 0.00020698677759054007, "loss": 2.8099, "step": 29685 }, { "epoch": 0.8, "learning_rate": 0.00020693375593275242, "loss": 2.6147, "step": 29686 }, { "epoch": 0.8, "learning_rate": 0.00020688074028309312, "loss": 2.2693, "step": 29687 }, { "epoch": 0.8, "learning_rate": 0.00020682773064196325, "loss": 2.5772, "step": 29688 }, { "epoch": 0.8, "learning_rate": 0.00020677472700976474, "loss": 2.33, "step": 29689 }, { "epoch": 0.8, "learning_rate": 0.00020672172938689904, "loss": 3.0132, "step": 29690 }, { "epoch": 0.8, "learning_rate": 0.00020666873777376772, "loss": 2.3617, "step": 29691 }, { "epoch": 0.8, "learning_rate": 0.00020661575217077244, "loss": 2.1897, "step": 29692 }, { "epoch": 0.8, "learning_rate": 0.00020656277257831413, "loss": 2.5732, "step": 29693 }, { "epoch": 0.8, "learning_rate": 0.00020650979899679433, "loss": 2.0514, "step": 29694 }, { "epoch": 0.8, "learning_rate": 0.00020645683142661486, "loss": 2.7816, "step": 29695 }, { "epoch": 0.8, "learning_rate": 0.00020640386986817583, "loss": 2.6719, "step": 29696 }, { "epoch": 0.8, "learning_rate": 0.00020635091432187958, "loss": 2.5266, "step": 29697 }, { "epoch": 0.8, "learning_rate": 0.00020629796478812724, "loss": 2.2597, "step": 29698 }, { "epoch": 0.8, "learning_rate": 0.00020624502126731926, "loss": 2.8539, "step": 29699 }, { "epoch": 0.8, "learning_rate": 0.00020619208375985732, "loss": 2.513, "step": 29700 }, { "epoch": 0.8, "learning_rate": 0.00020613915226614212, "loss": 2.8964, "step": 29701 }, { "epoch": 0.8, "learning_rate": 0.00020608622678657462, "loss": 2.1654, "step": 29702 }, { "epoch": 0.8, "learning_rate": 0.000206033307321556, "loss": 2.5237, "step": 29703 }, { "epoch": 0.8, "learning_rate": 0.00020598039387148705, "loss": 2.6382, "step": 29704 }, { "epoch": 0.8, "learning_rate": 0.00020592748643676872, "loss": 1.917, "step": 29705 }, { "epoch": 0.8, "learning_rate": 0.00020587458501780198, "loss": 2.1331, "step": 29706 }, { "epoch": 0.8, "learning_rate": 0.00020582168961498726, "loss": 2.7151, "step": 29707 }, { "epoch": 0.8, "learning_rate": 0.00020576880022872568, "loss": 2.2563, "step": 29708 }, { "epoch": 0.8, "learning_rate": 0.00020571591685941703, "loss": 2.7193, "step": 29709 }, { "epoch": 0.8, "learning_rate": 0.0002056630395074629, "loss": 2.3495, "step": 29710 }, { "epoch": 0.8, "learning_rate": 0.00020561016817326395, "loss": 2.7353, "step": 29711 }, { "epoch": 0.8, "learning_rate": 0.00020555730285721997, "loss": 2.8327, "step": 29712 }, { "epoch": 0.8, "learning_rate": 0.00020550444355973185, "loss": 2.4181, "step": 29713 }, { "epoch": 0.8, "learning_rate": 0.0002054515902812003, "loss": 2.3688, "step": 29714 }, { "epoch": 0.8, "learning_rate": 0.0002053987430220251, "loss": 2.1733, "step": 29715 }, { "epoch": 0.8, "learning_rate": 0.00020534590178260704, "loss": 2.4155, "step": 29716 }, { "epoch": 0.8, "learning_rate": 0.00020529306656334633, "loss": 2.5728, "step": 29717 }, { "epoch": 0.8, "learning_rate": 0.00020524023736464336, "loss": 2.1777, "step": 29718 }, { "epoch": 0.8, "learning_rate": 0.00020518741418689847, "loss": 2.4907, "step": 29719 }, { "epoch": 0.8, "learning_rate": 0.00020513459703051128, "loss": 2.6271, "step": 29720 }, { "epoch": 0.8, "learning_rate": 0.00020508178589588233, "loss": 2.3228, "step": 29721 }, { "epoch": 0.8, "learning_rate": 0.0002050289807834117, "loss": 2.619, "step": 29722 }, { "epoch": 0.8, "learning_rate": 0.0002049761816934994, "loss": 2.5642, "step": 29723 }, { "epoch": 0.8, "learning_rate": 0.00020492338862654558, "loss": 2.358, "step": 29724 }, { "epoch": 0.8, "learning_rate": 0.00020487060158294978, "loss": 2.7153, "step": 29725 }, { "epoch": 0.8, "learning_rate": 0.00020481782056311216, "loss": 2.6274, "step": 29726 }, { "epoch": 0.8, "learning_rate": 0.00020476504556743292, "loss": 2.6362, "step": 29727 }, { "epoch": 0.8, "learning_rate": 0.00020471227659631108, "loss": 2.5815, "step": 29728 }, { "epoch": 0.8, "learning_rate": 0.000204659513650147, "loss": 2.5458, "step": 29729 }, { "epoch": 0.8, "learning_rate": 0.00020460675672934016, "loss": 2.325, "step": 29730 }, { "epoch": 0.8, "learning_rate": 0.0002045540058342904, "loss": 2.7548, "step": 29731 }, { "epoch": 0.8, "learning_rate": 0.00020450126096539724, "loss": 2.3849, "step": 29732 }, { "epoch": 0.8, "learning_rate": 0.00020444852212306053, "loss": 2.5091, "step": 29733 }, { "epoch": 0.8, "learning_rate": 0.00020439578930767945, "loss": 2.5182, "step": 29734 }, { "epoch": 0.8, "learning_rate": 0.00020434306251965352, "loss": 2.2445, "step": 29735 }, { "epoch": 0.8, "learning_rate": 0.00020429034175938233, "loss": 2.6043, "step": 29736 }, { "epoch": 0.8, "learning_rate": 0.00020423762702726522, "loss": 2.4835, "step": 29737 }, { "epoch": 0.8, "learning_rate": 0.0002041849183237019, "loss": 2.3798, "step": 29738 }, { "epoch": 0.8, "learning_rate": 0.00020413221564909102, "loss": 2.3108, "step": 29739 }, { "epoch": 0.8, "learning_rate": 0.00020407951900383226, "loss": 3.0472, "step": 29740 }, { "epoch": 0.8, "learning_rate": 0.00020402682838832498, "loss": 2.376, "step": 29741 }, { "epoch": 0.8, "learning_rate": 0.00020397414380296785, "loss": 2.5539, "step": 29742 }, { "epoch": 0.8, "learning_rate": 0.00020392146524816037, "loss": 2.4931, "step": 29743 }, { "epoch": 0.8, "learning_rate": 0.00020386879272430146, "loss": 2.2803, "step": 29744 }, { "epoch": 0.8, "learning_rate": 0.00020381612623179035, "loss": 2.3936, "step": 29745 }, { "epoch": 0.8, "learning_rate": 0.0002037634657710261, "loss": 2.4543, "step": 29746 }, { "epoch": 0.8, "learning_rate": 0.0002037108113424072, "loss": 2.5587, "step": 29747 }, { "epoch": 0.8, "learning_rate": 0.0002036581629463329, "loss": 2.8961, "step": 29748 }, { "epoch": 0.8, "learning_rate": 0.00020360552058320202, "loss": 2.5229, "step": 29749 }, { "epoch": 0.8, "learning_rate": 0.00020355288425341324, "loss": 2.6467, "step": 29750 }, { "epoch": 0.8, "learning_rate": 0.0002035002539573657, "loss": 2.3798, "step": 29751 }, { "epoch": 0.8, "learning_rate": 0.0002034476296954576, "loss": 2.1388, "step": 29752 }, { "epoch": 0.8, "learning_rate": 0.0002033950114680878, "loss": 2.2547, "step": 29753 }, { "epoch": 0.8, "learning_rate": 0.00020334239927565534, "loss": 2.7904, "step": 29754 }, { "epoch": 0.8, "learning_rate": 0.0002032897931185581, "loss": 2.2932, "step": 29755 }, { "epoch": 0.8, "learning_rate": 0.0002032371929971947, "loss": 2.337, "step": 29756 }, { "epoch": 0.8, "learning_rate": 0.0002031845989119644, "loss": 3.1187, "step": 29757 }, { "epoch": 0.8, "learning_rate": 0.00020313201086326482, "loss": 2.9425, "step": 29758 }, { "epoch": 0.8, "learning_rate": 0.0002030794288514949, "loss": 2.5071, "step": 29759 }, { "epoch": 0.8, "learning_rate": 0.00020302685287705257, "loss": 2.4143, "step": 29760 }, { "epoch": 0.8, "learning_rate": 0.00020297428294033625, "loss": 2.518, "step": 29761 }, { "epoch": 0.8, "learning_rate": 0.00020292171904174428, "loss": 2.2058, "step": 29762 }, { "epoch": 0.8, "learning_rate": 0.00020286916118167497, "loss": 2.6637, "step": 29763 }, { "epoch": 0.8, "learning_rate": 0.00020281660936052626, "loss": 2.3787, "step": 29764 }, { "epoch": 0.8, "learning_rate": 0.0002027640635786967, "loss": 2.4693, "step": 29765 }, { "epoch": 0.8, "learning_rate": 0.00020271152383658376, "loss": 2.3339, "step": 29766 }, { "epoch": 0.8, "learning_rate": 0.00020265899013458612, "loss": 2.2911, "step": 29767 }, { "epoch": 0.8, "learning_rate": 0.0002026064624731011, "loss": 3.0566, "step": 29768 }, { "epoch": 0.8, "learning_rate": 0.00020255394085252665, "loss": 2.3317, "step": 29769 }, { "epoch": 0.8, "learning_rate": 0.00020250142527326154, "loss": 2.3094, "step": 29770 }, { "epoch": 0.8, "learning_rate": 0.0002024489157357029, "loss": 2.1818, "step": 29771 }, { "epoch": 0.8, "learning_rate": 0.0002023964122402485, "loss": 2.4095, "step": 29772 }, { "epoch": 0.8, "learning_rate": 0.00020234391478729662, "loss": 2.6162, "step": 29773 }, { "epoch": 0.8, "learning_rate": 0.00020229142337724448, "loss": 2.5954, "step": 29774 }, { "epoch": 0.8, "learning_rate": 0.00020223893801048977, "loss": 2.4527, "step": 29775 }, { "epoch": 0.8, "learning_rate": 0.00020218645868743025, "loss": 2.3686, "step": 29776 }, { "epoch": 0.8, "learning_rate": 0.0002021339854084635, "loss": 2.1738, "step": 29777 }, { "epoch": 0.8, "learning_rate": 0.00020208151817398734, "loss": 2.4154, "step": 29778 }, { "epoch": 0.8, "learning_rate": 0.00020202905698439867, "loss": 2.2799, "step": 29779 }, { "epoch": 0.8, "learning_rate": 0.00020197660184009515, "loss": 2.211, "step": 29780 }, { "epoch": 0.8, "learning_rate": 0.00020192415274147447, "loss": 2.2515, "step": 29781 }, { "epoch": 0.8, "learning_rate": 0.0002018717096889333, "loss": 2.7371, "step": 29782 }, { "epoch": 0.8, "learning_rate": 0.00020181927268286948, "loss": 2.1039, "step": 29783 }, { "epoch": 0.8, "learning_rate": 0.00020176684172368053, "loss": 2.271, "step": 29784 }, { "epoch": 0.8, "learning_rate": 0.00020171441681176306, "loss": 2.6696, "step": 29785 }, { "epoch": 0.8, "learning_rate": 0.00020166199794751462, "loss": 2.6221, "step": 29786 }, { "epoch": 0.8, "learning_rate": 0.00020160958513133187, "loss": 2.4979, "step": 29787 }, { "epoch": 0.8, "learning_rate": 0.0002015571783636122, "loss": 2.8698, "step": 29788 }, { "epoch": 0.8, "learning_rate": 0.0002015047776447526, "loss": 2.6507, "step": 29789 }, { "epoch": 0.8, "learning_rate": 0.00020145238297515001, "loss": 2.802, "step": 29790 }, { "epoch": 0.8, "learning_rate": 0.0002013999943552014, "loss": 2.5672, "step": 29791 }, { "epoch": 0.8, "learning_rate": 0.00020134761178530403, "loss": 2.4713, "step": 29792 }, { "epoch": 0.8, "learning_rate": 0.00020129523526585402, "loss": 2.4074, "step": 29793 }, { "epoch": 0.8, "learning_rate": 0.00020124286479724873, "loss": 2.5126, "step": 29794 }, { "epoch": 0.8, "learning_rate": 0.0002011905003798843, "loss": 2.2584, "step": 29795 }, { "epoch": 0.8, "learning_rate": 0.00020113814201415793, "loss": 2.2713, "step": 29796 }, { "epoch": 0.8, "learning_rate": 0.00020108578970046655, "loss": 2.9373, "step": 29797 }, { "epoch": 0.8, "learning_rate": 0.00020103344343920605, "loss": 2.1958, "step": 29798 }, { "epoch": 0.8, "learning_rate": 0.00020098110323077346, "loss": 2.6857, "step": 29799 }, { "epoch": 0.8, "learning_rate": 0.00020092876907556534, "loss": 2.5965, "step": 29800 }, { "epoch": 0.8, "learning_rate": 0.00020087644097397772, "loss": 1.8674, "step": 29801 }, { "epoch": 0.8, "learning_rate": 0.0002008241189264074, "loss": 2.3788, "step": 29802 }, { "epoch": 0.8, "learning_rate": 0.0002007718029332507, "loss": 2.5312, "step": 29803 }, { "epoch": 0.8, "learning_rate": 0.00020071949299490377, "loss": 2.6827, "step": 29804 }, { "epoch": 0.8, "learning_rate": 0.00020066718911176352, "loss": 2.5562, "step": 29805 }, { "epoch": 0.8, "learning_rate": 0.00020061489128422538, "loss": 2.867, "step": 29806 }, { "epoch": 0.8, "learning_rate": 0.00020056259951268585, "loss": 2.0268, "step": 29807 }, { "epoch": 0.8, "learning_rate": 0.00020051031379754124, "loss": 2.1222, "step": 29808 }, { "epoch": 0.8, "learning_rate": 0.0002004580341391875, "loss": 2.8278, "step": 29809 }, { "epoch": 0.8, "learning_rate": 0.00020040576053802073, "loss": 2.6584, "step": 29810 }, { "epoch": 0.8, "learning_rate": 0.00020035349299443728, "loss": 2.427, "step": 29811 }, { "epoch": 0.8, "learning_rate": 0.0002003012315088325, "loss": 2.2281, "step": 29812 }, { "epoch": 0.8, "learning_rate": 0.00020024897608160298, "loss": 2.6137, "step": 29813 }, { "epoch": 0.8, "learning_rate": 0.00020019672671314393, "loss": 2.8343, "step": 29814 }, { "epoch": 0.8, "learning_rate": 0.00020014448340385137, "loss": 2.7823, "step": 29815 }, { "epoch": 0.8, "learning_rate": 0.00020009224615412136, "loss": 2.3662, "step": 29816 }, { "epoch": 0.8, "learning_rate": 0.0002000400149643493, "loss": 2.5103, "step": 29817 }, { "epoch": 0.8, "learning_rate": 0.00019998778983493126, "loss": 2.8141, "step": 29818 }, { "epoch": 0.8, "learning_rate": 0.0001999355707662629, "loss": 2.2512, "step": 29819 }, { "epoch": 0.8, "learning_rate": 0.00019988335775873934, "loss": 2.4472, "step": 29820 }, { "epoch": 0.8, "learning_rate": 0.00019983115081275639, "loss": 2.5446, "step": 29821 }, { "epoch": 0.8, "learning_rate": 0.0001997789499287096, "loss": 2.6549, "step": 29822 }, { "epoch": 0.8, "learning_rate": 0.00019972675510699435, "loss": 2.6968, "step": 29823 }, { "epoch": 0.8, "learning_rate": 0.00019967456634800652, "loss": 2.3009, "step": 29824 }, { "epoch": 0.8, "learning_rate": 0.0001996223836521407, "loss": 2.2765, "step": 29825 }, { "epoch": 0.8, "learning_rate": 0.00019957020701979268, "loss": 2.657, "step": 29826 }, { "epoch": 0.8, "learning_rate": 0.00019951803645135792, "loss": 2.176, "step": 29827 }, { "epoch": 0.8, "learning_rate": 0.0001994658719472312, "loss": 2.6177, "step": 29828 }, { "epoch": 0.8, "learning_rate": 0.0001994137135078078, "loss": 2.3421, "step": 29829 }, { "epoch": 0.8, "learning_rate": 0.00019936156113348303, "loss": 2.5005, "step": 29830 }, { "epoch": 0.8, "learning_rate": 0.00019930941482465192, "loss": 2.3565, "step": 29831 }, { "epoch": 0.8, "learning_rate": 0.00019925727458170985, "loss": 2.4687, "step": 29832 }, { "epoch": 0.8, "learning_rate": 0.00019920514040505123, "loss": 2.0326, "step": 29833 }, { "epoch": 0.8, "learning_rate": 0.00019915301229507122, "loss": 2.4768, "step": 29834 }, { "epoch": 0.8, "learning_rate": 0.00019910089025216494, "loss": 2.5425, "step": 29835 }, { "epoch": 0.8, "learning_rate": 0.00019904877427672697, "loss": 1.9817, "step": 29836 }, { "epoch": 0.8, "learning_rate": 0.00019899666436915266, "loss": 2.367, "step": 29837 }, { "epoch": 0.8, "learning_rate": 0.0001989445605298361, "loss": 2.3995, "step": 29838 }, { "epoch": 0.8, "learning_rate": 0.0001988924627591724, "loss": 2.9768, "step": 29839 }, { "epoch": 0.8, "learning_rate": 0.00019884037105755636, "loss": 2.7356, "step": 29840 }, { "epoch": 0.8, "learning_rate": 0.00019878828542538229, "loss": 2.7362, "step": 29841 }, { "epoch": 0.8, "learning_rate": 0.00019873620586304452, "loss": 2.6572, "step": 29842 }, { "epoch": 0.8, "learning_rate": 0.00019868413237093864, "loss": 2.6149, "step": 29843 }, { "epoch": 0.8, "learning_rate": 0.00019863206494945818, "loss": 2.3592, "step": 29844 }, { "epoch": 0.8, "learning_rate": 0.00019858000359899798, "loss": 2.1052, "step": 29845 }, { "epoch": 0.8, "learning_rate": 0.00019852794831995259, "loss": 2.5944, "step": 29846 }, { "epoch": 0.8, "learning_rate": 0.00019847589911271601, "loss": 1.8985, "step": 29847 }, { "epoch": 0.8, "learning_rate": 0.00019842385597768265, "loss": 2.7121, "step": 29848 }, { "epoch": 0.8, "learning_rate": 0.00019837181891524681, "loss": 2.3739, "step": 29849 }, { "epoch": 0.8, "learning_rate": 0.00019831978792580275, "loss": 2.909, "step": 29850 }, { "epoch": 0.8, "learning_rate": 0.00019826776300974503, "loss": 2.2005, "step": 29851 }, { "epoch": 0.8, "learning_rate": 0.00019821574416746703, "loss": 2.6484, "step": 29852 }, { "epoch": 0.8, "learning_rate": 0.00019816373139936328, "loss": 2.5139, "step": 29853 }, { "epoch": 0.8, "learning_rate": 0.00019811172470582796, "loss": 2.1887, "step": 29854 }, { "epoch": 0.8, "learning_rate": 0.00019805972408725426, "loss": 2.292, "step": 29855 }, { "epoch": 0.8, "learning_rate": 0.00019800772954403734, "loss": 2.7378, "step": 29856 }, { "epoch": 0.8, "learning_rate": 0.0001979557410765702, "loss": 2.2218, "step": 29857 }, { "epoch": 0.8, "learning_rate": 0.000197903758685247, "loss": 2.0817, "step": 29858 }, { "epoch": 0.8, "learning_rate": 0.00019785178237046176, "loss": 2.9686, "step": 29859 }, { "epoch": 0.8, "learning_rate": 0.00019779981213260766, "loss": 2.1154, "step": 29860 }, { "epoch": 0.8, "learning_rate": 0.0001977478479720789, "loss": 2.3454, "step": 29861 }, { "epoch": 0.8, "learning_rate": 0.0001976958898892689, "loss": 2.5965, "step": 29862 }, { "epoch": 0.8, "learning_rate": 0.00019764393788457147, "loss": 2.9278, "step": 29863 }, { "epoch": 0.8, "learning_rate": 0.0001975919919583804, "loss": 2.1808, "step": 29864 }, { "epoch": 0.8, "learning_rate": 0.00019754005211108862, "loss": 2.0107, "step": 29865 }, { "epoch": 0.8, "learning_rate": 0.00019748811834309, "loss": 2.4951, "step": 29866 }, { "epoch": 0.8, "learning_rate": 0.0001974361906547778, "loss": 2.0616, "step": 29867 }, { "epoch": 0.8, "learning_rate": 0.00019738426904654561, "loss": 3.0015, "step": 29868 }, { "epoch": 0.8, "learning_rate": 0.00019733235351878677, "loss": 2.2583, "step": 29869 }, { "epoch": 0.8, "learning_rate": 0.00019728044407189472, "loss": 2.256, "step": 29870 }, { "epoch": 0.8, "learning_rate": 0.0001972285407062623, "loss": 2.9956, "step": 29871 }, { "epoch": 0.8, "learning_rate": 0.00019717664342228303, "loss": 2.7952, "step": 29872 }, { "epoch": 0.8, "learning_rate": 0.00019712475222034986, "loss": 2.4216, "step": 29873 }, { "epoch": 0.8, "learning_rate": 0.00019707286710085603, "loss": 2.5645, "step": 29874 }, { "epoch": 0.8, "learning_rate": 0.00019702098806419454, "loss": 2.6441, "step": 29875 }, { "epoch": 0.8, "learning_rate": 0.00019696911511075854, "loss": 2.7012, "step": 29876 }, { "epoch": 0.8, "learning_rate": 0.00019691724824094092, "loss": 2.2372, "step": 29877 }, { "epoch": 0.8, "learning_rate": 0.00019686538745513493, "loss": 2.6172, "step": 29878 }, { "epoch": 0.8, "learning_rate": 0.00019681353275373292, "loss": 2.6712, "step": 29879 }, { "epoch": 0.8, "learning_rate": 0.00019676168413712802, "loss": 1.9359, "step": 29880 }, { "epoch": 0.8, "learning_rate": 0.00019670984160571293, "loss": 2.6126, "step": 29881 }, { "epoch": 0.8, "learning_rate": 0.00019665800515988053, "loss": 2.3109, "step": 29882 }, { "epoch": 0.8, "learning_rate": 0.00019660617480002363, "loss": 2.7198, "step": 29883 }, { "epoch": 0.8, "learning_rate": 0.00019655435052653446, "loss": 2.2185, "step": 29884 }, { "epoch": 0.8, "learning_rate": 0.00019650253233980598, "loss": 2.6238, "step": 29885 }, { "epoch": 0.8, "learning_rate": 0.0001964507202402309, "loss": 1.8185, "step": 29886 }, { "epoch": 0.8, "learning_rate": 0.00019639891422820123, "loss": 2.6028, "step": 29887 }, { "epoch": 0.8, "learning_rate": 0.00019634711430410945, "loss": 2.3266, "step": 29888 }, { "epoch": 0.8, "learning_rate": 0.00019629532046834875, "loss": 3.026, "step": 29889 }, { "epoch": 0.8, "learning_rate": 0.0001962435327213108, "loss": 2.6082, "step": 29890 }, { "epoch": 0.8, "learning_rate": 0.00019619175106338837, "loss": 2.3163, "step": 29891 }, { "epoch": 0.8, "learning_rate": 0.0001961399754949733, "loss": 2.407, "step": 29892 }, { "epoch": 0.8, "learning_rate": 0.00019608820601645804, "loss": 2.4154, "step": 29893 }, { "epoch": 0.8, "learning_rate": 0.00019603644262823473, "loss": 2.107, "step": 29894 }, { "epoch": 0.8, "learning_rate": 0.0001959846853306957, "loss": 1.9231, "step": 29895 }, { "epoch": 0.8, "learning_rate": 0.00019593293412423297, "loss": 2.3653, "step": 29896 }, { "epoch": 0.8, "learning_rate": 0.00019588118900923878, "loss": 2.4687, "step": 29897 }, { "epoch": 0.8, "learning_rate": 0.00019582944998610462, "loss": 2.5423, "step": 29898 }, { "epoch": 0.8, "learning_rate": 0.00019577771705522307, "loss": 2.5688, "step": 29899 }, { "epoch": 0.8, "learning_rate": 0.00019572599021698556, "loss": 2.4203, "step": 29900 }, { "epoch": 0.8, "learning_rate": 0.0001956742694717839, "loss": 2.4636, "step": 29901 }, { "epoch": 0.8, "learning_rate": 0.00019562255482001058, "loss": 2.625, "step": 29902 }, { "epoch": 0.8, "learning_rate": 0.0001955708462620568, "loss": 2.5607, "step": 29903 }, { "epoch": 0.8, "learning_rate": 0.0001955191437983145, "loss": 2.1603, "step": 29904 }, { "epoch": 0.8, "learning_rate": 0.00019546744742917556, "loss": 1.8597, "step": 29905 }, { "epoch": 0.8, "learning_rate": 0.00019541575715503114, "loss": 2.7673, "step": 29906 }, { "epoch": 0.8, "learning_rate": 0.00019536407297627312, "loss": 2.2728, "step": 29907 }, { "epoch": 0.8, "learning_rate": 0.000195312394893293, "loss": 2.534, "step": 29908 }, { "epoch": 0.8, "learning_rate": 0.00019526072290648234, "loss": 2.6908, "step": 29909 }, { "epoch": 0.8, "learning_rate": 0.0001952090570162327, "loss": 2.3334, "step": 29910 }, { "epoch": 0.8, "learning_rate": 0.00019515739722293524, "loss": 2.5103, "step": 29911 }, { "epoch": 0.8, "learning_rate": 0.0001951057435269814, "loss": 2.359, "step": 29912 }, { "epoch": 0.8, "learning_rate": 0.00019505409592876288, "loss": 2.305, "step": 29913 }, { "epoch": 0.8, "learning_rate": 0.00019500245442867004, "loss": 2.0647, "step": 29914 }, { "epoch": 0.8, "learning_rate": 0.00019495081902709522, "loss": 2.6499, "step": 29915 }, { "epoch": 0.8, "learning_rate": 0.00019489918972442877, "loss": 2.7358, "step": 29916 }, { "epoch": 0.8, "learning_rate": 0.00019484756652106205, "loss": 2.4217, "step": 29917 }, { "epoch": 0.8, "learning_rate": 0.00019479594941738666, "loss": 2.3415, "step": 29918 }, { "epoch": 0.8, "learning_rate": 0.0001947443384137928, "loss": 2.1671, "step": 29919 }, { "epoch": 0.8, "learning_rate": 0.00019469273351067196, "loss": 2.2637, "step": 29920 }, { "epoch": 0.8, "learning_rate": 0.00019464113470841492, "loss": 2.8254, "step": 29921 }, { "epoch": 0.8, "learning_rate": 0.00019458954200741264, "loss": 2.2734, "step": 29922 }, { "epoch": 0.8, "learning_rate": 0.00019453795540805608, "loss": 2.4137, "step": 29923 }, { "epoch": 0.8, "learning_rate": 0.00019448637491073617, "loss": 2.4481, "step": 29924 }, { "epoch": 0.8, "learning_rate": 0.00019443480051584329, "loss": 1.8372, "step": 29925 }, { "epoch": 0.8, "learning_rate": 0.00019438323222376852, "loss": 2.319, "step": 29926 }, { "epoch": 0.8, "learning_rate": 0.0001943316700349018, "loss": 2.7594, "step": 29927 }, { "epoch": 0.8, "learning_rate": 0.00019428011394963463, "loss": 2.1514, "step": 29928 }, { "epoch": 0.8, "learning_rate": 0.00019422856396835754, "loss": 2.6491, "step": 29929 }, { "epoch": 0.8, "learning_rate": 0.00019417702009146055, "loss": 2.3432, "step": 29930 }, { "epoch": 0.8, "learning_rate": 0.00019412548231933425, "loss": 2.2603, "step": 29931 }, { "epoch": 0.8, "learning_rate": 0.00019407395065236966, "loss": 2.5286, "step": 29932 }, { "epoch": 0.8, "learning_rate": 0.00019402242509095635, "loss": 2.4563, "step": 29933 }, { "epoch": 0.8, "learning_rate": 0.00019397090563548513, "loss": 2.8695, "step": 29934 }, { "epoch": 0.8, "learning_rate": 0.00019391939228634615, "loss": 2.6026, "step": 29935 }, { "epoch": 0.8, "learning_rate": 0.00019386788504392982, "loss": 2.8546, "step": 29936 }, { "epoch": 0.8, "learning_rate": 0.00019381638390862644, "loss": 2.1391, "step": 29937 }, { "epoch": 0.8, "learning_rate": 0.00019376488888082577, "loss": 2.4003, "step": 29938 }, { "epoch": 0.8, "learning_rate": 0.00019371339996091818, "loss": 2.2175, "step": 29939 }, { "epoch": 0.8, "learning_rate": 0.00019366191714929371, "loss": 2.7504, "step": 29940 }, { "epoch": 0.8, "learning_rate": 0.00019361044044634247, "loss": 2.7407, "step": 29941 }, { "epoch": 0.8, "learning_rate": 0.0001935589698524546, "loss": 2.2839, "step": 29942 }, { "epoch": 0.8, "learning_rate": 0.00019350750536801942, "loss": 2.5397, "step": 29943 }, { "epoch": 0.8, "learning_rate": 0.00019345604699342735, "loss": 3.1331, "step": 29944 }, { "epoch": 0.8, "learning_rate": 0.00019340459472906823, "loss": 2.0659, "step": 29945 }, { "epoch": 0.8, "learning_rate": 0.00019335314857533138, "loss": 2.6357, "step": 29946 }, { "epoch": 0.8, "learning_rate": 0.000193301708532607, "loss": 2.1252, "step": 29947 }, { "epoch": 0.8, "learning_rate": 0.00019325027460128454, "loss": 2.5321, "step": 29948 }, { "epoch": 0.8, "learning_rate": 0.00019319884678175382, "loss": 2.297, "step": 29949 }, { "epoch": 0.8, "learning_rate": 0.00019314742507440464, "loss": 2.1038, "step": 29950 }, { "epoch": 0.8, "learning_rate": 0.00019309600947962615, "loss": 2.5267, "step": 29951 }, { "epoch": 0.8, "learning_rate": 0.00019304459999780788, "loss": 2.5719, "step": 29952 }, { "epoch": 0.8, "learning_rate": 0.00019299319662933957, "loss": 1.9476, "step": 29953 }, { "epoch": 0.8, "learning_rate": 0.00019294179937461042, "loss": 2.4005, "step": 29954 }, { "epoch": 0.81, "learning_rate": 0.00019289040823400994, "loss": 2.8653, "step": 29955 }, { "epoch": 0.81, "learning_rate": 0.00019283902320792778, "loss": 2.3062, "step": 29956 }, { "epoch": 0.81, "learning_rate": 0.00019278764429675254, "loss": 2.8289, "step": 29957 }, { "epoch": 0.81, "learning_rate": 0.0001927362715008738, "loss": 2.3086, "step": 29958 }, { "epoch": 0.81, "learning_rate": 0.0001926849048206809, "loss": 2.8888, "step": 29959 }, { "epoch": 0.81, "learning_rate": 0.00019263354425656267, "loss": 2.4614, "step": 29960 }, { "epoch": 0.81, "learning_rate": 0.0001925821898089084, "loss": 2.3464, "step": 29961 }, { "epoch": 0.81, "learning_rate": 0.00019253084147810706, "loss": 2.4344, "step": 29962 }, { "epoch": 0.81, "learning_rate": 0.00019247949926454766, "loss": 2.6485, "step": 29963 }, { "epoch": 0.81, "learning_rate": 0.00019242816316861956, "loss": 2.6531, "step": 29964 }, { "epoch": 0.81, "learning_rate": 0.00019237683319071097, "loss": 2.4707, "step": 29965 }, { "epoch": 0.81, "learning_rate": 0.00019232550933121119, "loss": 2.6953, "step": 29966 }, { "epoch": 0.81, "learning_rate": 0.00019227419159050885, "loss": 2.7865, "step": 29967 }, { "epoch": 0.81, "learning_rate": 0.0001922228799689929, "loss": 2.5229, "step": 29968 }, { "epoch": 0.81, "learning_rate": 0.00019217157446705226, "loss": 2.8363, "step": 29969 }, { "epoch": 0.81, "learning_rate": 0.00019212027508507502, "loss": 2.3042, "step": 29970 }, { "epoch": 0.81, "learning_rate": 0.00019206898182345022, "loss": 2.855, "step": 29971 }, { "epoch": 0.81, "learning_rate": 0.00019201769468256657, "loss": 2.6238, "step": 29972 }, { "epoch": 0.81, "learning_rate": 0.00019196641366281221, "loss": 2.9714, "step": 29973 }, { "epoch": 0.81, "learning_rate": 0.00019191513876457545, "loss": 2.0877, "step": 29974 }, { "epoch": 0.81, "learning_rate": 0.0001918638699882458, "loss": 2.3647, "step": 29975 }, { "epoch": 0.81, "learning_rate": 0.00019181260733421056, "loss": 2.9166, "step": 29976 }, { "epoch": 0.81, "learning_rate": 0.00019176135080285894, "loss": 2.8632, "step": 29977 }, { "epoch": 0.81, "learning_rate": 0.00019171010039457847, "loss": 2.2613, "step": 29978 }, { "epoch": 0.81, "learning_rate": 0.00019165885610975786, "loss": 2.5871, "step": 29979 }, { "epoch": 0.81, "learning_rate": 0.00019160761794878513, "loss": 2.2299, "step": 29980 }, { "epoch": 0.81, "learning_rate": 0.0001915563859120486, "loss": 2.299, "step": 29981 }, { "epoch": 0.81, "learning_rate": 0.00019150515999993644, "loss": 2.4671, "step": 29982 }, { "epoch": 0.81, "learning_rate": 0.0001914539402128368, "loss": 3.0387, "step": 29983 }, { "epoch": 0.81, "learning_rate": 0.00019140272655113734, "loss": 2.3796, "step": 29984 }, { "epoch": 0.81, "learning_rate": 0.00019135151901522653, "loss": 2.7058, "step": 29985 }, { "epoch": 0.81, "learning_rate": 0.00019130031760549173, "loss": 2.8158, "step": 29986 }, { "epoch": 0.81, "learning_rate": 0.00019124912232232094, "loss": 2.1092, "step": 29987 }, { "epoch": 0.81, "learning_rate": 0.00019119793316610268, "loss": 2.7242, "step": 29988 }, { "epoch": 0.81, "learning_rate": 0.00019114675013722404, "loss": 2.3435, "step": 29989 }, { "epoch": 0.81, "learning_rate": 0.00019109557323607296, "loss": 2.482, "step": 29990 }, { "epoch": 0.81, "learning_rate": 0.00019104440246303756, "loss": 1.9488, "step": 29991 }, { "epoch": 0.81, "learning_rate": 0.00019099323781850475, "loss": 2.6677, "step": 29992 }, { "epoch": 0.81, "learning_rate": 0.00019094207930286266, "loss": 2.6146, "step": 29993 }, { "epoch": 0.81, "learning_rate": 0.00019089092691649867, "loss": 2.5378, "step": 29994 }, { "epoch": 0.81, "learning_rate": 0.00019083978065980033, "loss": 2.3434, "step": 29995 }, { "epoch": 0.81, "learning_rate": 0.0001907886405331555, "loss": 2.6544, "step": 29996 }, { "epoch": 0.81, "learning_rate": 0.00019073750653695088, "loss": 2.7855, "step": 29997 }, { "epoch": 0.81, "learning_rate": 0.00019068637867157435, "loss": 2.1412, "step": 29998 }, { "epoch": 0.81, "learning_rate": 0.00019063525693741325, "loss": 2.3128, "step": 29999 }, { "epoch": 0.81, "learning_rate": 0.00019058414133485435, "loss": 2.6816, "step": 30000 }, { "epoch": 0.81, "learning_rate": 0.0001905330318642855, "loss": 2.3894, "step": 30001 }, { "epoch": 0.81, "learning_rate": 0.00019048192852609393, "loss": 2.4485, "step": 30002 }, { "epoch": 0.81, "learning_rate": 0.0001904308313206663, "loss": 2.7862, "step": 30003 }, { "epoch": 0.81, "learning_rate": 0.0001903797402483901, "loss": 2.7332, "step": 30004 }, { "epoch": 0.81, "learning_rate": 0.00019032865530965216, "loss": 2.6801, "step": 30005 }, { "epoch": 0.81, "learning_rate": 0.00019027757650483945, "loss": 2.4858, "step": 30006 }, { "epoch": 0.81, "learning_rate": 0.00019022650383433915, "loss": 2.3722, "step": 30007 }, { "epoch": 0.81, "learning_rate": 0.00019017543729853804, "loss": 2.3605, "step": 30008 }, { "epoch": 0.81, "learning_rate": 0.0001901243768978229, "loss": 2.1774, "step": 30009 }, { "epoch": 0.81, "learning_rate": 0.00019007332263258115, "loss": 2.8247, "step": 30010 }, { "epoch": 0.81, "learning_rate": 0.00019002227450319877, "loss": 2.4405, "step": 30011 }, { "epoch": 0.81, "learning_rate": 0.00018997123251006308, "loss": 2.5576, "step": 30012 }, { "epoch": 0.81, "learning_rate": 0.00018992019665355997, "loss": 2.8036, "step": 30013 }, { "epoch": 0.81, "learning_rate": 0.00018986916693407698, "loss": 2.5597, "step": 30014 }, { "epoch": 0.81, "learning_rate": 0.00018981814335200054, "loss": 2.7293, "step": 30015 }, { "epoch": 0.81, "learning_rate": 0.0001897671259077167, "loss": 2.1634, "step": 30016 }, { "epoch": 0.81, "learning_rate": 0.0001897161146016123, "loss": 2.1452, "step": 30017 }, { "epoch": 0.81, "learning_rate": 0.000189665109434074, "loss": 1.9585, "step": 30018 }, { "epoch": 0.81, "learning_rate": 0.0001896141104054877, "loss": 2.2196, "step": 30019 }, { "epoch": 0.81, "learning_rate": 0.00018956311751624, "loss": 2.4854, "step": 30020 }, { "epoch": 0.81, "learning_rate": 0.00018951213076671725, "loss": 2.4966, "step": 30021 }, { "epoch": 0.81, "learning_rate": 0.0001894611501573057, "loss": 2.7472, "step": 30022 }, { "epoch": 0.81, "learning_rate": 0.0001894101756883918, "loss": 2.6388, "step": 30023 }, { "epoch": 0.81, "learning_rate": 0.00018935920736036128, "loss": 2.2401, "step": 30024 }, { "epoch": 0.81, "learning_rate": 0.00018930824517360035, "loss": 2.6405, "step": 30025 }, { "epoch": 0.81, "learning_rate": 0.0001892572891284954, "loss": 2.2843, "step": 30026 }, { "epoch": 0.81, "learning_rate": 0.00018920633922543217, "loss": 2.362, "step": 30027 }, { "epoch": 0.81, "learning_rate": 0.000189155395464797, "loss": 2.6884, "step": 30028 }, { "epoch": 0.81, "learning_rate": 0.0001891044578469754, "loss": 2.4356, "step": 30029 }, { "epoch": 0.81, "learning_rate": 0.0001890535263723534, "loss": 2.3887, "step": 30030 }, { "epoch": 0.81, "learning_rate": 0.00018900260104131716, "loss": 2.5627, "step": 30031 }, { "epoch": 0.81, "learning_rate": 0.00018895168185425193, "loss": 2.3023, "step": 30032 }, { "epoch": 0.81, "learning_rate": 0.0001889007688115436, "loss": 2.7686, "step": 30033 }, { "epoch": 0.81, "learning_rate": 0.00018884986191357845, "loss": 2.6665, "step": 30034 }, { "epoch": 0.81, "learning_rate": 0.00018879896116074158, "loss": 2.5359, "step": 30035 }, { "epoch": 0.81, "learning_rate": 0.0001887480665534187, "loss": 2.8023, "step": 30036 }, { "epoch": 0.81, "learning_rate": 0.0001886971780919956, "loss": 2.4936, "step": 30037 }, { "epoch": 0.81, "learning_rate": 0.00018864629577685743, "loss": 2.2613, "step": 30038 }, { "epoch": 0.81, "learning_rate": 0.0001885954196083899, "loss": 2.5814, "step": 30039 }, { "epoch": 0.81, "learning_rate": 0.00018854454958697843, "loss": 2.2827, "step": 30040 }, { "epoch": 0.81, "learning_rate": 0.0001884936857130083, "loss": 2.6767, "step": 30041 }, { "epoch": 0.81, "learning_rate": 0.0001884428279868653, "loss": 2.301, "step": 30042 }, { "epoch": 0.81, "learning_rate": 0.0001883919764089339, "loss": 2.8746, "step": 30043 }, { "epoch": 0.81, "learning_rate": 0.00018834113097959993, "loss": 2.7558, "step": 30044 }, { "epoch": 0.81, "learning_rate": 0.00018829029169924871, "loss": 1.7409, "step": 30045 }, { "epoch": 0.81, "learning_rate": 0.0001882394585682645, "loss": 2.3119, "step": 30046 }, { "epoch": 0.81, "learning_rate": 0.0001881886315870336, "loss": 2.8098, "step": 30047 }, { "epoch": 0.81, "learning_rate": 0.00018813781075594017, "loss": 2.3156, "step": 30048 }, { "epoch": 0.81, "learning_rate": 0.0001880869960753696, "loss": 2.2477, "step": 30049 }, { "epoch": 0.81, "learning_rate": 0.00018803618754570706, "loss": 2.1364, "step": 30050 }, { "epoch": 0.81, "learning_rate": 0.00018798538516733699, "loss": 2.4895, "step": 30051 }, { "epoch": 0.81, "learning_rate": 0.0001879345889406443, "loss": 2.8608, "step": 30052 }, { "epoch": 0.81, "learning_rate": 0.00018788379886601416, "loss": 2.6352, "step": 30053 }, { "epoch": 0.81, "learning_rate": 0.000187833014943831, "loss": 2.4777, "step": 30054 }, { "epoch": 0.81, "learning_rate": 0.00018778223717448006, "loss": 2.5909, "step": 30055 }, { "epoch": 0.81, "learning_rate": 0.0001877314655583454, "loss": 2.6111, "step": 30056 }, { "epoch": 0.81, "learning_rate": 0.00018768070009581207, "loss": 2.641, "step": 30057 }, { "epoch": 0.81, "learning_rate": 0.00018762994078726458, "loss": 2.3649, "step": 30058 }, { "epoch": 0.81, "learning_rate": 0.00018757918763308702, "loss": 2.3629, "step": 30059 }, { "epoch": 0.81, "learning_rate": 0.00018752844063366447, "loss": 2.6491, "step": 30060 }, { "epoch": 0.81, "learning_rate": 0.00018747769978938157, "loss": 2.508, "step": 30061 }, { "epoch": 0.81, "learning_rate": 0.00018742696510062206, "loss": 2.7012, "step": 30062 }, { "epoch": 0.81, "learning_rate": 0.0001873762365677708, "loss": 2.6197, "step": 30063 }, { "epoch": 0.81, "learning_rate": 0.00018732551419121157, "loss": 2.8275, "step": 30064 }, { "epoch": 0.81, "learning_rate": 0.00018727479797132907, "loss": 2.3387, "step": 30065 }, { "epoch": 0.81, "learning_rate": 0.00018722408790850743, "loss": 2.175, "step": 30066 }, { "epoch": 0.81, "learning_rate": 0.00018717338400313068, "loss": 2.688, "step": 30067 }, { "epoch": 0.81, "learning_rate": 0.00018712268625558303, "loss": 2.7724, "step": 30068 }, { "epoch": 0.81, "learning_rate": 0.00018707199466624891, "loss": 2.7367, "step": 30069 }, { "epoch": 0.81, "learning_rate": 0.00018702130923551176, "loss": 2.4733, "step": 30070 }, { "epoch": 0.81, "learning_rate": 0.0001869706299637558, "loss": 2.5159, "step": 30071 }, { "epoch": 0.81, "learning_rate": 0.00018691995685136498, "loss": 2.6714, "step": 30072 }, { "epoch": 0.81, "learning_rate": 0.00018686928989872332, "loss": 2.8258, "step": 30073 }, { "epoch": 0.81, "learning_rate": 0.0001868186291062147, "loss": 2.1467, "step": 30074 }, { "epoch": 0.81, "learning_rate": 0.00018676797447422243, "loss": 2.4038, "step": 30075 }, { "epoch": 0.81, "learning_rate": 0.00018671732600313075, "loss": 2.3741, "step": 30076 }, { "epoch": 0.81, "learning_rate": 0.0001866666836933234, "loss": 2.0194, "step": 30077 }, { "epoch": 0.81, "learning_rate": 0.00018661604754518357, "loss": 2.9136, "step": 30078 }, { "epoch": 0.81, "learning_rate": 0.00018656541755909518, "loss": 2.5492, "step": 30079 }, { "epoch": 0.81, "learning_rate": 0.00018651479373544167, "loss": 2.4524, "step": 30080 }, { "epoch": 0.81, "learning_rate": 0.00018646417607460675, "loss": 2.4416, "step": 30081 }, { "epoch": 0.81, "learning_rate": 0.000186413564576974, "loss": 2.5806, "step": 30082 }, { "epoch": 0.81, "learning_rate": 0.00018636295924292633, "loss": 2.1606, "step": 30083 }, { "epoch": 0.81, "learning_rate": 0.00018631236007284746, "loss": 2.7471, "step": 30084 }, { "epoch": 0.81, "learning_rate": 0.00018626176706712072, "loss": 2.7794, "step": 30085 }, { "epoch": 0.81, "learning_rate": 0.00018621118022612925, "loss": 2.5032, "step": 30086 }, { "epoch": 0.81, "learning_rate": 0.00018616059955025644, "loss": 2.2091, "step": 30087 }, { "epoch": 0.81, "learning_rate": 0.0001861100250398857, "loss": 2.4209, "step": 30088 }, { "epoch": 0.81, "learning_rate": 0.0001860594566953996, "loss": 2.1668, "step": 30089 }, { "epoch": 0.81, "learning_rate": 0.00018600889451718183, "loss": 2.6572, "step": 30090 }, { "epoch": 0.81, "learning_rate": 0.00018595833850561493, "loss": 2.2555, "step": 30091 }, { "epoch": 0.81, "learning_rate": 0.00018590778866108205, "loss": 2.2555, "step": 30092 }, { "epoch": 0.81, "learning_rate": 0.00018585724498396627, "loss": 2.7303, "step": 30093 }, { "epoch": 0.81, "learning_rate": 0.00018580670747465035, "loss": 2.7089, "step": 30094 }, { "epoch": 0.81, "learning_rate": 0.00018575617613351736, "loss": 1.7394, "step": 30095 }, { "epoch": 0.81, "learning_rate": 0.00018570565096095028, "loss": 2.4751, "step": 30096 }, { "epoch": 0.81, "learning_rate": 0.0001856551319573312, "loss": 2.3589, "step": 30097 }, { "epoch": 0.81, "learning_rate": 0.00018560461912304338, "loss": 2.6766, "step": 30098 }, { "epoch": 0.81, "learning_rate": 0.00018555411245846931, "loss": 2.5198, "step": 30099 }, { "epoch": 0.81, "learning_rate": 0.0001855036119639917, "loss": 2.7712, "step": 30100 }, { "epoch": 0.81, "learning_rate": 0.0001854531176399934, "loss": 2.8819, "step": 30101 }, { "epoch": 0.81, "learning_rate": 0.00018540262948685626, "loss": 1.8823, "step": 30102 }, { "epoch": 0.81, "learning_rate": 0.00018535214750496333, "loss": 2.5125, "step": 30103 }, { "epoch": 0.81, "learning_rate": 0.00018530167169469704, "loss": 2.2499, "step": 30104 }, { "epoch": 0.81, "learning_rate": 0.00018525120205643942, "loss": 2.318, "step": 30105 }, { "epoch": 0.81, "learning_rate": 0.00018520073859057274, "loss": 2.2014, "step": 30106 }, { "epoch": 0.81, "learning_rate": 0.00018515028129748013, "loss": 2.3405, "step": 30107 }, { "epoch": 0.81, "learning_rate": 0.00018509983017754296, "loss": 2.5993, "step": 30108 }, { "epoch": 0.81, "learning_rate": 0.0001850493852311441, "loss": 2.7174, "step": 30109 }, { "epoch": 0.81, "learning_rate": 0.00018499894645866523, "loss": 2.6563, "step": 30110 }, { "epoch": 0.81, "learning_rate": 0.0001849485138604885, "loss": 2.5207, "step": 30111 }, { "epoch": 0.81, "learning_rate": 0.00018489808743699622, "loss": 2.6573, "step": 30112 }, { "epoch": 0.81, "learning_rate": 0.00018484766718857026, "loss": 2.8549, "step": 30113 }, { "epoch": 0.81, "learning_rate": 0.00018479725311559259, "loss": 2.4684, "step": 30114 }, { "epoch": 0.81, "learning_rate": 0.00018474684521844554, "loss": 2.7006, "step": 30115 }, { "epoch": 0.81, "learning_rate": 0.00018469644349751034, "loss": 2.6005, "step": 30116 }, { "epoch": 0.81, "learning_rate": 0.0001846460479531693, "loss": 2.4244, "step": 30117 }, { "epoch": 0.81, "learning_rate": 0.00018459565858580386, "loss": 2.3263, "step": 30118 }, { "epoch": 0.81, "learning_rate": 0.00018454527539579568, "loss": 2.3311, "step": 30119 }, { "epoch": 0.81, "learning_rate": 0.00018449489838352718, "loss": 2.7792, "step": 30120 }, { "epoch": 0.81, "learning_rate": 0.00018444452754937934, "loss": 2.3707, "step": 30121 }, { "epoch": 0.81, "learning_rate": 0.0001843941628937339, "loss": 2.4327, "step": 30122 }, { "epoch": 0.81, "learning_rate": 0.00018434380441697274, "loss": 2.2982, "step": 30123 }, { "epoch": 0.81, "learning_rate": 0.0001842934521194768, "loss": 2.5271, "step": 30124 }, { "epoch": 0.81, "learning_rate": 0.00018424310600162786, "loss": 2.3213, "step": 30125 }, { "epoch": 0.81, "learning_rate": 0.00018419276606380718, "loss": 2.9274, "step": 30126 }, { "epoch": 0.81, "learning_rate": 0.00018414243230639637, "loss": 2.4739, "step": 30127 }, { "epoch": 0.81, "learning_rate": 0.0001840921047297769, "loss": 2.5811, "step": 30128 }, { "epoch": 0.81, "learning_rate": 0.00018404178333432953, "loss": 2.757, "step": 30129 }, { "epoch": 0.81, "learning_rate": 0.00018399146812043567, "loss": 2.4859, "step": 30130 }, { "epoch": 0.81, "learning_rate": 0.00018394115908847687, "loss": 2.1219, "step": 30131 }, { "epoch": 0.81, "learning_rate": 0.0001838908562388334, "loss": 2.2014, "step": 30132 }, { "epoch": 0.81, "learning_rate": 0.0001838405595718874, "loss": 2.2087, "step": 30133 }, { "epoch": 0.81, "learning_rate": 0.0001837902690880192, "loss": 2.1547, "step": 30134 }, { "epoch": 0.81, "learning_rate": 0.00018373998478761, "loss": 2.3594, "step": 30135 }, { "epoch": 0.81, "learning_rate": 0.0001836897066710409, "loss": 2.6322, "step": 30136 }, { "epoch": 0.81, "learning_rate": 0.00018363943473869248, "loss": 2.1944, "step": 30137 }, { "epoch": 0.81, "learning_rate": 0.00018358916899094567, "loss": 3.2233, "step": 30138 }, { "epoch": 0.81, "learning_rate": 0.0001835389094281814, "loss": 2.1989, "step": 30139 }, { "epoch": 0.81, "learning_rate": 0.00018348865605078048, "loss": 2.4006, "step": 30140 }, { "epoch": 0.81, "learning_rate": 0.00018343840885912366, "loss": 2.2577, "step": 30141 }, { "epoch": 0.81, "learning_rate": 0.00018338816785359126, "loss": 2.2958, "step": 30142 }, { "epoch": 0.81, "learning_rate": 0.00018333793303456402, "loss": 2.5131, "step": 30143 }, { "epoch": 0.81, "learning_rate": 0.00018328770440242291, "loss": 2.407, "step": 30144 }, { "epoch": 0.81, "learning_rate": 0.00018323748195754762, "loss": 2.3237, "step": 30145 }, { "epoch": 0.81, "learning_rate": 0.0001831872657003194, "loss": 2.5609, "step": 30146 }, { "epoch": 0.81, "learning_rate": 0.0001831370556311187, "loss": 2.0067, "step": 30147 }, { "epoch": 0.81, "learning_rate": 0.00018308685175032536, "loss": 2.7281, "step": 30148 }, { "epoch": 0.81, "learning_rate": 0.00018303665405831993, "loss": 2.6164, "step": 30149 }, { "epoch": 0.81, "learning_rate": 0.00018298646255548312, "loss": 2.6616, "step": 30150 }, { "epoch": 0.81, "learning_rate": 0.00018293627724219442, "loss": 2.1417, "step": 30151 }, { "epoch": 0.81, "learning_rate": 0.0001828860981188345, "loss": 2.6057, "step": 30152 }, { "epoch": 0.81, "learning_rate": 0.0001828359251857834, "loss": 2.4857, "step": 30153 }, { "epoch": 0.81, "learning_rate": 0.00018278575844342116, "loss": 3.0918, "step": 30154 }, { "epoch": 0.81, "learning_rate": 0.00018273559789212823, "loss": 2.833, "step": 30155 }, { "epoch": 0.81, "learning_rate": 0.000182685443532284, "loss": 2.4711, "step": 30156 }, { "epoch": 0.81, "learning_rate": 0.00018263529536426883, "loss": 2.0125, "step": 30157 }, { "epoch": 0.81, "learning_rate": 0.0001825851533884624, "loss": 2.4237, "step": 30158 }, { "epoch": 0.81, "learning_rate": 0.0001825350176052447, "loss": 2.5307, "step": 30159 }, { "epoch": 0.81, "learning_rate": 0.00018248488801499597, "loss": 2.5011, "step": 30160 }, { "epoch": 0.81, "learning_rate": 0.00018243476461809517, "loss": 2.5738, "step": 30161 }, { "epoch": 0.81, "learning_rate": 0.00018238464741492254, "loss": 2.3839, "step": 30162 }, { "epoch": 0.81, "learning_rate": 0.00018233453640585783, "loss": 2.6712, "step": 30163 }, { "epoch": 0.81, "learning_rate": 0.00018228443159128016, "loss": 2.5395, "step": 30164 }, { "epoch": 0.81, "learning_rate": 0.00018223433297156954, "loss": 2.5663, "step": 30165 }, { "epoch": 0.81, "learning_rate": 0.00018218424054710548, "loss": 2.2055, "step": 30166 }, { "epoch": 0.81, "learning_rate": 0.00018213415431826729, "loss": 2.274, "step": 30167 }, { "epoch": 0.81, "learning_rate": 0.00018208407428543482, "loss": 3.0594, "step": 30168 }, { "epoch": 0.81, "learning_rate": 0.00018203400044898688, "loss": 2.4113, "step": 30169 }, { "epoch": 0.81, "learning_rate": 0.00018198393280930314, "loss": 1.9003, "step": 30170 }, { "epoch": 0.81, "learning_rate": 0.00018193387136676288, "loss": 2.7268, "step": 30171 }, { "epoch": 0.81, "learning_rate": 0.0001818838161217453, "loss": 2.6537, "step": 30172 }, { "epoch": 0.81, "learning_rate": 0.00018183376707462973, "loss": 2.2143, "step": 30173 }, { "epoch": 0.81, "learning_rate": 0.00018178372422579547, "loss": 2.4637, "step": 30174 }, { "epoch": 0.81, "learning_rate": 0.00018173368757562125, "loss": 2.2474, "step": 30175 }, { "epoch": 0.81, "learning_rate": 0.00018168365712448653, "loss": 2.3916, "step": 30176 }, { "epoch": 0.81, "learning_rate": 0.0001816336328727699, "loss": 2.6331, "step": 30177 }, { "epoch": 0.81, "learning_rate": 0.0001815836148208505, "loss": 2.9757, "step": 30178 }, { "epoch": 0.81, "learning_rate": 0.00018153360296910737, "loss": 2.1981, "step": 30179 }, { "epoch": 0.81, "learning_rate": 0.0001814835973179193, "loss": 2.4772, "step": 30180 }, { "epoch": 0.81, "learning_rate": 0.00018143359786766523, "loss": 2.4126, "step": 30181 }, { "epoch": 0.81, "learning_rate": 0.00018138360461872406, "loss": 2.3775, "step": 30182 }, { "epoch": 0.81, "learning_rate": 0.00018133361757147404, "loss": 2.6414, "step": 30183 }, { "epoch": 0.81, "learning_rate": 0.0001812836367262942, "loss": 2.6366, "step": 30184 }, { "epoch": 0.81, "learning_rate": 0.00018123366208356329, "loss": 2.4611, "step": 30185 }, { "epoch": 0.81, "learning_rate": 0.00018118369364365962, "loss": 2.6353, "step": 30186 }, { "epoch": 0.81, "learning_rate": 0.00018113373140696222, "loss": 1.7445, "step": 30187 }, { "epoch": 0.81, "learning_rate": 0.00018108377537384902, "loss": 2.0926, "step": 30188 }, { "epoch": 0.81, "learning_rate": 0.00018103382554469872, "loss": 2.9859, "step": 30189 }, { "epoch": 0.81, "learning_rate": 0.00018098388191989002, "loss": 2.617, "step": 30190 }, { "epoch": 0.81, "learning_rate": 0.00018093394449980073, "loss": 1.8185, "step": 30191 }, { "epoch": 0.81, "learning_rate": 0.00018088401328480907, "loss": 2.3174, "step": 30192 }, { "epoch": 0.81, "learning_rate": 0.00018083408827529435, "loss": 2.1403, "step": 30193 }, { "epoch": 0.81, "learning_rate": 0.0001807841694716338, "loss": 2.7483, "step": 30194 }, { "epoch": 0.81, "learning_rate": 0.0001807342568742062, "loss": 2.4395, "step": 30195 }, { "epoch": 0.81, "learning_rate": 0.00018068435048338916, "loss": 2.3637, "step": 30196 }, { "epoch": 0.81, "learning_rate": 0.00018063445029956095, "loss": 2.6182, "step": 30197 }, { "epoch": 0.81, "learning_rate": 0.00018058455632309967, "loss": 2.4747, "step": 30198 }, { "epoch": 0.81, "learning_rate": 0.00018053466855438328, "loss": 2.4889, "step": 30199 }, { "epoch": 0.81, "learning_rate": 0.00018048478699378979, "loss": 2.5492, "step": 30200 }, { "epoch": 0.81, "learning_rate": 0.00018043491164169723, "loss": 2.3962, "step": 30201 }, { "epoch": 0.81, "learning_rate": 0.0001803850424984831, "loss": 2.5968, "step": 30202 }, { "epoch": 0.81, "learning_rate": 0.0001803351795645255, "loss": 2.4234, "step": 30203 }, { "epoch": 0.81, "learning_rate": 0.00018028532284020148, "loss": 2.7203, "step": 30204 }, { "epoch": 0.81, "learning_rate": 0.00018023547232588966, "loss": 2.3696, "step": 30205 }, { "epoch": 0.81, "learning_rate": 0.0001801856280219676, "loss": 2.2289, "step": 30206 }, { "epoch": 0.81, "learning_rate": 0.0001801357899288124, "loss": 2.4047, "step": 30207 }, { "epoch": 0.81, "learning_rate": 0.00018008595804680182, "loss": 2.048, "step": 30208 }, { "epoch": 0.81, "learning_rate": 0.00018003613237631378, "loss": 2.4183, "step": 30209 }, { "epoch": 0.81, "learning_rate": 0.00017998631291772505, "loss": 2.5004, "step": 30210 }, { "epoch": 0.81, "learning_rate": 0.00017993649967141346, "loss": 2.3936, "step": 30211 }, { "epoch": 0.81, "learning_rate": 0.00017988669263775637, "loss": 2.0672, "step": 30212 }, { "epoch": 0.81, "learning_rate": 0.00017983689181713103, "loss": 2.6203, "step": 30213 }, { "epoch": 0.81, "learning_rate": 0.00017978709720991505, "loss": 2.679, "step": 30214 }, { "epoch": 0.81, "learning_rate": 0.0001797373088164851, "loss": 2.1082, "step": 30215 }, { "epoch": 0.81, "learning_rate": 0.00017968752663721866, "loss": 2.0523, "step": 30216 }, { "epoch": 0.81, "learning_rate": 0.00017963775067249277, "loss": 2.4921, "step": 30217 }, { "epoch": 0.81, "learning_rate": 0.0001795879809226847, "loss": 2.2847, "step": 30218 }, { "epoch": 0.81, "learning_rate": 0.00017953821738817143, "loss": 2.5646, "step": 30219 }, { "epoch": 0.81, "learning_rate": 0.00017948846006933018, "loss": 2.5462, "step": 30220 }, { "epoch": 0.81, "learning_rate": 0.00017943870896653736, "loss": 2.1735, "step": 30221 }, { "epoch": 0.81, "learning_rate": 0.00017938896408017046, "loss": 2.5401, "step": 30222 }, { "epoch": 0.81, "learning_rate": 0.00017933922541060588, "loss": 2.804, "step": 30223 }, { "epoch": 0.81, "learning_rate": 0.0001792894929582205, "loss": 2.5188, "step": 30224 }, { "epoch": 0.81, "learning_rate": 0.00017923976672339128, "loss": 2.4342, "step": 30225 }, { "epoch": 0.81, "learning_rate": 0.00017919004670649473, "loss": 2.7693, "step": 30226 }, { "epoch": 0.81, "learning_rate": 0.00017914033290790775, "loss": 2.5935, "step": 30227 }, { "epoch": 0.81, "learning_rate": 0.00017909062532800712, "loss": 2.4062, "step": 30228 }, { "epoch": 0.81, "learning_rate": 0.00017904092396716875, "loss": 2.6574, "step": 30229 }, { "epoch": 0.81, "learning_rate": 0.00017899122882576967, "loss": 2.1151, "step": 30230 }, { "epoch": 0.81, "learning_rate": 0.00017894153990418628, "loss": 2.5814, "step": 30231 }, { "epoch": 0.81, "learning_rate": 0.000178891857202795, "loss": 2.6485, "step": 30232 }, { "epoch": 0.81, "learning_rate": 0.00017884218072197235, "loss": 2.652, "step": 30233 }, { "epoch": 0.81, "learning_rate": 0.00017879251046209433, "loss": 2.4177, "step": 30234 }, { "epoch": 0.81, "learning_rate": 0.00017874284642353745, "loss": 2.3854, "step": 30235 }, { "epoch": 0.81, "learning_rate": 0.00017869318860667827, "loss": 2.3397, "step": 30236 }, { "epoch": 0.81, "learning_rate": 0.0001786435370118923, "loss": 2.1581, "step": 30237 }, { "epoch": 0.81, "learning_rate": 0.00017859389163955608, "loss": 2.5392, "step": 30238 }, { "epoch": 0.81, "learning_rate": 0.00017854425249004568, "loss": 2.4203, "step": 30239 }, { "epoch": 0.81, "learning_rate": 0.00017849461956373714, "loss": 2.8836, "step": 30240 }, { "epoch": 0.81, "learning_rate": 0.0001784449928610068, "loss": 2.6844, "step": 30241 }, { "epoch": 0.81, "learning_rate": 0.00017839537238223003, "loss": 2.4076, "step": 30242 }, { "epoch": 0.81, "learning_rate": 0.00017834575812778296, "loss": 2.5781, "step": 30243 }, { "epoch": 0.81, "learning_rate": 0.00017829615009804157, "loss": 2.5284, "step": 30244 }, { "epoch": 0.81, "learning_rate": 0.0001782465482933817, "loss": 1.9661, "step": 30245 }, { "epoch": 0.81, "learning_rate": 0.00017819695271417923, "loss": 2.3224, "step": 30246 }, { "epoch": 0.81, "learning_rate": 0.00017814736336080962, "loss": 2.2748, "step": 30247 }, { "epoch": 0.81, "learning_rate": 0.00017809778023364852, "loss": 2.1163, "step": 30248 }, { "epoch": 0.81, "learning_rate": 0.0001780482033330719, "loss": 2.5574, "step": 30249 }, { "epoch": 0.81, "learning_rate": 0.00017799863265945503, "loss": 2.3974, "step": 30250 }, { "epoch": 0.81, "learning_rate": 0.00017794906821317326, "loss": 2.1554, "step": 30251 }, { "epoch": 0.81, "learning_rate": 0.0001778995099946028, "loss": 2.1922, "step": 30252 }, { "epoch": 0.81, "learning_rate": 0.00017784995800411852, "loss": 2.5485, "step": 30253 }, { "epoch": 0.81, "learning_rate": 0.00017780041224209586, "loss": 2.5876, "step": 30254 }, { "epoch": 0.81, "learning_rate": 0.00017775087270891066, "loss": 2.8157, "step": 30255 }, { "epoch": 0.81, "learning_rate": 0.0001777013394049376, "loss": 2.7793, "step": 30256 }, { "epoch": 0.81, "learning_rate": 0.00017765181233055205, "loss": 2.3868, "step": 30257 }, { "epoch": 0.81, "learning_rate": 0.0001776022914861295, "loss": 2.8365, "step": 30258 }, { "epoch": 0.81, "learning_rate": 0.00017755277687204484, "loss": 2.4375, "step": 30259 }, { "epoch": 0.81, "learning_rate": 0.0001775032684886736, "loss": 2.7784, "step": 30260 }, { "epoch": 0.81, "learning_rate": 0.0001774537663363903, "loss": 2.3889, "step": 30261 }, { "epoch": 0.81, "learning_rate": 0.00017740427041557016, "loss": 2.2145, "step": 30262 }, { "epoch": 0.81, "learning_rate": 0.0001773547807265885, "loss": 2.3814, "step": 30263 }, { "epoch": 0.81, "learning_rate": 0.0001773052972698195, "loss": 2.0265, "step": 30264 }, { "epoch": 0.81, "learning_rate": 0.0001772558200456389, "loss": 2.3493, "step": 30265 }, { "epoch": 0.81, "learning_rate": 0.0001772063490544209, "loss": 2.4764, "step": 30266 }, { "epoch": 0.81, "learning_rate": 0.0001771568842965404, "loss": 2.366, "step": 30267 }, { "epoch": 0.81, "learning_rate": 0.0001771074257723726, "loss": 2.3415, "step": 30268 }, { "epoch": 0.81, "learning_rate": 0.00017705797348229157, "loss": 2.4134, "step": 30269 }, { "epoch": 0.81, "learning_rate": 0.00017700852742667217, "loss": 2.5081, "step": 30270 }, { "epoch": 0.81, "learning_rate": 0.00017695908760588896, "loss": 2.1311, "step": 30271 }, { "epoch": 0.81, "learning_rate": 0.00017690965402031666, "loss": 2.2186, "step": 30272 }, { "epoch": 0.81, "learning_rate": 0.00017686022667032987, "loss": 3.1558, "step": 30273 }, { "epoch": 0.81, "learning_rate": 0.0001768108055563027, "loss": 2.5089, "step": 30274 }, { "epoch": 0.81, "learning_rate": 0.00017676139067860952, "loss": 2.5469, "step": 30275 }, { "epoch": 0.81, "learning_rate": 0.00017671198203762518, "loss": 2.3399, "step": 30276 }, { "epoch": 0.81, "learning_rate": 0.00017666257963372322, "loss": 2.3625, "step": 30277 }, { "epoch": 0.81, "learning_rate": 0.0001766131834672786, "loss": 2.7095, "step": 30278 }, { "epoch": 0.81, "learning_rate": 0.00017656379353866547, "loss": 2.2826, "step": 30279 }, { "epoch": 0.81, "learning_rate": 0.0001765144098482576, "loss": 2.3766, "step": 30280 }, { "epoch": 0.81, "learning_rate": 0.00017646503239642964, "loss": 2.4025, "step": 30281 }, { "epoch": 0.81, "learning_rate": 0.00017641566118355511, "loss": 2.3115, "step": 30282 }, { "epoch": 0.81, "learning_rate": 0.00017636629621000822, "loss": 2.4656, "step": 30283 }, { "epoch": 0.81, "learning_rate": 0.00017631693747616306, "loss": 2.6227, "step": 30284 }, { "epoch": 0.81, "learning_rate": 0.00017626758498239358, "loss": 2.6081, "step": 30285 }, { "epoch": 0.81, "learning_rate": 0.0001762182387290735, "loss": 2.5218, "step": 30286 }, { "epoch": 0.81, "learning_rate": 0.00017616889871657705, "loss": 2.1519, "step": 30287 }, { "epoch": 0.81, "learning_rate": 0.0001761195649452775, "loss": 2.4127, "step": 30288 }, { "epoch": 0.81, "learning_rate": 0.00017607023741554907, "loss": 2.3262, "step": 30289 }, { "epoch": 0.81, "learning_rate": 0.00017602091612776473, "loss": 2.3518, "step": 30290 }, { "epoch": 0.81, "learning_rate": 0.00017597160108229882, "loss": 2.0759, "step": 30291 }, { "epoch": 0.81, "learning_rate": 0.00017592229227952506, "loss": 2.3834, "step": 30292 }, { "epoch": 0.81, "learning_rate": 0.00017587298971981637, "loss": 2.6933, "step": 30293 }, { "epoch": 0.81, "learning_rate": 0.00017582369340354666, "loss": 2.3907, "step": 30294 }, { "epoch": 0.81, "learning_rate": 0.0001757744033310894, "loss": 2.126, "step": 30295 }, { "epoch": 0.81, "learning_rate": 0.00017572511950281777, "loss": 2.3291, "step": 30296 }, { "epoch": 0.81, "learning_rate": 0.00017567584191910523, "loss": 2.5928, "step": 30297 }, { "epoch": 0.81, "learning_rate": 0.00017562657058032516, "loss": 2.5611, "step": 30298 }, { "epoch": 0.81, "learning_rate": 0.0001755773054868508, "loss": 2.3405, "step": 30299 }, { "epoch": 0.81, "learning_rate": 0.00017552804663905565, "loss": 3.0189, "step": 30300 }, { "epoch": 0.81, "learning_rate": 0.00017547879403731226, "loss": 2.2656, "step": 30301 }, { "epoch": 0.81, "learning_rate": 0.00017542954768199427, "loss": 2.3762, "step": 30302 }, { "epoch": 0.81, "learning_rate": 0.00017538030757347444, "loss": 2.364, "step": 30303 }, { "epoch": 0.81, "learning_rate": 0.0001753310737121261, "loss": 2.5572, "step": 30304 }, { "epoch": 0.81, "learning_rate": 0.0001752818460983221, "loss": 2.3246, "step": 30305 }, { "epoch": 0.81, "learning_rate": 0.00017523262473243562, "loss": 2.3866, "step": 30306 }, { "epoch": 0.81, "learning_rate": 0.00017518340961483902, "loss": 2.3988, "step": 30307 }, { "epoch": 0.81, "learning_rate": 0.0001751342007459058, "loss": 2.2731, "step": 30308 }, { "epoch": 0.81, "learning_rate": 0.00017508499812600808, "loss": 2.3314, "step": 30309 }, { "epoch": 0.81, "learning_rate": 0.00017503580175551892, "loss": 2.563, "step": 30310 }, { "epoch": 0.81, "learning_rate": 0.000174986611634811, "loss": 2.8642, "step": 30311 }, { "epoch": 0.81, "learning_rate": 0.00017493742776425713, "loss": 2.0541, "step": 30312 }, { "epoch": 0.81, "learning_rate": 0.0001748882501442297, "loss": 2.5008, "step": 30313 }, { "epoch": 0.81, "learning_rate": 0.00017483907877510163, "loss": 2.3163, "step": 30314 }, { "epoch": 0.81, "learning_rate": 0.00017478991365724495, "loss": 2.4645, "step": 30315 }, { "epoch": 0.81, "learning_rate": 0.00017474075479103235, "loss": 2.3724, "step": 30316 }, { "epoch": 0.81, "learning_rate": 0.00017469160217683632, "loss": 2.296, "step": 30317 }, { "epoch": 0.81, "learning_rate": 0.00017464245581502903, "loss": 2.4149, "step": 30318 }, { "epoch": 0.81, "learning_rate": 0.00017459331570598323, "loss": 2.4066, "step": 30319 }, { "epoch": 0.81, "learning_rate": 0.0001745441818500707, "loss": 2.3623, "step": 30320 }, { "epoch": 0.81, "learning_rate": 0.00017449505424766389, "loss": 2.3984, "step": 30321 }, { "epoch": 0.81, "learning_rate": 0.00017444593289913513, "loss": 2.2669, "step": 30322 }, { "epoch": 0.81, "learning_rate": 0.00017439681780485617, "loss": 2.5867, "step": 30323 }, { "epoch": 0.81, "learning_rate": 0.00017434770896519936, "loss": 3.051, "step": 30324 }, { "epoch": 0.81, "learning_rate": 0.00017429860638053663, "loss": 2.3934, "step": 30325 }, { "epoch": 0.81, "learning_rate": 0.00017424951005124, "loss": 2.4068, "step": 30326 }, { "epoch": 0.82, "learning_rate": 0.00017420041997768176, "loss": 2.4405, "step": 30327 }, { "epoch": 0.82, "learning_rate": 0.00017415133616023327, "loss": 2.7745, "step": 30328 }, { "epoch": 0.82, "learning_rate": 0.00017410225859926666, "loss": 2.2681, "step": 30329 }, { "epoch": 0.82, "learning_rate": 0.0001740531872951535, "loss": 2.5441, "step": 30330 }, { "epoch": 0.82, "learning_rate": 0.00017400412224826588, "loss": 2.6127, "step": 30331 }, { "epoch": 0.82, "learning_rate": 0.00017395506345897527, "loss": 2.4925, "step": 30332 }, { "epoch": 0.82, "learning_rate": 0.00017390601092765379, "loss": 2.315, "step": 30333 }, { "epoch": 0.82, "learning_rate": 0.00017385696465467226, "loss": 2.334, "step": 30334 }, { "epoch": 0.82, "learning_rate": 0.00017380792464040306, "loss": 2.5026, "step": 30335 }, { "epoch": 0.82, "learning_rate": 0.000173758890885217, "loss": 2.5189, "step": 30336 }, { "epoch": 0.82, "learning_rate": 0.00017370986338948558, "loss": 3.0224, "step": 30337 }, { "epoch": 0.82, "learning_rate": 0.00017366084215358102, "loss": 2.3199, "step": 30338 }, { "epoch": 0.82, "learning_rate": 0.00017361182717787405, "loss": 2.8429, "step": 30339 }, { "epoch": 0.82, "learning_rate": 0.00017356281846273602, "loss": 2.3361, "step": 30340 }, { "epoch": 0.82, "learning_rate": 0.00017351381600853855, "loss": 2.784, "step": 30341 }, { "epoch": 0.82, "learning_rate": 0.00017346481981565242, "loss": 2.7415, "step": 30342 }, { "epoch": 0.82, "learning_rate": 0.00017341582988444914, "loss": 2.3359, "step": 30343 }, { "epoch": 0.82, "learning_rate": 0.00017336684621529962, "loss": 2.7904, "step": 30344 }, { "epoch": 0.82, "learning_rate": 0.00017331786880857525, "loss": 2.2668, "step": 30345 }, { "epoch": 0.82, "learning_rate": 0.00017326889766464704, "loss": 2.2177, "step": 30346 }, { "epoch": 0.82, "learning_rate": 0.0001732199327838856, "loss": 2.8539, "step": 30347 }, { "epoch": 0.82, "learning_rate": 0.00017317097416666216, "loss": 2.5304, "step": 30348 }, { "epoch": 0.82, "learning_rate": 0.00017312202181334779, "loss": 2.6477, "step": 30349 }, { "epoch": 0.82, "learning_rate": 0.00017307307572431274, "loss": 2.9752, "step": 30350 }, { "epoch": 0.82, "learning_rate": 0.0001730241358999287, "loss": 2.2131, "step": 30351 }, { "epoch": 0.82, "learning_rate": 0.00017297520234056573, "loss": 2.2809, "step": 30352 }, { "epoch": 0.82, "learning_rate": 0.00017292627504659474, "loss": 2.3195, "step": 30353 }, { "epoch": 0.82, "learning_rate": 0.00017287735401838667, "loss": 2.7501, "step": 30354 }, { "epoch": 0.82, "learning_rate": 0.00017282843925631164, "loss": 2.9161, "step": 30355 }, { "epoch": 0.82, "learning_rate": 0.0001727795307607405, "loss": 2.5388, "step": 30356 }, { "epoch": 0.82, "learning_rate": 0.0001727306285320437, "loss": 2.2255, "step": 30357 }, { "epoch": 0.82, "learning_rate": 0.00017268173257059172, "loss": 2.2987, "step": 30358 }, { "epoch": 0.82, "learning_rate": 0.0001726328428767554, "loss": 2.6556, "step": 30359 }, { "epoch": 0.82, "learning_rate": 0.00017258395945090433, "loss": 2.9363, "step": 30360 }, { "epoch": 0.82, "learning_rate": 0.00017253508229340942, "loss": 2.0884, "step": 30361 }, { "epoch": 0.82, "learning_rate": 0.00017248621140464072, "loss": 2.0524, "step": 30362 }, { "epoch": 0.82, "learning_rate": 0.00017243734678496847, "loss": 2.5885, "step": 30363 }, { "epoch": 0.82, "learning_rate": 0.00017238848843476295, "loss": 2.2397, "step": 30364 }, { "epoch": 0.82, "learning_rate": 0.00017233963635439464, "loss": 2.0873, "step": 30365 }, { "epoch": 0.82, "learning_rate": 0.0001722907905442329, "loss": 2.4739, "step": 30366 }, { "epoch": 0.82, "learning_rate": 0.00017224195100464825, "loss": 2.1218, "step": 30367 }, { "epoch": 0.82, "learning_rate": 0.00017219311773601076, "loss": 2.5247, "step": 30368 }, { "epoch": 0.82, "learning_rate": 0.00017214429073868998, "loss": 2.4579, "step": 30369 }, { "epoch": 0.82, "learning_rate": 0.00017209547001305602, "loss": 2.3784, "step": 30370 }, { "epoch": 0.82, "learning_rate": 0.00017204665555947885, "loss": 2.426, "step": 30371 }, { "epoch": 0.82, "learning_rate": 0.00017199784737832814, "loss": 2.6388, "step": 30372 }, { "epoch": 0.82, "learning_rate": 0.0001719490454699739, "loss": 2.6412, "step": 30373 }, { "epoch": 0.82, "learning_rate": 0.00017190024983478546, "loss": 2.4978, "step": 30374 }, { "epoch": 0.82, "learning_rate": 0.0001718514604731327, "loss": 2.6696, "step": 30375 }, { "epoch": 0.82, "learning_rate": 0.00017180267738538523, "loss": 2.0627, "step": 30376 }, { "epoch": 0.82, "learning_rate": 0.00017175390057191253, "loss": 2.787, "step": 30377 }, { "epoch": 0.82, "learning_rate": 0.00017170513003308453, "loss": 2.6186, "step": 30378 }, { "epoch": 0.82, "learning_rate": 0.00017165636576927013, "loss": 2.2437, "step": 30379 }, { "epoch": 0.82, "learning_rate": 0.00017160760778083895, "loss": 2.2515, "step": 30380 }, { "epoch": 0.82, "learning_rate": 0.00017155885606816068, "loss": 2.2854, "step": 30381 }, { "epoch": 0.82, "learning_rate": 0.00017151011063160415, "loss": 2.6914, "step": 30382 }, { "epoch": 0.82, "learning_rate": 0.00017146137147153873, "loss": 2.3576, "step": 30383 }, { "epoch": 0.82, "learning_rate": 0.00017141263858833422, "loss": 2.3133, "step": 30384 }, { "epoch": 0.82, "learning_rate": 0.00017136391198235924, "loss": 2.8342, "step": 30385 }, { "epoch": 0.82, "learning_rate": 0.00017131519165398336, "loss": 2.6545, "step": 30386 }, { "epoch": 0.82, "learning_rate": 0.00017126647760357517, "loss": 2.4464, "step": 30387 }, { "epoch": 0.82, "learning_rate": 0.00017121776983150406, "loss": 2.6056, "step": 30388 }, { "epoch": 0.82, "learning_rate": 0.00017116906833813885, "loss": 2.4382, "step": 30389 }, { "epoch": 0.82, "learning_rate": 0.00017112037312384866, "loss": 2.5851, "step": 30390 }, { "epoch": 0.82, "learning_rate": 0.00017107168418900232, "loss": 2.4269, "step": 30391 }, { "epoch": 0.82, "learning_rate": 0.00017102300153396888, "loss": 2.4236, "step": 30392 }, { "epoch": 0.82, "learning_rate": 0.00017097432515911682, "loss": 2.5688, "step": 30393 }, { "epoch": 0.82, "learning_rate": 0.00017092565506481527, "loss": 2.2267, "step": 30394 }, { "epoch": 0.82, "learning_rate": 0.00017087699125143253, "loss": 2.0002, "step": 30395 }, { "epoch": 0.82, "learning_rate": 0.00017082833371933714, "loss": 2.4287, "step": 30396 }, { "epoch": 0.82, "learning_rate": 0.00017077968246889853, "loss": 2.5409, "step": 30397 }, { "epoch": 0.82, "learning_rate": 0.00017073103750048468, "loss": 2.4827, "step": 30398 }, { "epoch": 0.82, "learning_rate": 0.00017068239881446414, "loss": 2.6208, "step": 30399 }, { "epoch": 0.82, "learning_rate": 0.00017063376641120564, "loss": 2.8466, "step": 30400 }, { "epoch": 0.82, "learning_rate": 0.0001705851402910774, "loss": 2.0655, "step": 30401 }, { "epoch": 0.82, "learning_rate": 0.00017053652045444768, "loss": 2.7093, "step": 30402 }, { "epoch": 0.82, "learning_rate": 0.00017048790690168513, "loss": 2.6816, "step": 30403 }, { "epoch": 0.82, "learning_rate": 0.00017043929963315773, "loss": 2.261, "step": 30404 }, { "epoch": 0.82, "learning_rate": 0.00017039069864923428, "loss": 2.7449, "step": 30405 }, { "epoch": 0.82, "learning_rate": 0.00017034210395028228, "loss": 2.1802, "step": 30406 }, { "epoch": 0.82, "learning_rate": 0.00017029351553667017, "loss": 2.5303, "step": 30407 }, { "epoch": 0.82, "learning_rate": 0.00017024493340876625, "loss": 2.83, "step": 30408 }, { "epoch": 0.82, "learning_rate": 0.00017019635756693795, "loss": 2.6094, "step": 30409 }, { "epoch": 0.82, "learning_rate": 0.00017014778801155385, "loss": 2.8356, "step": 30410 }, { "epoch": 0.82, "learning_rate": 0.00017009922474298212, "loss": 2.469, "step": 30411 }, { "epoch": 0.82, "learning_rate": 0.00017005066776158996, "loss": 2.3023, "step": 30412 }, { "epoch": 0.82, "learning_rate": 0.0001700021170677458, "loss": 2.3138, "step": 30413 }, { "epoch": 0.82, "learning_rate": 0.00016995357266181698, "loss": 2.5128, "step": 30414 }, { "epoch": 0.82, "learning_rate": 0.0001699050345441715, "loss": 2.3518, "step": 30415 }, { "epoch": 0.82, "learning_rate": 0.00016985650271517704, "loss": 2.517, "step": 30416 }, { "epoch": 0.82, "learning_rate": 0.00016980797717520136, "loss": 2.5682, "step": 30417 }, { "epoch": 0.82, "learning_rate": 0.0001697594579246119, "loss": 2.455, "step": 30418 }, { "epoch": 0.82, "learning_rate": 0.00016971094496377672, "loss": 2.3465, "step": 30419 }, { "epoch": 0.82, "learning_rate": 0.0001696624382930627, "loss": 2.4314, "step": 30420 }, { "epoch": 0.82, "learning_rate": 0.00016961393791283785, "loss": 2.6694, "step": 30421 }, { "epoch": 0.82, "learning_rate": 0.00016956544382346883, "loss": 2.8007, "step": 30422 }, { "epoch": 0.82, "learning_rate": 0.0001695169560253238, "loss": 2.5219, "step": 30423 }, { "epoch": 0.82, "learning_rate": 0.00016946847451877013, "loss": 2.7019, "step": 30424 }, { "epoch": 0.82, "learning_rate": 0.0001694199993041745, "loss": 2.1551, "step": 30425 }, { "epoch": 0.82, "learning_rate": 0.00016937153038190444, "loss": 2.4529, "step": 30426 }, { "epoch": 0.82, "learning_rate": 0.0001693230677523274, "loss": 2.1275, "step": 30427 }, { "epoch": 0.82, "learning_rate": 0.00016927461141581014, "loss": 2.1352, "step": 30428 }, { "epoch": 0.82, "learning_rate": 0.00016922616137271984, "loss": 2.5532, "step": 30429 }, { "epoch": 0.82, "learning_rate": 0.00016917771762342372, "loss": 2.2928, "step": 30430 }, { "epoch": 0.82, "learning_rate": 0.00016912928016828854, "loss": 2.7625, "step": 30431 }, { "epoch": 0.82, "learning_rate": 0.00016908084900768162, "loss": 2.2703, "step": 30432 }, { "epoch": 0.82, "learning_rate": 0.00016903242414196952, "loss": 2.4556, "step": 30433 }, { "epoch": 0.82, "learning_rate": 0.00016898400557151906, "loss": 2.2806, "step": 30434 }, { "epoch": 0.82, "learning_rate": 0.00016893559329669727, "loss": 2.5649, "step": 30435 }, { "epoch": 0.82, "learning_rate": 0.0001688871873178709, "loss": 2.2964, "step": 30436 }, { "epoch": 0.82, "learning_rate": 0.00016883878763540683, "loss": 2.2764, "step": 30437 }, { "epoch": 0.82, "learning_rate": 0.00016879039424967125, "loss": 2.5399, "step": 30438 }, { "epoch": 0.82, "learning_rate": 0.00016874200716103093, "loss": 2.5153, "step": 30439 }, { "epoch": 0.82, "learning_rate": 0.00016869362636985296, "loss": 2.2337, "step": 30440 }, { "epoch": 0.82, "learning_rate": 0.00016864525187650314, "loss": 2.0698, "step": 30441 }, { "epoch": 0.82, "learning_rate": 0.00016859688368134828, "loss": 2.3602, "step": 30442 }, { "epoch": 0.82, "learning_rate": 0.00016854852178475478, "loss": 2.7505, "step": 30443 }, { "epoch": 0.82, "learning_rate": 0.00016850016618708897, "loss": 2.9604, "step": 30444 }, { "epoch": 0.82, "learning_rate": 0.00016845181688871725, "loss": 2.7756, "step": 30445 }, { "epoch": 0.82, "learning_rate": 0.0001684034738900062, "loss": 2.2261, "step": 30446 }, { "epoch": 0.82, "learning_rate": 0.00016835513719132145, "loss": 2.4081, "step": 30447 }, { "epoch": 0.82, "learning_rate": 0.00016830680679302956, "loss": 2.383, "step": 30448 }, { "epoch": 0.82, "learning_rate": 0.0001682584826954966, "loss": 2.8324, "step": 30449 }, { "epoch": 0.82, "learning_rate": 0.0001682101648990887, "loss": 2.3097, "step": 30450 }, { "epoch": 0.82, "learning_rate": 0.00016816185340417212, "loss": 2.2771, "step": 30451 }, { "epoch": 0.82, "learning_rate": 0.00016811354821111226, "loss": 2.4418, "step": 30452 }, { "epoch": 0.82, "learning_rate": 0.00016806524932027556, "loss": 2.1743, "step": 30453 }, { "epoch": 0.82, "learning_rate": 0.000168016956732028, "loss": 2.515, "step": 30454 }, { "epoch": 0.82, "learning_rate": 0.00016796867044673492, "loss": 2.3993, "step": 30455 }, { "epoch": 0.82, "learning_rate": 0.0001679203904647625, "loss": 2.6069, "step": 30456 }, { "epoch": 0.82, "learning_rate": 0.00016787211678647652, "loss": 2.3465, "step": 30457 }, { "epoch": 0.82, "learning_rate": 0.0001678238494122425, "loss": 2.3622, "step": 30458 }, { "epoch": 0.82, "learning_rate": 0.00016777558834242645, "loss": 2.5666, "step": 30459 }, { "epoch": 0.82, "learning_rate": 0.00016772733357739355, "loss": 2.0918, "step": 30460 }, { "epoch": 0.82, "learning_rate": 0.00016767908511750962, "loss": 2.5497, "step": 30461 }, { "epoch": 0.82, "learning_rate": 0.00016763084296314012, "loss": 2.2727, "step": 30462 }, { "epoch": 0.82, "learning_rate": 0.00016758260711465046, "loss": 2.1407, "step": 30463 }, { "epoch": 0.82, "learning_rate": 0.00016753437757240642, "loss": 2.2901, "step": 30464 }, { "epoch": 0.82, "learning_rate": 0.00016748615433677294, "loss": 2.3665, "step": 30465 }, { "epoch": 0.82, "learning_rate": 0.00016743793740811542, "loss": 2.531, "step": 30466 }, { "epoch": 0.82, "learning_rate": 0.00016738972678679955, "loss": 2.3733, "step": 30467 }, { "epoch": 0.82, "learning_rate": 0.00016734152247319, "loss": 2.5322, "step": 30468 }, { "epoch": 0.82, "learning_rate": 0.00016729332446765188, "loss": 2.5503, "step": 30469 }, { "epoch": 0.82, "learning_rate": 0.0001672451327705513, "loss": 2.4603, "step": 30470 }, { "epoch": 0.82, "learning_rate": 0.00016719694738225234, "loss": 2.3175, "step": 30471 }, { "epoch": 0.82, "learning_rate": 0.00016714876830312077, "loss": 2.786, "step": 30472 }, { "epoch": 0.82, "learning_rate": 0.00016710059553352085, "loss": 2.6313, "step": 30473 }, { "epoch": 0.82, "learning_rate": 0.000167052429073818, "loss": 2.3792, "step": 30474 }, { "epoch": 0.82, "learning_rate": 0.00016700426892437705, "loss": 2.4417, "step": 30475 }, { "epoch": 0.82, "learning_rate": 0.00016695611508556275, "loss": 2.1956, "step": 30476 }, { "epoch": 0.82, "learning_rate": 0.00016690796755774006, "loss": 2.1832, "step": 30477 }, { "epoch": 0.82, "learning_rate": 0.00016685982634127383, "loss": 1.9757, "step": 30478 }, { "epoch": 0.82, "learning_rate": 0.00016681169143652842, "loss": 2.1599, "step": 30479 }, { "epoch": 0.82, "learning_rate": 0.00016676356284386863, "loss": 2.6902, "step": 30480 }, { "epoch": 0.82, "learning_rate": 0.0001667154405636594, "loss": 2.5664, "step": 30481 }, { "epoch": 0.82, "learning_rate": 0.00016666732459626454, "loss": 2.5172, "step": 30482 }, { "epoch": 0.82, "learning_rate": 0.00016661921494204958, "loss": 2.2285, "step": 30483 }, { "epoch": 0.82, "learning_rate": 0.00016657111160137806, "loss": 2.2648, "step": 30484 }, { "epoch": 0.82, "learning_rate": 0.00016652301457461494, "loss": 2.5763, "step": 30485 }, { "epoch": 0.82, "learning_rate": 0.00016647492386212458, "loss": 2.68, "step": 30486 }, { "epoch": 0.82, "learning_rate": 0.00016642683946427105, "loss": 2.9687, "step": 30487 }, { "epoch": 0.82, "learning_rate": 0.00016637876138141873, "loss": 2.2523, "step": 30488 }, { "epoch": 0.82, "learning_rate": 0.00016633068961393184, "loss": 2.9524, "step": 30489 }, { "epoch": 0.82, "learning_rate": 0.00016628262416217455, "loss": 2.6578, "step": 30490 }, { "epoch": 0.82, "learning_rate": 0.00016623456502651136, "loss": 2.3878, "step": 30491 }, { "epoch": 0.82, "learning_rate": 0.00016618651220730573, "loss": 2.6341, "step": 30492 }, { "epoch": 0.82, "learning_rate": 0.00016613846570492208, "loss": 2.4856, "step": 30493 }, { "epoch": 0.82, "learning_rate": 0.00016609042551972452, "loss": 2.4943, "step": 30494 }, { "epoch": 0.82, "learning_rate": 0.00016604239165207636, "loss": 2.6296, "step": 30495 }, { "epoch": 0.82, "learning_rate": 0.00016599436410234215, "loss": 2.3646, "step": 30496 }, { "epoch": 0.82, "learning_rate": 0.00016594634287088583, "loss": 2.4809, "step": 30497 }, { "epoch": 0.82, "learning_rate": 0.00016589832795807068, "loss": 2.5002, "step": 30498 }, { "epoch": 0.82, "learning_rate": 0.00016585031936426086, "loss": 2.8428, "step": 30499 }, { "epoch": 0.82, "learning_rate": 0.00016580231708981962, "loss": 2.1443, "step": 30500 }, { "epoch": 0.82, "learning_rate": 0.0001657543211351109, "loss": 2.71, "step": 30501 }, { "epoch": 0.82, "learning_rate": 0.0001657063315004984, "loss": 2.5173, "step": 30502 }, { "epoch": 0.82, "learning_rate": 0.0001656583481863454, "loss": 2.4055, "step": 30503 }, { "epoch": 0.82, "learning_rate": 0.0001656103711930157, "loss": 2.6534, "step": 30504 }, { "epoch": 0.82, "learning_rate": 0.0001655624005208729, "loss": 2.6012, "step": 30505 }, { "epoch": 0.82, "learning_rate": 0.00016551443617027995, "loss": 2.5807, "step": 30506 }, { "epoch": 0.82, "learning_rate": 0.00016546647814160055, "loss": 2.4638, "step": 30507 }, { "epoch": 0.82, "learning_rate": 0.0001654185264351975, "loss": 2.1204, "step": 30508 }, { "epoch": 0.82, "learning_rate": 0.00016537058105143477, "loss": 2.3869, "step": 30509 }, { "epoch": 0.82, "learning_rate": 0.0001653226419906755, "loss": 2.1779, "step": 30510 }, { "epoch": 0.82, "learning_rate": 0.00016527470925328246, "loss": 2.4702, "step": 30511 }, { "epoch": 0.82, "learning_rate": 0.000165226782839619, "loss": 2.4712, "step": 30512 }, { "epoch": 0.82, "learning_rate": 0.00016517886275004833, "loss": 2.1673, "step": 30513 }, { "epoch": 0.82, "learning_rate": 0.00016513094898493318, "loss": 2.3294, "step": 30514 }, { "epoch": 0.82, "learning_rate": 0.00016508304154463671, "loss": 2.2734, "step": 30515 }, { "epoch": 0.82, "learning_rate": 0.00016503514042952183, "loss": 2.2104, "step": 30516 }, { "epoch": 0.82, "learning_rate": 0.00016498724563995137, "loss": 2.7522, "step": 30517 }, { "epoch": 0.82, "learning_rate": 0.00016493935717628861, "loss": 2.4719, "step": 30518 }, { "epoch": 0.82, "learning_rate": 0.0001648914750388957, "loss": 2.6591, "step": 30519 }, { "epoch": 0.82, "learning_rate": 0.00016484359922813564, "loss": 2.3607, "step": 30520 }, { "epoch": 0.82, "learning_rate": 0.00016479572974437118, "loss": 2.4088, "step": 30521 }, { "epoch": 0.82, "learning_rate": 0.00016474786658796504, "loss": 2.1348, "step": 30522 }, { "epoch": 0.82, "learning_rate": 0.00016470000975927956, "loss": 2.699, "step": 30523 }, { "epoch": 0.82, "learning_rate": 0.00016465215925867783, "loss": 2.4055, "step": 30524 }, { "epoch": 0.82, "learning_rate": 0.00016460431508652173, "loss": 2.4697, "step": 30525 }, { "epoch": 0.82, "learning_rate": 0.00016455647724317423, "loss": 2.2487, "step": 30526 }, { "epoch": 0.82, "learning_rate": 0.00016450864572899727, "loss": 2.3962, "step": 30527 }, { "epoch": 0.82, "learning_rate": 0.00016446082054435317, "loss": 2.889, "step": 30528 }, { "epoch": 0.82, "learning_rate": 0.00016441300168960505, "loss": 2.5954, "step": 30529 }, { "epoch": 0.82, "learning_rate": 0.00016436518916511435, "loss": 2.2191, "step": 30530 }, { "epoch": 0.82, "learning_rate": 0.00016431738297124354, "loss": 2.4258, "step": 30531 }, { "epoch": 0.82, "learning_rate": 0.00016426958310835504, "loss": 2.7501, "step": 30532 }, { "epoch": 0.82, "learning_rate": 0.00016422178957681066, "loss": 2.3847, "step": 30533 }, { "epoch": 0.82, "learning_rate": 0.00016417400237697256, "loss": 2.3953, "step": 30534 }, { "epoch": 0.82, "learning_rate": 0.00016412622150920264, "loss": 2.1506, "step": 30535 }, { "epoch": 0.82, "learning_rate": 0.0001640784469738632, "loss": 2.7576, "step": 30536 }, { "epoch": 0.82, "learning_rate": 0.00016403067877131616, "loss": 2.4734, "step": 30537 }, { "epoch": 0.82, "learning_rate": 0.00016398291690192303, "loss": 3.0279, "step": 30538 }, { "epoch": 0.82, "learning_rate": 0.0001639351613660458, "loss": 2.2428, "step": 30539 }, { "epoch": 0.82, "learning_rate": 0.00016388741216404656, "loss": 2.7342, "step": 30540 }, { "epoch": 0.82, "learning_rate": 0.00016383966929628635, "loss": 2.4862, "step": 30541 }, { "epoch": 0.82, "learning_rate": 0.00016379193276312777, "loss": 2.2786, "step": 30542 }, { "epoch": 0.82, "learning_rate": 0.00016374420256493172, "loss": 2.9434, "step": 30543 }, { "epoch": 0.82, "learning_rate": 0.00016369647870206018, "loss": 2.6782, "step": 30544 }, { "epoch": 0.82, "learning_rate": 0.00016364876117487483, "loss": 2.7427, "step": 30545 }, { "epoch": 0.82, "learning_rate": 0.0001636010499837367, "loss": 2.3227, "step": 30546 }, { "epoch": 0.82, "learning_rate": 0.00016355334512900744, "loss": 2.0938, "step": 30547 }, { "epoch": 0.82, "learning_rate": 0.0001635056466110485, "loss": 2.0237, "step": 30548 }, { "epoch": 0.82, "learning_rate": 0.00016345795443022126, "loss": 2.159, "step": 30549 }, { "epoch": 0.82, "learning_rate": 0.00016341026858688722, "loss": 2.6129, "step": 30550 }, { "epoch": 0.82, "learning_rate": 0.00016336258908140723, "loss": 2.6098, "step": 30551 }, { "epoch": 0.82, "learning_rate": 0.00016331491591414261, "loss": 2.252, "step": 30552 }, { "epoch": 0.82, "learning_rate": 0.00016326724908545488, "loss": 2.1409, "step": 30553 }, { "epoch": 0.82, "learning_rate": 0.0001632195885957043, "loss": 2.4948, "step": 30554 }, { "epoch": 0.82, "learning_rate": 0.0001631719344452529, "loss": 2.7545, "step": 30555 }, { "epoch": 0.82, "learning_rate": 0.00016312428663446145, "loss": 2.4838, "step": 30556 }, { "epoch": 0.82, "learning_rate": 0.00016307664516369057, "loss": 2.6064, "step": 30557 }, { "epoch": 0.82, "learning_rate": 0.0001630290100333014, "loss": 2.6471, "step": 30558 }, { "epoch": 0.82, "learning_rate": 0.00016298138124365514, "loss": 2.5484, "step": 30559 }, { "epoch": 0.82, "learning_rate": 0.00016293375879511196, "loss": 2.6648, "step": 30560 }, { "epoch": 0.82, "learning_rate": 0.00016288614268803305, "loss": 2.7091, "step": 30561 }, { "epoch": 0.82, "learning_rate": 0.00016283853292277896, "loss": 2.5853, "step": 30562 }, { "epoch": 0.82, "learning_rate": 0.00016279092949971052, "loss": 2.2388, "step": 30563 }, { "epoch": 0.82, "learning_rate": 0.00016274333241918847, "loss": 2.4442, "step": 30564 }, { "epoch": 0.82, "learning_rate": 0.0001626957416815732, "loss": 2.4582, "step": 30565 }, { "epoch": 0.82, "learning_rate": 0.00016264815728722515, "loss": 2.2989, "step": 30566 }, { "epoch": 0.82, "learning_rate": 0.00016260057923650495, "loss": 2.4711, "step": 30567 }, { "epoch": 0.82, "learning_rate": 0.0001625530075297731, "loss": 2.5894, "step": 30568 }, { "epoch": 0.82, "learning_rate": 0.00016250544216739015, "loss": 2.8201, "step": 30569 }, { "epoch": 0.82, "learning_rate": 0.0001624578831497161, "loss": 2.3437, "step": 30570 }, { "epoch": 0.82, "learning_rate": 0.0001624103304771113, "loss": 2.2206, "step": 30571 }, { "epoch": 0.82, "learning_rate": 0.00016236278414993632, "loss": 2.5361, "step": 30572 }, { "epoch": 0.82, "learning_rate": 0.00016231524416855092, "loss": 2.1268, "step": 30573 }, { "epoch": 0.82, "learning_rate": 0.00016226771053331546, "loss": 2.3159, "step": 30574 }, { "epoch": 0.82, "learning_rate": 0.0001622201832445901, "loss": 2.7467, "step": 30575 }, { "epoch": 0.82, "learning_rate": 0.00016217266230273474, "loss": 2.7073, "step": 30576 }, { "epoch": 0.82, "learning_rate": 0.00016212514770810982, "loss": 2.3266, "step": 30577 }, { "epoch": 0.82, "learning_rate": 0.00016207763946107467, "loss": 2.3988, "step": 30578 }, { "epoch": 0.82, "learning_rate": 0.0001620301375619896, "loss": 2.4076, "step": 30579 }, { "epoch": 0.82, "learning_rate": 0.00016198264201121437, "loss": 2.2795, "step": 30580 }, { "epoch": 0.82, "learning_rate": 0.00016193515280910886, "loss": 2.9828, "step": 30581 }, { "epoch": 0.82, "learning_rate": 0.00016188766995603278, "loss": 2.6752, "step": 30582 }, { "epoch": 0.82, "learning_rate": 0.00016184019345234603, "loss": 2.2192, "step": 30583 }, { "epoch": 0.82, "learning_rate": 0.000161792723298408, "loss": 2.8598, "step": 30584 }, { "epoch": 0.82, "learning_rate": 0.00016174525949457863, "loss": 2.4691, "step": 30585 }, { "epoch": 0.82, "learning_rate": 0.00016169780204121698, "loss": 2.4184, "step": 30586 }, { "epoch": 0.82, "learning_rate": 0.0001616503509386831, "loss": 2.3012, "step": 30587 }, { "epoch": 0.82, "learning_rate": 0.00016160290618733608, "loss": 2.733, "step": 30588 }, { "epoch": 0.82, "learning_rate": 0.00016155546778753572, "loss": 2.6532, "step": 30589 }, { "epoch": 0.82, "learning_rate": 0.00016150803573964113, "loss": 2.3643, "step": 30590 }, { "epoch": 0.82, "learning_rate": 0.000161460610044012, "loss": 2.4831, "step": 30591 }, { "epoch": 0.82, "learning_rate": 0.00016141319070100713, "loss": 2.7684, "step": 30592 }, { "epoch": 0.82, "learning_rate": 0.00016136577771098604, "loss": 2.3054, "step": 30593 }, { "epoch": 0.82, "learning_rate": 0.00016131837107430792, "loss": 2.5655, "step": 30594 }, { "epoch": 0.82, "learning_rate": 0.0001612709707913318, "loss": 3.0282, "step": 30595 }, { "epoch": 0.82, "learning_rate": 0.00016122357686241707, "loss": 2.5927, "step": 30596 }, { "epoch": 0.82, "learning_rate": 0.00016117618928792243, "loss": 2.0448, "step": 30597 }, { "epoch": 0.82, "learning_rate": 0.00016112880806820696, "loss": 2.4579, "step": 30598 }, { "epoch": 0.82, "learning_rate": 0.00016108143320362988, "loss": 2.7391, "step": 30599 }, { "epoch": 0.82, "learning_rate": 0.0001610340646945496, "loss": 2.805, "step": 30600 }, { "epoch": 0.82, "learning_rate": 0.0001609867025413251, "loss": 2.4186, "step": 30601 }, { "epoch": 0.82, "learning_rate": 0.00016093934674431588, "loss": 2.278, "step": 30602 }, { "epoch": 0.82, "learning_rate": 0.00016089199730387983, "loss": 2.3336, "step": 30603 }, { "epoch": 0.82, "learning_rate": 0.0001608446542203762, "loss": 2.4864, "step": 30604 }, { "epoch": 0.82, "learning_rate": 0.00016079731749416316, "loss": 2.589, "step": 30605 }, { "epoch": 0.82, "learning_rate": 0.00016074998712559973, "loss": 2.4261, "step": 30606 }, { "epoch": 0.82, "learning_rate": 0.00016070266311504433, "loss": 2.6629, "step": 30607 }, { "epoch": 0.82, "learning_rate": 0.00016065534546285542, "loss": 2.5647, "step": 30608 }, { "epoch": 0.82, "learning_rate": 0.00016060803416939162, "loss": 2.8196, "step": 30609 }, { "epoch": 0.82, "learning_rate": 0.00016056072923501154, "loss": 2.4197, "step": 30610 }, { "epoch": 0.82, "learning_rate": 0.00016051343066007296, "loss": 2.9472, "step": 30611 }, { "epoch": 0.82, "learning_rate": 0.00016046613844493486, "loss": 2.4148, "step": 30612 }, { "epoch": 0.82, "learning_rate": 0.00016041885258995502, "loss": 2.7445, "step": 30613 }, { "epoch": 0.82, "learning_rate": 0.00016037157309549155, "loss": 2.6472, "step": 30614 }, { "epoch": 0.82, "learning_rate": 0.00016032429996190334, "loss": 2.7185, "step": 30615 }, { "epoch": 0.82, "learning_rate": 0.00016027703318954802, "loss": 2.6957, "step": 30616 }, { "epoch": 0.82, "learning_rate": 0.00016022977277878358, "loss": 2.6741, "step": 30617 }, { "epoch": 0.82, "learning_rate": 0.0001601825187299687, "loss": 2.7182, "step": 30618 }, { "epoch": 0.82, "learning_rate": 0.0001601352710434605, "loss": 2.3193, "step": 30619 }, { "epoch": 0.82, "learning_rate": 0.00016008802971961744, "loss": 2.5291, "step": 30620 }, { "epoch": 0.82, "learning_rate": 0.00016004079475879718, "loss": 2.2502, "step": 30621 }, { "epoch": 0.82, "learning_rate": 0.00015999356616135785, "loss": 2.4514, "step": 30622 }, { "epoch": 0.82, "learning_rate": 0.00015994634392765716, "loss": 2.9587, "step": 30623 }, { "epoch": 0.82, "learning_rate": 0.00015989912805805263, "loss": 2.1058, "step": 30624 }, { "epoch": 0.82, "learning_rate": 0.00015985191855290214, "loss": 2.3452, "step": 30625 }, { "epoch": 0.82, "learning_rate": 0.00015980471541256346, "loss": 2.3925, "step": 30626 }, { "epoch": 0.82, "learning_rate": 0.00015975751863739362, "loss": 2.0635, "step": 30627 }, { "epoch": 0.82, "learning_rate": 0.0001597103282277509, "loss": 2.8256, "step": 30628 }, { "epoch": 0.82, "learning_rate": 0.00015966314418399265, "loss": 2.4268, "step": 30629 }, { "epoch": 0.82, "learning_rate": 0.00015961596650647592, "loss": 2.5395, "step": 30630 }, { "epoch": 0.82, "learning_rate": 0.00015956879519555867, "loss": 2.7233, "step": 30631 }, { "epoch": 0.82, "learning_rate": 0.00015952163025159782, "loss": 2.85, "step": 30632 }, { "epoch": 0.82, "learning_rate": 0.00015947447167495067, "loss": 2.3071, "step": 30633 }, { "epoch": 0.82, "learning_rate": 0.00015942731946597477, "loss": 2.4377, "step": 30634 }, { "epoch": 0.82, "learning_rate": 0.0001593801736250272, "loss": 2.4604, "step": 30635 }, { "epoch": 0.82, "learning_rate": 0.00015933303415246514, "loss": 2.2933, "step": 30636 }, { "epoch": 0.82, "learning_rate": 0.00015928590104864594, "loss": 2.5007, "step": 30637 }, { "epoch": 0.82, "learning_rate": 0.0001592387743139262, "loss": 2.4776, "step": 30638 }, { "epoch": 0.82, "learning_rate": 0.0001591916539486634, "loss": 2.6047, "step": 30639 }, { "epoch": 0.82, "learning_rate": 0.00015914453995321387, "loss": 2.6479, "step": 30640 }, { "epoch": 0.82, "learning_rate": 0.00015909743232793517, "loss": 2.5866, "step": 30641 }, { "epoch": 0.82, "learning_rate": 0.00015905033107318435, "loss": 2.4656, "step": 30642 }, { "epoch": 0.82, "learning_rate": 0.00015900323618931757, "loss": 2.4034, "step": 30643 }, { "epoch": 0.82, "learning_rate": 0.00015895614767669187, "loss": 1.9134, "step": 30644 }, { "epoch": 0.82, "learning_rate": 0.0001589090655356642, "loss": 2.5793, "step": 30645 }, { "epoch": 0.82, "learning_rate": 0.00015886198976659095, "loss": 2.2494, "step": 30646 }, { "epoch": 0.82, "learning_rate": 0.00015881492036982892, "loss": 2.4701, "step": 30647 }, { "epoch": 0.82, "learning_rate": 0.00015876785734573461, "loss": 3.1595, "step": 30648 }, { "epoch": 0.82, "learning_rate": 0.00015872080069466454, "loss": 2.3559, "step": 30649 }, { "epoch": 0.82, "learning_rate": 0.00015867375041697562, "loss": 2.4336, "step": 30650 }, { "epoch": 0.82, "learning_rate": 0.00015862670651302369, "loss": 2.604, "step": 30651 }, { "epoch": 0.82, "learning_rate": 0.00015857966898316544, "loss": 2.3916, "step": 30652 }, { "epoch": 0.82, "learning_rate": 0.00015853263782775707, "loss": 2.4021, "step": 30653 }, { "epoch": 0.82, "learning_rate": 0.00015848561304715515, "loss": 2.5893, "step": 30654 }, { "epoch": 0.82, "learning_rate": 0.00015843859464171594, "loss": 1.8225, "step": 30655 }, { "epoch": 0.82, "learning_rate": 0.0001583915826117952, "loss": 2.4071, "step": 30656 }, { "epoch": 0.82, "learning_rate": 0.00015834457695774939, "loss": 2.4743, "step": 30657 }, { "epoch": 0.82, "learning_rate": 0.0001582975776799349, "loss": 2.2653, "step": 30658 }, { "epoch": 0.82, "learning_rate": 0.00015825058477870712, "loss": 2.4009, "step": 30659 }, { "epoch": 0.82, "learning_rate": 0.00015820359825442255, "loss": 2.3388, "step": 30660 }, { "epoch": 0.82, "learning_rate": 0.00015815661810743688, "loss": 2.8588, "step": 30661 }, { "epoch": 0.82, "learning_rate": 0.00015810964433810625, "loss": 2.4585, "step": 30662 }, { "epoch": 0.82, "learning_rate": 0.00015806267694678643, "loss": 2.4883, "step": 30663 }, { "epoch": 0.82, "learning_rate": 0.00015801571593383347, "loss": 2.6342, "step": 30664 }, { "epoch": 0.82, "learning_rate": 0.00015796876129960268, "loss": 2.5488, "step": 30665 }, { "epoch": 0.82, "learning_rate": 0.0001579218130444501, "loss": 2.1898, "step": 30666 }, { "epoch": 0.82, "learning_rate": 0.00015787487116873122, "loss": 2.3161, "step": 30667 }, { "epoch": 0.82, "learning_rate": 0.00015782793567280175, "loss": 2.5128, "step": 30668 }, { "epoch": 0.82, "learning_rate": 0.00015778100655701756, "loss": 2.7248, "step": 30669 }, { "epoch": 0.82, "learning_rate": 0.0001577340838217336, "loss": 2.2744, "step": 30670 }, { "epoch": 0.82, "learning_rate": 0.0001576871674673056, "loss": 2.2777, "step": 30671 }, { "epoch": 0.82, "learning_rate": 0.00015764025749408938, "loss": 2.2993, "step": 30672 }, { "epoch": 0.82, "learning_rate": 0.00015759335390243967, "loss": 2.6216, "step": 30673 }, { "epoch": 0.82, "learning_rate": 0.00015754645669271205, "loss": 2.5176, "step": 30674 }, { "epoch": 0.82, "learning_rate": 0.00015749956586526192, "loss": 2.5722, "step": 30675 }, { "epoch": 0.82, "learning_rate": 0.00015745268142044455, "loss": 2.6532, "step": 30676 }, { "epoch": 0.82, "learning_rate": 0.0001574058033586151, "loss": 2.3878, "step": 30677 }, { "epoch": 0.82, "learning_rate": 0.0001573589316801285, "loss": 2.1794, "step": 30678 }, { "epoch": 0.82, "learning_rate": 0.00015731206638534002, "loss": 2.7052, "step": 30679 }, { "epoch": 0.82, "learning_rate": 0.0001572652074746046, "loss": 2.3454, "step": 30680 }, { "epoch": 0.82, "learning_rate": 0.0001572183549482773, "loss": 2.8513, "step": 30681 }, { "epoch": 0.82, "learning_rate": 0.00015717150880671326, "loss": 2.5579, "step": 30682 }, { "epoch": 0.82, "learning_rate": 0.000157124669050267, "loss": 2.8089, "step": 30683 }, { "epoch": 0.82, "learning_rate": 0.00015707783567929357, "loss": 2.3443, "step": 30684 }, { "epoch": 0.82, "learning_rate": 0.000157031008694148, "loss": 1.9014, "step": 30685 }, { "epoch": 0.82, "learning_rate": 0.00015698418809518454, "loss": 2.5916, "step": 30686 }, { "epoch": 0.82, "learning_rate": 0.00015693737388275785, "loss": 2.5146, "step": 30687 }, { "epoch": 0.82, "learning_rate": 0.00015689056605722353, "loss": 2.7312, "step": 30688 }, { "epoch": 0.82, "learning_rate": 0.00015684376461893524, "loss": 2.5468, "step": 30689 }, { "epoch": 0.82, "learning_rate": 0.00015679696956824796, "loss": 2.5884, "step": 30690 }, { "epoch": 0.82, "learning_rate": 0.00015675018090551595, "loss": 2.3965, "step": 30691 }, { "epoch": 0.82, "learning_rate": 0.00015670339863109385, "loss": 2.3763, "step": 30692 }, { "epoch": 0.82, "learning_rate": 0.00015665662274533598, "loss": 2.9336, "step": 30693 }, { "epoch": 0.82, "learning_rate": 0.00015660985324859677, "loss": 2.1259, "step": 30694 }, { "epoch": 0.82, "learning_rate": 0.0001565630901412306, "loss": 2.3512, "step": 30695 }, { "epoch": 0.82, "learning_rate": 0.00015651633342359184, "loss": 2.705, "step": 30696 }, { "epoch": 0.82, "learning_rate": 0.0001564695830960342, "loss": 2.8536, "step": 30697 }, { "epoch": 0.82, "learning_rate": 0.00015642283915891252, "loss": 2.8199, "step": 30698 }, { "epoch": 0.82, "learning_rate": 0.0001563761016125802, "loss": 2.5682, "step": 30699 }, { "epoch": 0.83, "learning_rate": 0.00015632937045739181, "loss": 2.2867, "step": 30700 }, { "epoch": 0.83, "learning_rate": 0.00015628264569370165, "loss": 2.3932, "step": 30701 }, { "epoch": 0.83, "learning_rate": 0.00015623592732186297, "loss": 2.534, "step": 30702 }, { "epoch": 0.83, "learning_rate": 0.00015618921534223007, "loss": 2.5096, "step": 30703 }, { "epoch": 0.83, "learning_rate": 0.0001561425097551571, "loss": 2.391, "step": 30704 }, { "epoch": 0.83, "learning_rate": 0.0001560958105609973, "loss": 2.3607, "step": 30705 }, { "epoch": 0.83, "learning_rate": 0.00015604911776010487, "loss": 2.6274, "step": 30706 }, { "epoch": 0.83, "learning_rate": 0.0001560024313528333, "loss": 2.6235, "step": 30707 }, { "epoch": 0.83, "learning_rate": 0.00015595575133953653, "loss": 2.8426, "step": 30708 }, { "epoch": 0.83, "learning_rate": 0.0001559090777205683, "loss": 2.1013, "step": 30709 }, { "epoch": 0.83, "learning_rate": 0.00015586241049628168, "loss": 2.2089, "step": 30710 }, { "epoch": 0.83, "learning_rate": 0.0001558157496670306, "loss": 2.2951, "step": 30711 }, { "epoch": 0.83, "learning_rate": 0.0001557690952331685, "loss": 2.8085, "step": 30712 }, { "epoch": 0.83, "learning_rate": 0.0001557224471950488, "loss": 2.6139, "step": 30713 }, { "epoch": 0.83, "learning_rate": 0.00015567580555302484, "loss": 2.3472, "step": 30714 }, { "epoch": 0.83, "learning_rate": 0.00015562917030745028, "loss": 2.7565, "step": 30715 }, { "epoch": 0.83, "learning_rate": 0.0001555825414586779, "loss": 2.3641, "step": 30716 }, { "epoch": 0.83, "learning_rate": 0.00015553591900706144, "loss": 3.1807, "step": 30717 }, { "epoch": 0.83, "learning_rate": 0.00015548930295295371, "loss": 2.3411, "step": 30718 }, { "epoch": 0.83, "learning_rate": 0.00015544269329670801, "loss": 2.4873, "step": 30719 }, { "epoch": 0.83, "learning_rate": 0.0001553960900386775, "loss": 2.185, "step": 30720 }, { "epoch": 0.83, "learning_rate": 0.0001553494931792152, "loss": 2.5945, "step": 30721 }, { "epoch": 0.83, "learning_rate": 0.0001553029027186741, "loss": 2.4901, "step": 30722 }, { "epoch": 0.83, "learning_rate": 0.00015525631865740742, "loss": 2.4768, "step": 30723 }, { "epoch": 0.83, "learning_rate": 0.00015520974099576758, "loss": 2.7133, "step": 30724 }, { "epoch": 0.83, "learning_rate": 0.0001551631697341078, "loss": 2.2116, "step": 30725 }, { "epoch": 0.83, "learning_rate": 0.00015511660487278078, "loss": 2.5705, "step": 30726 }, { "epoch": 0.83, "learning_rate": 0.0001550700464121393, "loss": 2.454, "step": 30727 }, { "epoch": 0.83, "learning_rate": 0.00015502349435253627, "loss": 2.0162, "step": 30728 }, { "epoch": 0.83, "learning_rate": 0.000154976948694324, "loss": 2.5741, "step": 30729 }, { "epoch": 0.83, "learning_rate": 0.0001549304094378553, "loss": 2.6546, "step": 30730 }, { "epoch": 0.83, "learning_rate": 0.0001548838765834829, "loss": 2.4096, "step": 30731 }, { "epoch": 0.83, "learning_rate": 0.00015483735013155898, "loss": 2.2521, "step": 30732 }, { "epoch": 0.83, "learning_rate": 0.00015479083008243622, "loss": 2.3946, "step": 30733 }, { "epoch": 0.83, "learning_rate": 0.00015474431643646702, "loss": 2.3018, "step": 30734 }, { "epoch": 0.83, "learning_rate": 0.00015469780919400366, "loss": 2.7459, "step": 30735 }, { "epoch": 0.83, "learning_rate": 0.00015465130835539887, "loss": 2.2867, "step": 30736 }, { "epoch": 0.83, "learning_rate": 0.00015460481392100446, "loss": 2.922, "step": 30737 }, { "epoch": 0.83, "learning_rate": 0.0001545583258911728, "loss": 2.8294, "step": 30738 }, { "epoch": 0.83, "learning_rate": 0.00015451184426625608, "loss": 2.3458, "step": 30739 }, { "epoch": 0.83, "learning_rate": 0.00015446536904660646, "loss": 2.7255, "step": 30740 }, { "epoch": 0.83, "learning_rate": 0.0001544189002325761, "loss": 2.7809, "step": 30741 }, { "epoch": 0.83, "learning_rate": 0.00015437243782451715, "loss": 2.5173, "step": 30742 }, { "epoch": 0.83, "learning_rate": 0.00015432598182278125, "loss": 2.3855, "step": 30743 }, { "epoch": 0.83, "learning_rate": 0.00015427953222772072, "loss": 2.7025, "step": 30744 }, { "epoch": 0.83, "learning_rate": 0.000154233089039687, "loss": 2.6913, "step": 30745 }, { "epoch": 0.83, "learning_rate": 0.00015418665225903195, "loss": 2.5478, "step": 30746 }, { "epoch": 0.83, "learning_rate": 0.0001541402218861081, "loss": 2.8506, "step": 30747 }, { "epoch": 0.83, "learning_rate": 0.00015409379792126644, "loss": 2.7013, "step": 30748 }, { "epoch": 0.83, "learning_rate": 0.00015404738036485898, "loss": 2.1095, "step": 30749 }, { "epoch": 0.83, "learning_rate": 0.0001540009692172375, "loss": 2.5451, "step": 30750 }, { "epoch": 0.83, "learning_rate": 0.00015395456447875322, "loss": 2.299, "step": 30751 }, { "epoch": 0.83, "learning_rate": 0.000153908166149758, "loss": 2.4935, "step": 30752 }, { "epoch": 0.83, "learning_rate": 0.00015386177423060311, "loss": 2.9475, "step": 30753 }, { "epoch": 0.83, "learning_rate": 0.00015381538872164013, "loss": 2.291, "step": 30754 }, { "epoch": 0.83, "learning_rate": 0.0001537690096232208, "loss": 2.932, "step": 30755 }, { "epoch": 0.83, "learning_rate": 0.00015372263693569588, "loss": 2.117, "step": 30756 }, { "epoch": 0.83, "learning_rate": 0.00015367627065941702, "loss": 2.2541, "step": 30757 }, { "epoch": 0.83, "learning_rate": 0.00015362991079473565, "loss": 2.3664, "step": 30758 }, { "epoch": 0.83, "learning_rate": 0.00015358355734200224, "loss": 2.7321, "step": 30759 }, { "epoch": 0.83, "learning_rate": 0.00015353721030156897, "loss": 2.6094, "step": 30760 }, { "epoch": 0.83, "learning_rate": 0.00015349086967378622, "loss": 2.8577, "step": 30761 }, { "epoch": 0.83, "learning_rate": 0.00015344453545900526, "loss": 2.0334, "step": 30762 }, { "epoch": 0.83, "learning_rate": 0.0001533982076575775, "loss": 2.0389, "step": 30763 }, { "epoch": 0.83, "learning_rate": 0.0001533518862698532, "loss": 2.3494, "step": 30764 }, { "epoch": 0.83, "learning_rate": 0.0001533055712961837, "loss": 2.1984, "step": 30765 }, { "epoch": 0.83, "learning_rate": 0.0001532592627369198, "loss": 2.5333, "step": 30766 }, { "epoch": 0.83, "learning_rate": 0.0001532129605924124, "loss": 2.37, "step": 30767 }, { "epoch": 0.83, "learning_rate": 0.00015316666486301245, "loss": 2.8428, "step": 30768 }, { "epoch": 0.83, "learning_rate": 0.0001531203755490701, "loss": 2.3209, "step": 30769 }, { "epoch": 0.83, "learning_rate": 0.00015307409265093652, "loss": 2.1298, "step": 30770 }, { "epoch": 0.83, "learning_rate": 0.00015302781616896233, "loss": 2.2837, "step": 30771 }, { "epoch": 0.83, "learning_rate": 0.00015298154610349758, "loss": 2.3223, "step": 30772 }, { "epoch": 0.83, "learning_rate": 0.0001529352824548933, "loss": 2.4769, "step": 30773 }, { "epoch": 0.83, "learning_rate": 0.00015288902522350023, "loss": 2.1314, "step": 30774 }, { "epoch": 0.83, "learning_rate": 0.0001528427744096682, "loss": 2.7829, "step": 30775 }, { "epoch": 0.83, "learning_rate": 0.00015279653001374794, "loss": 2.855, "step": 30776 }, { "epoch": 0.83, "learning_rate": 0.0001527502920360898, "loss": 2.4514, "step": 30777 }, { "epoch": 0.83, "learning_rate": 0.00015270406047704376, "loss": 3.043, "step": 30778 }, { "epoch": 0.83, "learning_rate": 0.00015265783533696033, "loss": 2.2747, "step": 30779 }, { "epoch": 0.83, "learning_rate": 0.00015261161661618962, "loss": 2.4018, "step": 30780 }, { "epoch": 0.83, "learning_rate": 0.0001525654043150818, "loss": 2.4658, "step": 30781 }, { "epoch": 0.83, "learning_rate": 0.0001525191984339873, "loss": 2.951, "step": 30782 }, { "epoch": 0.83, "learning_rate": 0.0001524729989732555, "loss": 2.2549, "step": 30783 }, { "epoch": 0.83, "learning_rate": 0.00015242680593323678, "loss": 2.4631, "step": 30784 }, { "epoch": 0.83, "learning_rate": 0.00015238061931428104, "loss": 2.3694, "step": 30785 }, { "epoch": 0.83, "learning_rate": 0.00015233443911673818, "loss": 2.4145, "step": 30786 }, { "epoch": 0.83, "learning_rate": 0.00015228826534095818, "loss": 2.4925, "step": 30787 }, { "epoch": 0.83, "learning_rate": 0.00015224209798729061, "loss": 2.515, "step": 30788 }, { "epoch": 0.83, "learning_rate": 0.00015219593705608536, "loss": 2.588, "step": 30789 }, { "epoch": 0.83, "learning_rate": 0.0001521497825476923, "loss": 2.0573, "step": 30790 }, { "epoch": 0.83, "learning_rate": 0.00015210363446246068, "loss": 2.3394, "step": 30791 }, { "epoch": 0.83, "learning_rate": 0.00015205749280074044, "loss": 2.6437, "step": 30792 }, { "epoch": 0.83, "learning_rate": 0.00015201135756288088, "loss": 2.4502, "step": 30793 }, { "epoch": 0.83, "learning_rate": 0.0001519652287492317, "loss": 2.5412, "step": 30794 }, { "epoch": 0.83, "learning_rate": 0.00015191910636014262, "loss": 2.4349, "step": 30795 }, { "epoch": 0.83, "learning_rate": 0.0001518729903959626, "loss": 2.5974, "step": 30796 }, { "epoch": 0.83, "learning_rate": 0.000151826880857041, "loss": 1.9058, "step": 30797 }, { "epoch": 0.83, "learning_rate": 0.00015178077774372745, "loss": 2.1361, "step": 30798 }, { "epoch": 0.83, "learning_rate": 0.00015173468105637102, "loss": 2.6138, "step": 30799 }, { "epoch": 0.83, "learning_rate": 0.00015168859079532092, "loss": 2.2794, "step": 30800 }, { "epoch": 0.83, "learning_rate": 0.00015164250696092675, "loss": 2.6698, "step": 30801 }, { "epoch": 0.83, "learning_rate": 0.00015159642955353702, "loss": 2.6718, "step": 30802 }, { "epoch": 0.83, "learning_rate": 0.0001515503585735013, "loss": 2.3499, "step": 30803 }, { "epoch": 0.83, "learning_rate": 0.00015150429402116807, "loss": 2.2506, "step": 30804 }, { "epoch": 0.83, "learning_rate": 0.00015145823589688667, "loss": 2.6504, "step": 30805 }, { "epoch": 0.83, "learning_rate": 0.0001514121842010059, "loss": 2.5236, "step": 30806 }, { "epoch": 0.83, "learning_rate": 0.00015136613893387474, "loss": 2.3642, "step": 30807 }, { "epoch": 0.83, "learning_rate": 0.00015132010009584208, "loss": 2.9913, "step": 30808 }, { "epoch": 0.83, "learning_rate": 0.00015127406768725683, "loss": 2.8699, "step": 30809 }, { "epoch": 0.83, "learning_rate": 0.00015122804170846716, "loss": 2.6244, "step": 30810 }, { "epoch": 0.83, "learning_rate": 0.00015118202215982213, "loss": 2.4264, "step": 30811 }, { "epoch": 0.83, "learning_rate": 0.00015113600904167036, "loss": 2.6048, "step": 30812 }, { "epoch": 0.83, "learning_rate": 0.00015109000235436043, "loss": 2.7175, "step": 30813 }, { "epoch": 0.83, "learning_rate": 0.0001510440020982412, "loss": 2.9292, "step": 30814 }, { "epoch": 0.83, "learning_rate": 0.0001509980082736605, "loss": 2.3057, "step": 30815 }, { "epoch": 0.83, "learning_rate": 0.00015095202088096705, "loss": 2.5323, "step": 30816 }, { "epoch": 0.83, "learning_rate": 0.00015090603992050966, "loss": 2.4466, "step": 30817 }, { "epoch": 0.83, "learning_rate": 0.00015086006539263597, "loss": 2.1956, "step": 30818 }, { "epoch": 0.83, "learning_rate": 0.00015081409729769435, "loss": 2.3824, "step": 30819 }, { "epoch": 0.83, "learning_rate": 0.00015076813563603386, "loss": 2.4909, "step": 30820 }, { "epoch": 0.83, "learning_rate": 0.0001507221804080019, "loss": 2.8219, "step": 30821 }, { "epoch": 0.83, "learning_rate": 0.00015067623161394716, "loss": 2.2131, "step": 30822 }, { "epoch": 0.83, "learning_rate": 0.00015063028925421705, "loss": 2.6719, "step": 30823 }, { "epoch": 0.83, "learning_rate": 0.00015058435332916009, "loss": 2.363, "step": 30824 }, { "epoch": 0.83, "learning_rate": 0.0001505384238391243, "loss": 2.4434, "step": 30825 }, { "epoch": 0.83, "learning_rate": 0.00015049250078445742, "loss": 2.5741, "step": 30826 }, { "epoch": 0.83, "learning_rate": 0.0001504465841655075, "loss": 2.7538, "step": 30827 }, { "epoch": 0.83, "learning_rate": 0.0001504006739826227, "loss": 2.9307, "step": 30828 }, { "epoch": 0.83, "learning_rate": 0.00015035477023615017, "loss": 2.6092, "step": 30829 }, { "epoch": 0.83, "learning_rate": 0.00015030887292643826, "loss": 2.7105, "step": 30830 }, { "epoch": 0.83, "learning_rate": 0.00015026298205383416, "loss": 2.3067, "step": 30831 }, { "epoch": 0.83, "learning_rate": 0.00015021709761868564, "loss": 2.3336, "step": 30832 }, { "epoch": 0.83, "learning_rate": 0.00015017121962134083, "loss": 2.5031, "step": 30833 }, { "epoch": 0.83, "learning_rate": 0.00015012534806214673, "loss": 2.1555, "step": 30834 }, { "epoch": 0.83, "learning_rate": 0.00015007948294145103, "loss": 2.0835, "step": 30835 }, { "epoch": 0.83, "learning_rate": 0.00015003362425960144, "loss": 2.3801, "step": 30836 }, { "epoch": 0.83, "learning_rate": 0.00014998777201694492, "loss": 2.0726, "step": 30837 }, { "epoch": 0.83, "learning_rate": 0.0001499419262138292, "loss": 2.2877, "step": 30838 }, { "epoch": 0.83, "learning_rate": 0.0001498960868506013, "loss": 2.7208, "step": 30839 }, { "epoch": 0.83, "learning_rate": 0.00014985025392760877, "loss": 2.8244, "step": 30840 }, { "epoch": 0.83, "learning_rate": 0.00014980442744519886, "loss": 2.2858, "step": 30841 }, { "epoch": 0.83, "learning_rate": 0.0001497586074037185, "loss": 2.3274, "step": 30842 }, { "epoch": 0.83, "learning_rate": 0.00014971279380351476, "loss": 2.3524, "step": 30843 }, { "epoch": 0.83, "learning_rate": 0.00014966698664493528, "loss": 2.3047, "step": 30844 }, { "epoch": 0.83, "learning_rate": 0.00014962118592832608, "loss": 2.6652, "step": 30845 }, { "epoch": 0.83, "learning_rate": 0.00014957539165403523, "loss": 2.6537, "step": 30846 }, { "epoch": 0.83, "learning_rate": 0.00014952960382240898, "loss": 3.2267, "step": 30847 }, { "epoch": 0.83, "learning_rate": 0.00014948382243379444, "loss": 2.7345, "step": 30848 }, { "epoch": 0.83, "learning_rate": 0.00014943804748853863, "loss": 2.3136, "step": 30849 }, { "epoch": 0.83, "learning_rate": 0.00014939227898698782, "loss": 2.6883, "step": 30850 }, { "epoch": 0.83, "learning_rate": 0.00014934651692948898, "loss": 2.2874, "step": 30851 }, { "epoch": 0.83, "learning_rate": 0.00014930076131638892, "loss": 1.9517, "step": 30852 }, { "epoch": 0.83, "learning_rate": 0.00014925501214803417, "loss": 1.9952, "step": 30853 }, { "epoch": 0.83, "learning_rate": 0.00014920926942477142, "loss": 2.3285, "step": 30854 }, { "epoch": 0.83, "learning_rate": 0.0001491635331469473, "loss": 2.2274, "step": 30855 }, { "epoch": 0.83, "learning_rate": 0.000149117803314908, "loss": 2.4842, "step": 30856 }, { "epoch": 0.83, "learning_rate": 0.00014907207992900017, "loss": 2.5282, "step": 30857 }, { "epoch": 0.83, "learning_rate": 0.00014902636298956974, "loss": 2.5754, "step": 30858 }, { "epoch": 0.83, "learning_rate": 0.0001489806524969637, "loss": 2.4462, "step": 30859 }, { "epoch": 0.83, "learning_rate": 0.00014893494845152834, "loss": 2.461, "step": 30860 }, { "epoch": 0.83, "learning_rate": 0.00014888925085360937, "loss": 2.5624, "step": 30861 }, { "epoch": 0.83, "learning_rate": 0.00014884355970355335, "loss": 2.6693, "step": 30862 }, { "epoch": 0.83, "learning_rate": 0.0001487978750017065, "loss": 2.9121, "step": 30863 }, { "epoch": 0.83, "learning_rate": 0.00014875219674841456, "loss": 2.5265, "step": 30864 }, { "epoch": 0.83, "learning_rate": 0.00014870652494402382, "loss": 2.4354, "step": 30865 }, { "epoch": 0.83, "learning_rate": 0.0001486608595888802, "loss": 2.3404, "step": 30866 }, { "epoch": 0.83, "learning_rate": 0.00014861520068332968, "loss": 2.2028, "step": 30867 }, { "epoch": 0.83, "learning_rate": 0.00014856954822771852, "loss": 2.2735, "step": 30868 }, { "epoch": 0.83, "learning_rate": 0.00014852390222239186, "loss": 2.3066, "step": 30869 }, { "epoch": 0.83, "learning_rate": 0.00014847826266769604, "loss": 2.2338, "step": 30870 }, { "epoch": 0.83, "learning_rate": 0.00014843262956397663, "loss": 2.7415, "step": 30871 }, { "epoch": 0.83, "learning_rate": 0.00014838700291157925, "loss": 2.5878, "step": 30872 }, { "epoch": 0.83, "learning_rate": 0.00014834138271085007, "loss": 2.7299, "step": 30873 }, { "epoch": 0.83, "learning_rate": 0.00014829576896213404, "loss": 2.0148, "step": 30874 }, { "epoch": 0.83, "learning_rate": 0.00014825016166577698, "loss": 2.3818, "step": 30875 }, { "epoch": 0.83, "learning_rate": 0.00014820456082212464, "loss": 2.6319, "step": 30876 }, { "epoch": 0.83, "learning_rate": 0.00014815896643152193, "loss": 2.5665, "step": 30877 }, { "epoch": 0.83, "learning_rate": 0.00014811337849431449, "loss": 2.1132, "step": 30878 }, { "epoch": 0.83, "learning_rate": 0.00014806779701084826, "loss": 2.5857, "step": 30879 }, { "epoch": 0.83, "learning_rate": 0.00014802222198146786, "loss": 2.5634, "step": 30880 }, { "epoch": 0.83, "learning_rate": 0.00014797665340651888, "loss": 2.4366, "step": 30881 }, { "epoch": 0.83, "learning_rate": 0.00014793109128634642, "loss": 2.574, "step": 30882 }, { "epoch": 0.83, "learning_rate": 0.00014788553562129558, "loss": 2.5411, "step": 30883 }, { "epoch": 0.83, "learning_rate": 0.00014783998641171149, "loss": 2.1299, "step": 30884 }, { "epoch": 0.83, "learning_rate": 0.0001477944436579395, "loss": 2.2721, "step": 30885 }, { "epoch": 0.83, "learning_rate": 0.0001477489073603243, "loss": 3.0893, "step": 30886 }, { "epoch": 0.83, "learning_rate": 0.00014770337751921126, "loss": 2.3434, "step": 30887 }, { "epoch": 0.83, "learning_rate": 0.0001476578541349448, "loss": 2.5838, "step": 30888 }, { "epoch": 0.83, "learning_rate": 0.00014761233720787014, "loss": 2.0769, "step": 30889 }, { "epoch": 0.83, "learning_rate": 0.00014756682673833222, "loss": 2.5898, "step": 30890 }, { "epoch": 0.83, "learning_rate": 0.00014752132272667507, "loss": 2.386, "step": 30891 }, { "epoch": 0.83, "learning_rate": 0.00014747582517324453, "loss": 2.1282, "step": 30892 }, { "epoch": 0.83, "learning_rate": 0.00014743033407838447, "loss": 2.2262, "step": 30893 }, { "epoch": 0.83, "learning_rate": 0.0001473848494424398, "loss": 2.5809, "step": 30894 }, { "epoch": 0.83, "learning_rate": 0.00014733937126575525, "loss": 2.6303, "step": 30895 }, { "epoch": 0.83, "learning_rate": 0.000147293899548675, "loss": 2.3272, "step": 30896 }, { "epoch": 0.83, "learning_rate": 0.00014724843429154367, "loss": 2.588, "step": 30897 }, { "epoch": 0.83, "learning_rate": 0.00014720297549470585, "loss": 2.7607, "step": 30898 }, { "epoch": 0.83, "learning_rate": 0.00014715752315850572, "loss": 2.743, "step": 30899 }, { "epoch": 0.83, "learning_rate": 0.0001471120772832879, "loss": 2.8598, "step": 30900 }, { "epoch": 0.83, "learning_rate": 0.00014706663786939644, "loss": 2.6082, "step": 30901 }, { "epoch": 0.83, "learning_rate": 0.00014702120491717551, "loss": 2.7181, "step": 30902 }, { "epoch": 0.83, "learning_rate": 0.00014697577842696973, "loss": 2.7626, "step": 30903 }, { "epoch": 0.83, "learning_rate": 0.0001469303583991224, "loss": 2.6151, "step": 30904 }, { "epoch": 0.83, "learning_rate": 0.0001468849448339785, "loss": 3.0431, "step": 30905 }, { "epoch": 0.83, "learning_rate": 0.00014683953773188184, "loss": 2.3302, "step": 30906 }, { "epoch": 0.83, "learning_rate": 0.00014679413709317623, "loss": 2.2701, "step": 30907 }, { "epoch": 0.83, "learning_rate": 0.00014674874291820583, "loss": 2.3622, "step": 30908 }, { "epoch": 0.83, "learning_rate": 0.00014670335520731415, "loss": 2.6942, "step": 30909 }, { "epoch": 0.83, "learning_rate": 0.00014665797396084534, "loss": 2.7571, "step": 30910 }, { "epoch": 0.83, "learning_rate": 0.00014661259917914316, "loss": 2.0986, "step": 30911 }, { "epoch": 0.83, "learning_rate": 0.00014656723086255141, "loss": 2.4889, "step": 30912 }, { "epoch": 0.83, "learning_rate": 0.00014652186901141363, "loss": 2.5545, "step": 30913 }, { "epoch": 0.83, "learning_rate": 0.00014647651362607395, "loss": 2.9341, "step": 30914 }, { "epoch": 0.83, "learning_rate": 0.00014643116470687524, "loss": 2.1183, "step": 30915 }, { "epoch": 0.83, "learning_rate": 0.00014638582225416175, "loss": 2.6504, "step": 30916 }, { "epoch": 0.83, "learning_rate": 0.00014634048626827612, "loss": 2.2638, "step": 30917 }, { "epoch": 0.83, "learning_rate": 0.0001462951567495626, "loss": 2.4561, "step": 30918 }, { "epoch": 0.83, "learning_rate": 0.00014624983369836465, "loss": 2.3029, "step": 30919 }, { "epoch": 0.83, "learning_rate": 0.00014620451711502502, "loss": 2.3125, "step": 30920 }, { "epoch": 0.83, "learning_rate": 0.00014615920699988726, "loss": 2.803, "step": 30921 }, { "epoch": 0.83, "learning_rate": 0.0001461139033532951, "loss": 2.4602, "step": 30922 }, { "epoch": 0.83, "learning_rate": 0.00014606860617559094, "loss": 2.6228, "step": 30923 }, { "epoch": 0.83, "learning_rate": 0.00014602331546711845, "loss": 2.2562, "step": 30924 }, { "epoch": 0.83, "learning_rate": 0.00014597803122822062, "loss": 2.4844, "step": 30925 }, { "epoch": 0.83, "learning_rate": 0.0001459327534592405, "loss": 2.6055, "step": 30926 }, { "epoch": 0.83, "learning_rate": 0.0001458874821605215, "loss": 2.443, "step": 30927 }, { "epoch": 0.83, "learning_rate": 0.00014584221733240587, "loss": 2.7623, "step": 30928 }, { "epoch": 0.83, "learning_rate": 0.00014579695897523704, "loss": 2.944, "step": 30929 }, { "epoch": 0.83, "learning_rate": 0.0001457517070893576, "loss": 2.5915, "step": 30930 }, { "epoch": 0.83, "learning_rate": 0.00014570646167511047, "loss": 2.8479, "step": 30931 }, { "epoch": 0.83, "learning_rate": 0.00014566122273283855, "loss": 2.2418, "step": 30932 }, { "epoch": 0.83, "learning_rate": 0.00014561599026288475, "loss": 2.3596, "step": 30933 }, { "epoch": 0.83, "learning_rate": 0.00014557076426559114, "loss": 2.5386, "step": 30934 }, { "epoch": 0.83, "learning_rate": 0.00014552554474130087, "loss": 2.4729, "step": 30935 }, { "epoch": 0.83, "learning_rate": 0.00014548033169035614, "loss": 2.1938, "step": 30936 }, { "epoch": 0.83, "learning_rate": 0.00014543512511309953, "loss": 2.6168, "step": 30937 }, { "epoch": 0.83, "learning_rate": 0.0001453899250098738, "loss": 2.4166, "step": 30938 }, { "epoch": 0.83, "learning_rate": 0.00014534473138102112, "loss": 2.7544, "step": 30939 }, { "epoch": 0.83, "learning_rate": 0.00014529954422688396, "loss": 2.4004, "step": 30940 }, { "epoch": 0.83, "learning_rate": 0.00014525436354780486, "loss": 2.315, "step": 30941 }, { "epoch": 0.83, "learning_rate": 0.00014520918934412565, "loss": 2.2038, "step": 30942 }, { "epoch": 0.83, "learning_rate": 0.0001451640216161888, "loss": 2.5719, "step": 30943 }, { "epoch": 0.83, "learning_rate": 0.0001451188603643365, "loss": 2.4172, "step": 30944 }, { "epoch": 0.83, "learning_rate": 0.00014507370558891088, "loss": 2.3031, "step": 30945 }, { "epoch": 0.83, "learning_rate": 0.00014502855729025432, "loss": 2.4073, "step": 30946 }, { "epoch": 0.83, "learning_rate": 0.0001449834154687082, "loss": 2.1066, "step": 30947 }, { "epoch": 0.83, "learning_rate": 0.00014493828012461497, "loss": 2.3966, "step": 30948 }, { "epoch": 0.83, "learning_rate": 0.00014489315125831658, "loss": 2.4862, "step": 30949 }, { "epoch": 0.83, "learning_rate": 0.00014484802887015469, "loss": 2.3964, "step": 30950 }, { "epoch": 0.83, "learning_rate": 0.00014480291296047122, "loss": 2.6478, "step": 30951 }, { "epoch": 0.83, "learning_rate": 0.0001447578035296079, "loss": 2.2285, "step": 30952 }, { "epoch": 0.83, "learning_rate": 0.00014471270057790663, "loss": 2.552, "step": 30953 }, { "epoch": 0.83, "learning_rate": 0.00014466760410570924, "loss": 2.7582, "step": 30954 }, { "epoch": 0.83, "learning_rate": 0.0001446225141133569, "loss": 2.0036, "step": 30955 }, { "epoch": 0.83, "learning_rate": 0.00014457743060119154, "loss": 2.699, "step": 30956 }, { "epoch": 0.83, "learning_rate": 0.00014453235356955463, "loss": 2.1682, "step": 30957 }, { "epoch": 0.83, "learning_rate": 0.00014448728301878755, "loss": 2.5579, "step": 30958 }, { "epoch": 0.83, "learning_rate": 0.00014444221894923214, "loss": 2.4621, "step": 30959 }, { "epoch": 0.83, "learning_rate": 0.00014439716136122938, "loss": 2.1901, "step": 30960 }, { "epoch": 0.83, "learning_rate": 0.00014435211025512075, "loss": 2.2646, "step": 30961 }, { "epoch": 0.83, "learning_rate": 0.00014430706563124763, "loss": 2.4051, "step": 30962 }, { "epoch": 0.83, "learning_rate": 0.0001442620274899511, "loss": 2.732, "step": 30963 }, { "epoch": 0.83, "learning_rate": 0.00014421699583157222, "loss": 2.5111, "step": 30964 }, { "epoch": 0.83, "learning_rate": 0.00014417197065645282, "loss": 2.2843, "step": 30965 }, { "epoch": 0.83, "learning_rate": 0.0001441269519649333, "loss": 1.8164, "step": 30966 }, { "epoch": 0.83, "learning_rate": 0.00014408193975735506, "loss": 2.8478, "step": 30967 }, { "epoch": 0.83, "learning_rate": 0.00014403693403405916, "loss": 2.7914, "step": 30968 }, { "epoch": 0.83, "learning_rate": 0.0001439919347953862, "loss": 2.2959, "step": 30969 }, { "epoch": 0.83, "learning_rate": 0.00014394694204167735, "loss": 3.1268, "step": 30970 }, { "epoch": 0.83, "learning_rate": 0.00014390195577327337, "loss": 2.6198, "step": 30971 }, { "epoch": 0.83, "learning_rate": 0.00014385697599051517, "loss": 2.3649, "step": 30972 }, { "epoch": 0.83, "learning_rate": 0.0001438120026937436, "loss": 3.3294, "step": 30973 }, { "epoch": 0.83, "learning_rate": 0.0001437670358832991, "loss": 2.2012, "step": 30974 }, { "epoch": 0.83, "learning_rate": 0.00014372207555952244, "loss": 2.4087, "step": 30975 }, { "epoch": 0.83, "learning_rate": 0.00014367712172275437, "loss": 2.6649, "step": 30976 }, { "epoch": 0.83, "learning_rate": 0.00014363217437333498, "loss": 2.1515, "step": 30977 }, { "epoch": 0.83, "learning_rate": 0.00014358723351160562, "loss": 2.4487, "step": 30978 }, { "epoch": 0.83, "learning_rate": 0.00014354229913790596, "loss": 2.6154, "step": 30979 }, { "epoch": 0.83, "learning_rate": 0.00014349737125257667, "loss": 2.4938, "step": 30980 }, { "epoch": 0.83, "learning_rate": 0.00014345244985595852, "loss": 2.5539, "step": 30981 }, { "epoch": 0.83, "learning_rate": 0.0001434075349483912, "loss": 2.1105, "step": 30982 }, { "epoch": 0.83, "learning_rate": 0.00014336262653021526, "loss": 2.8485, "step": 30983 }, { "epoch": 0.83, "learning_rate": 0.00014331772460177085, "loss": 2.4994, "step": 30984 }, { "epoch": 0.83, "learning_rate": 0.00014327282916339824, "loss": 2.549, "step": 30985 }, { "epoch": 0.83, "learning_rate": 0.00014322794021543774, "loss": 2.4515, "step": 30986 }, { "epoch": 0.83, "learning_rate": 0.00014318305775822893, "loss": 2.3354, "step": 30987 }, { "epoch": 0.83, "learning_rate": 0.00014313818179211214, "loss": 2.8916, "step": 30988 }, { "epoch": 0.83, "learning_rate": 0.00014309331231742752, "loss": 2.275, "step": 30989 }, { "epoch": 0.83, "learning_rate": 0.0001430484493345142, "loss": 2.2571, "step": 30990 }, { "epoch": 0.83, "learning_rate": 0.000143003592843713, "loss": 2.145, "step": 30991 }, { "epoch": 0.83, "learning_rate": 0.00014295874284536348, "loss": 2.7698, "step": 30992 }, { "epoch": 0.83, "learning_rate": 0.00014291389933980515, "loss": 2.5798, "step": 30993 }, { "epoch": 0.83, "learning_rate": 0.00014286906232737807, "loss": 2.2451, "step": 30994 }, { "epoch": 0.83, "learning_rate": 0.00014282423180842152, "loss": 2.3566, "step": 30995 }, { "epoch": 0.83, "learning_rate": 0.00014277940778327535, "loss": 2.482, "step": 30996 }, { "epoch": 0.83, "learning_rate": 0.0001427345902522791, "loss": 1.9165, "step": 30997 }, { "epoch": 0.83, "learning_rate": 0.0001426897792157723, "loss": 2.4423, "step": 30998 }, { "epoch": 0.83, "learning_rate": 0.00014264497467409454, "loss": 2.4507, "step": 30999 }, { "epoch": 0.83, "learning_rate": 0.00014260017662758528, "loss": 2.639, "step": 31000 }, { "epoch": 0.83, "learning_rate": 0.00014255538507658373, "loss": 1.98, "step": 31001 }, { "epoch": 0.83, "learning_rate": 0.00014251060002142912, "loss": 2.1977, "step": 31002 }, { "epoch": 0.83, "learning_rate": 0.000142465821462461, "loss": 2.6869, "step": 31003 }, { "epoch": 0.83, "learning_rate": 0.00014242104940001855, "loss": 2.7166, "step": 31004 }, { "epoch": 0.83, "learning_rate": 0.00014237628383444102, "loss": 2.6509, "step": 31005 }, { "epoch": 0.83, "learning_rate": 0.00014233152476606726, "loss": 2.5294, "step": 31006 }, { "epoch": 0.83, "learning_rate": 0.00014228677219523656, "loss": 2.3423, "step": 31007 }, { "epoch": 0.83, "learning_rate": 0.0001422420261222881, "loss": 2.5342, "step": 31008 }, { "epoch": 0.83, "learning_rate": 0.00014219728654756047, "loss": 2.2452, "step": 31009 }, { "epoch": 0.83, "learning_rate": 0.0001421525534713929, "loss": 2.2875, "step": 31010 }, { "epoch": 0.83, "learning_rate": 0.00014210782689412415, "loss": 2.4273, "step": 31011 }, { "epoch": 0.83, "learning_rate": 0.00014206310681609324, "loss": 2.4704, "step": 31012 }, { "epoch": 0.83, "learning_rate": 0.00014201839323763898, "loss": 2.3964, "step": 31013 }, { "epoch": 0.83, "learning_rate": 0.00014197368615909977, "loss": 2.8694, "step": 31014 }, { "epoch": 0.83, "learning_rate": 0.00014192898558081446, "loss": 2.564, "step": 31015 }, { "epoch": 0.83, "learning_rate": 0.00014188429150312177, "loss": 2.3655, "step": 31016 }, { "epoch": 0.83, "learning_rate": 0.0001418396039263603, "loss": 2.403, "step": 31017 }, { "epoch": 0.83, "learning_rate": 0.0001417949228508686, "loss": 2.2972, "step": 31018 }, { "epoch": 0.83, "learning_rate": 0.00014175024827698535, "loss": 2.2114, "step": 31019 }, { "epoch": 0.83, "learning_rate": 0.00014170558020504853, "loss": 2.2521, "step": 31020 }, { "epoch": 0.83, "learning_rate": 0.000141660918635397, "loss": 2.1561, "step": 31021 }, { "epoch": 0.83, "learning_rate": 0.00014161626356836866, "loss": 2.3529, "step": 31022 }, { "epoch": 0.83, "learning_rate": 0.00014157161500430205, "loss": 2.4367, "step": 31023 }, { "epoch": 0.83, "learning_rate": 0.00014152697294353544, "loss": 2.8045, "step": 31024 }, { "epoch": 0.83, "learning_rate": 0.0001414823373864069, "loss": 2.4416, "step": 31025 }, { "epoch": 0.83, "learning_rate": 0.00014143770833325474, "loss": 2.6665, "step": 31026 }, { "epoch": 0.83, "learning_rate": 0.00014139308578441735, "loss": 2.6078, "step": 31027 }, { "epoch": 0.83, "learning_rate": 0.00014134846974023208, "loss": 2.5659, "step": 31028 }, { "epoch": 0.83, "learning_rate": 0.00014130386020103737, "loss": 2.409, "step": 31029 }, { "epoch": 0.83, "learning_rate": 0.00014125925716717102, "loss": 2.633, "step": 31030 }, { "epoch": 0.83, "learning_rate": 0.00014121466063897104, "loss": 2.5279, "step": 31031 }, { "epoch": 0.83, "learning_rate": 0.00014117007061677545, "loss": 2.5238, "step": 31032 }, { "epoch": 0.83, "learning_rate": 0.00014112548710092167, "loss": 2.6011, "step": 31033 }, { "epoch": 0.83, "learning_rate": 0.00014108091009174762, "loss": 2.3395, "step": 31034 }, { "epoch": 0.83, "learning_rate": 0.00014103633958959127, "loss": 2.0483, "step": 31035 }, { "epoch": 0.83, "learning_rate": 0.0001409917755947897, "loss": 2.5572, "step": 31036 }, { "epoch": 0.83, "learning_rate": 0.00014094721810768097, "loss": 2.3925, "step": 31037 }, { "epoch": 0.83, "learning_rate": 0.00014090266712860278, "loss": 2.3358, "step": 31038 }, { "epoch": 0.83, "learning_rate": 0.00014085812265789212, "loss": 2.5103, "step": 31039 }, { "epoch": 0.83, "learning_rate": 0.000140813584695887, "loss": 1.9529, "step": 31040 }, { "epoch": 0.83, "learning_rate": 0.00014076905324292432, "loss": 2.5402, "step": 31041 }, { "epoch": 0.83, "learning_rate": 0.00014072452829934167, "loss": 2.8112, "step": 31042 }, { "epoch": 0.83, "learning_rate": 0.00014068000986547634, "loss": 2.6701, "step": 31043 }, { "epoch": 0.83, "learning_rate": 0.00014063549794166575, "loss": 2.4131, "step": 31044 }, { "epoch": 0.83, "learning_rate": 0.0001405909925282469, "loss": 2.7733, "step": 31045 }, { "epoch": 0.83, "learning_rate": 0.00014054649362555728, "loss": 2.3308, "step": 31046 }, { "epoch": 0.83, "learning_rate": 0.00014050200123393353, "loss": 2.2857, "step": 31047 }, { "epoch": 0.83, "learning_rate": 0.0001404575153537131, "loss": 2.6444, "step": 31048 }, { "epoch": 0.83, "learning_rate": 0.00014041303598523247, "loss": 2.778, "step": 31049 }, { "epoch": 0.83, "learning_rate": 0.00014036856312882927, "loss": 2.621, "step": 31050 }, { "epoch": 0.83, "learning_rate": 0.00014032409678484036, "loss": 2.6333, "step": 31051 }, { "epoch": 0.83, "learning_rate": 0.00014027963695360213, "loss": 2.7325, "step": 31052 }, { "epoch": 0.83, "learning_rate": 0.00014023518363545174, "loss": 2.8806, "step": 31053 }, { "epoch": 0.83, "learning_rate": 0.00014019073683072602, "loss": 2.5026, "step": 31054 }, { "epoch": 0.83, "learning_rate": 0.0001401462965397614, "loss": 2.1961, "step": 31055 }, { "epoch": 0.83, "learning_rate": 0.00014010186276289472, "loss": 2.1232, "step": 31056 }, { "epoch": 0.83, "learning_rate": 0.00014005743550046256, "loss": 2.2247, "step": 31057 }, { "epoch": 0.83, "learning_rate": 0.0001400130147528016, "loss": 2.4053, "step": 31058 }, { "epoch": 0.83, "learning_rate": 0.0001399686005202484, "loss": 2.6345, "step": 31059 }, { "epoch": 0.83, "learning_rate": 0.00013992419280313916, "loss": 2.5087, "step": 31060 }, { "epoch": 0.83, "learning_rate": 0.00013987979160181042, "loss": 1.8234, "step": 31061 }, { "epoch": 0.83, "learning_rate": 0.00013983539691659865, "loss": 2.7415, "step": 31062 }, { "epoch": 0.83, "learning_rate": 0.00013979100874784013, "loss": 2.3687, "step": 31063 }, { "epoch": 0.83, "learning_rate": 0.00013974662709587138, "loss": 2.2773, "step": 31064 }, { "epoch": 0.83, "learning_rate": 0.00013970225196102804, "loss": 3.0726, "step": 31065 }, { "epoch": 0.83, "learning_rate": 0.00013965788334364672, "loss": 2.5592, "step": 31066 }, { "epoch": 0.83, "learning_rate": 0.0001396135212440637, "loss": 2.3308, "step": 31067 }, { "epoch": 0.83, "learning_rate": 0.00013956916566261457, "loss": 2.6977, "step": 31068 }, { "epoch": 0.83, "learning_rate": 0.00013952481659963568, "loss": 2.8217, "step": 31069 }, { "epoch": 0.83, "learning_rate": 0.0001394804740554628, "loss": 2.6864, "step": 31070 }, { "epoch": 0.83, "learning_rate": 0.00013943613803043208, "loss": 2.3738, "step": 31071 }, { "epoch": 0.84, "learning_rate": 0.00013939180852487942, "loss": 2.3733, "step": 31072 }, { "epoch": 0.84, "learning_rate": 0.00013934748553914066, "loss": 2.5164, "step": 31073 }, { "epoch": 0.84, "learning_rate": 0.00013930316907355124, "loss": 2.602, "step": 31074 }, { "epoch": 0.84, "learning_rate": 0.00013925885912844716, "loss": 2.6128, "step": 31075 }, { "epoch": 0.84, "learning_rate": 0.00013921455570416408, "loss": 2.4115, "step": 31076 }, { "epoch": 0.84, "learning_rate": 0.00013917025880103774, "loss": 2.1837, "step": 31077 }, { "epoch": 0.84, "learning_rate": 0.00013912596841940373, "loss": 2.3056, "step": 31078 }, { "epoch": 0.84, "learning_rate": 0.00013908168455959723, "loss": 2.4875, "step": 31079 }, { "epoch": 0.84, "learning_rate": 0.00013903740722195402, "loss": 2.2052, "step": 31080 }, { "epoch": 0.84, "learning_rate": 0.00013899313640680966, "loss": 2.4541, "step": 31081 }, { "epoch": 0.84, "learning_rate": 0.00013894887211449925, "loss": 2.7083, "step": 31082 }, { "epoch": 0.84, "learning_rate": 0.00013890461434535817, "loss": 3.1053, "step": 31083 }, { "epoch": 0.84, "learning_rate": 0.0001388603630997217, "loss": 2.8031, "step": 31084 }, { "epoch": 0.84, "learning_rate": 0.0001388161183779253, "loss": 2.3049, "step": 31085 }, { "epoch": 0.84, "learning_rate": 0.00013877188018030417, "loss": 2.3988, "step": 31086 }, { "epoch": 0.84, "learning_rate": 0.0001387276485071931, "loss": 2.719, "step": 31087 }, { "epoch": 0.84, "learning_rate": 0.00013868342335892736, "loss": 2.4544, "step": 31088 }, { "epoch": 0.84, "learning_rate": 0.00013863920473584213, "loss": 2.194, "step": 31089 }, { "epoch": 0.84, "learning_rate": 0.00013859499263827214, "loss": 2.8247, "step": 31090 }, { "epoch": 0.84, "learning_rate": 0.00013855078706655278, "loss": 2.1353, "step": 31091 }, { "epoch": 0.84, "learning_rate": 0.00013850658802101834, "loss": 2.1826, "step": 31092 }, { "epoch": 0.84, "learning_rate": 0.00013846239550200412, "loss": 2.4436, "step": 31093 }, { "epoch": 0.84, "learning_rate": 0.00013841820950984485, "loss": 2.6761, "step": 31094 }, { "epoch": 0.84, "learning_rate": 0.00013837403004487504, "loss": 2.0159, "step": 31095 }, { "epoch": 0.84, "learning_rate": 0.0001383298571074293, "loss": 2.3269, "step": 31096 }, { "epoch": 0.84, "learning_rate": 0.00013828569069784292, "loss": 2.3277, "step": 31097 }, { "epoch": 0.84, "learning_rate": 0.00013824153081644984, "loss": 2.2339, "step": 31098 }, { "epoch": 0.84, "learning_rate": 0.0001381973774635852, "loss": 2.6974, "step": 31099 }, { "epoch": 0.84, "learning_rate": 0.00013815323063958286, "loss": 1.9954, "step": 31100 }, { "epoch": 0.84, "learning_rate": 0.00013810909034477748, "loss": 2.1874, "step": 31101 }, { "epoch": 0.84, "learning_rate": 0.00013806495657950357, "loss": 2.4263, "step": 31102 }, { "epoch": 0.84, "learning_rate": 0.00013802082934409555, "loss": 2.6461, "step": 31103 }, { "epoch": 0.84, "learning_rate": 0.00013797670863888756, "loss": 2.7543, "step": 31104 }, { "epoch": 0.84, "learning_rate": 0.00013793259446421413, "loss": 2.6491, "step": 31105 }, { "epoch": 0.84, "learning_rate": 0.000137888486820409, "loss": 2.6896, "step": 31106 }, { "epoch": 0.84, "learning_rate": 0.0001378443857078069, "loss": 2.3995, "step": 31107 }, { "epoch": 0.84, "learning_rate": 0.0001378002911267412, "loss": 2.7761, "step": 31108 }, { "epoch": 0.84, "learning_rate": 0.0001377562030775462, "loss": 2.2927, "step": 31109 }, { "epoch": 0.84, "learning_rate": 0.00013771212156055658, "loss": 2.814, "step": 31110 }, { "epoch": 0.84, "learning_rate": 0.00013766804657610544, "loss": 2.4726, "step": 31111 }, { "epoch": 0.84, "learning_rate": 0.00013762397812452698, "loss": 2.9056, "step": 31112 }, { "epoch": 0.84, "learning_rate": 0.0001375799162061554, "loss": 2.7066, "step": 31113 }, { "epoch": 0.84, "learning_rate": 0.00013753586082132385, "loss": 2.7919, "step": 31114 }, { "epoch": 0.84, "learning_rate": 0.00013749181197036654, "loss": 2.6937, "step": 31115 }, { "epoch": 0.84, "learning_rate": 0.00013744776965361706, "loss": 2.3334, "step": 31116 }, { "epoch": 0.84, "learning_rate": 0.00013740373387140903, "loss": 2.4008, "step": 31117 }, { "epoch": 0.84, "learning_rate": 0.00013735970462407633, "loss": 2.2941, "step": 31118 }, { "epoch": 0.84, "learning_rate": 0.00013731568191195198, "loss": 2.1255, "step": 31119 }, { "epoch": 0.84, "learning_rate": 0.00013727166573536986, "loss": 2.2573, "step": 31120 }, { "epoch": 0.84, "learning_rate": 0.0001372276560946636, "loss": 2.5737, "step": 31121 }, { "epoch": 0.84, "learning_rate": 0.00013718365299016588, "loss": 2.139, "step": 31122 }, { "epoch": 0.84, "learning_rate": 0.0001371396564222107, "loss": 2.3387, "step": 31123 }, { "epoch": 0.84, "learning_rate": 0.00013709566639113157, "loss": 2.6842, "step": 31124 }, { "epoch": 0.84, "learning_rate": 0.0001370516828972611, "loss": 2.0052, "step": 31125 }, { "epoch": 0.84, "learning_rate": 0.00013700770594093315, "loss": 1.9266, "step": 31126 }, { "epoch": 0.84, "learning_rate": 0.0001369637355224802, "loss": 2.5577, "step": 31127 }, { "epoch": 0.84, "learning_rate": 0.00013691977164223567, "loss": 2.6996, "step": 31128 }, { "epoch": 0.84, "learning_rate": 0.00013687581430053274, "loss": 2.5999, "step": 31129 }, { "epoch": 0.84, "learning_rate": 0.00013683186349770427, "loss": 2.4499, "step": 31130 }, { "epoch": 0.84, "learning_rate": 0.00013678791923408328, "loss": 2.9036, "step": 31131 }, { "epoch": 0.84, "learning_rate": 0.0001367439815100029, "loss": 1.9407, "step": 31132 }, { "epoch": 0.84, "learning_rate": 0.00013670005032579558, "loss": 2.5373, "step": 31133 }, { "epoch": 0.84, "learning_rate": 0.00013665612568179454, "loss": 2.4748, "step": 31134 }, { "epoch": 0.84, "learning_rate": 0.00013661220757833192, "loss": 2.472, "step": 31135 }, { "epoch": 0.84, "learning_rate": 0.00013656829601574105, "loss": 1.9257, "step": 31136 }, { "epoch": 0.84, "learning_rate": 0.00013652439099435466, "loss": 2.761, "step": 31137 }, { "epoch": 0.84, "learning_rate": 0.0001364804925145048, "loss": 2.6343, "step": 31138 }, { "epoch": 0.84, "learning_rate": 0.00013643660057652442, "loss": 2.4392, "step": 31139 }, { "epoch": 0.84, "learning_rate": 0.00013639271518074613, "loss": 2.3365, "step": 31140 }, { "epoch": 0.84, "learning_rate": 0.00013634883632750205, "loss": 2.4824, "step": 31141 }, { "epoch": 0.84, "learning_rate": 0.00013630496401712488, "loss": 2.0971, "step": 31142 }, { "epoch": 0.84, "learning_rate": 0.00013626109824994671, "loss": 2.3914, "step": 31143 }, { "epoch": 0.84, "learning_rate": 0.0001362172390263001, "loss": 2.5446, "step": 31144 }, { "epoch": 0.84, "learning_rate": 0.00013617338634651753, "loss": 2.1431, "step": 31145 }, { "epoch": 0.84, "learning_rate": 0.0001361295402109307, "loss": 2.5113, "step": 31146 }, { "epoch": 0.84, "learning_rate": 0.00013608570061987202, "loss": 1.7286, "step": 31147 }, { "epoch": 0.84, "learning_rate": 0.00013604186757367365, "loss": 2.4592, "step": 31148 }, { "epoch": 0.84, "learning_rate": 0.00013599804107266756, "loss": 2.4667, "step": 31149 }, { "epoch": 0.84, "learning_rate": 0.00013595422111718593, "loss": 2.3301, "step": 31150 }, { "epoch": 0.84, "learning_rate": 0.0001359104077075608, "loss": 2.584, "step": 31151 }, { "epoch": 0.84, "learning_rate": 0.00013586660084412373, "loss": 2.188, "step": 31152 }, { "epoch": 0.84, "learning_rate": 0.0001358228005272071, "loss": 2.5068, "step": 31153 }, { "epoch": 0.84, "learning_rate": 0.00013577900675714206, "loss": 2.9137, "step": 31154 }, { "epoch": 0.84, "learning_rate": 0.00013573521953426083, "loss": 2.0584, "step": 31155 }, { "epoch": 0.84, "learning_rate": 0.00013569143885889512, "loss": 2.1833, "step": 31156 }, { "epoch": 0.84, "learning_rate": 0.00013564766473137647, "loss": 2.1256, "step": 31157 }, { "epoch": 0.84, "learning_rate": 0.0001356038971520366, "loss": 2.2384, "step": 31158 }, { "epoch": 0.84, "learning_rate": 0.00013556013612120722, "loss": 2.5749, "step": 31159 }, { "epoch": 0.84, "learning_rate": 0.00013551638163921965, "loss": 2.7535, "step": 31160 }, { "epoch": 0.84, "learning_rate": 0.00013547263370640528, "loss": 2.4051, "step": 31161 }, { "epoch": 0.84, "learning_rate": 0.00013542889232309564, "loss": 2.6468, "step": 31162 }, { "epoch": 0.84, "learning_rate": 0.00013538515748962222, "loss": 2.659, "step": 31163 }, { "epoch": 0.84, "learning_rate": 0.00013534142920631654, "loss": 2.374, "step": 31164 }, { "epoch": 0.84, "learning_rate": 0.00013529770747350934, "loss": 1.9346, "step": 31165 }, { "epoch": 0.84, "learning_rate": 0.000135253992291532, "loss": 2.6996, "step": 31166 }, { "epoch": 0.84, "learning_rate": 0.0001352102836607162, "loss": 2.4974, "step": 31167 }, { "epoch": 0.84, "learning_rate": 0.00013516658158139238, "loss": 2.6173, "step": 31168 }, { "epoch": 0.84, "learning_rate": 0.0001351228860538919, "loss": 2.3083, "step": 31169 }, { "epoch": 0.84, "learning_rate": 0.0001350791970785459, "loss": 2.1748, "step": 31170 }, { "epoch": 0.84, "learning_rate": 0.00013503551465568519, "loss": 2.6697, "step": 31171 }, { "epoch": 0.84, "learning_rate": 0.00013499183878564104, "loss": 2.2649, "step": 31172 }, { "epoch": 0.84, "learning_rate": 0.00013494816946874378, "loss": 2.483, "step": 31173 }, { "epoch": 0.84, "learning_rate": 0.00013490450670532463, "loss": 2.1736, "step": 31174 }, { "epoch": 0.84, "learning_rate": 0.00013486085049571416, "loss": 2.7056, "step": 31175 }, { "epoch": 0.84, "learning_rate": 0.0001348172008402433, "loss": 2.6872, "step": 31176 }, { "epoch": 0.84, "learning_rate": 0.00013477355773924282, "loss": 2.0317, "step": 31177 }, { "epoch": 0.84, "learning_rate": 0.00013472992119304295, "loss": 2.6691, "step": 31178 }, { "epoch": 0.84, "learning_rate": 0.0001346862912019746, "loss": 2.1733, "step": 31179 }, { "epoch": 0.84, "learning_rate": 0.00013464266776636835, "loss": 2.5765, "step": 31180 }, { "epoch": 0.84, "learning_rate": 0.00013459905088655433, "loss": 2.2722, "step": 31181 }, { "epoch": 0.84, "learning_rate": 0.00013455544056286295, "loss": 2.5999, "step": 31182 }, { "epoch": 0.84, "learning_rate": 0.00013451183679562528, "loss": 2.6782, "step": 31183 }, { "epoch": 0.84, "learning_rate": 0.00013446823958517096, "loss": 2.8145, "step": 31184 }, { "epoch": 0.84, "learning_rate": 0.00013442464893183048, "loss": 2.3446, "step": 31185 }, { "epoch": 0.84, "learning_rate": 0.00013438106483593438, "loss": 2.9527, "step": 31186 }, { "epoch": 0.84, "learning_rate": 0.00013433748729781237, "loss": 2.402, "step": 31187 }, { "epoch": 0.84, "learning_rate": 0.00013429391631779476, "loss": 2.4371, "step": 31188 }, { "epoch": 0.84, "learning_rate": 0.0001342503518962117, "loss": 2.5292, "step": 31189 }, { "epoch": 0.84, "learning_rate": 0.0001342067940333932, "loss": 2.2275, "step": 31190 }, { "epoch": 0.84, "learning_rate": 0.0001341632427296694, "loss": 2.0897, "step": 31191 }, { "epoch": 0.84, "learning_rate": 0.00013411969798536995, "loss": 2.6377, "step": 31192 }, { "epoch": 0.84, "learning_rate": 0.00013407615980082476, "loss": 2.3033, "step": 31193 }, { "epoch": 0.84, "learning_rate": 0.00013403262817636397, "loss": 2.464, "step": 31194 }, { "epoch": 0.84, "learning_rate": 0.00013398910311231683, "loss": 2.9437, "step": 31195 }, { "epoch": 0.84, "learning_rate": 0.00013394558460901385, "loss": 2.726, "step": 31196 }, { "epoch": 0.84, "learning_rate": 0.000133902072666784, "loss": 2.0757, "step": 31197 }, { "epoch": 0.84, "learning_rate": 0.00013385856728595724, "loss": 2.3616, "step": 31198 }, { "epoch": 0.84, "learning_rate": 0.0001338150684668633, "loss": 2.6262, "step": 31199 }, { "epoch": 0.84, "learning_rate": 0.00013377157620983137, "loss": 2.2181, "step": 31200 }, { "epoch": 0.84, "learning_rate": 0.00013372809051519108, "loss": 2.8986, "step": 31201 }, { "epoch": 0.84, "learning_rate": 0.00013368461138327193, "loss": 2.8131, "step": 31202 }, { "epoch": 0.84, "learning_rate": 0.0001336411388144032, "loss": 2.5419, "step": 31203 }, { "epoch": 0.84, "learning_rate": 0.00013359767280891465, "loss": 2.8657, "step": 31204 }, { "epoch": 0.84, "learning_rate": 0.00013355421336713502, "loss": 2.6131, "step": 31205 }, { "epoch": 0.84, "learning_rate": 0.0001335107604893937, "loss": 2.5836, "step": 31206 }, { "epoch": 0.84, "learning_rate": 0.00013346731417601988, "loss": 2.2819, "step": 31207 }, { "epoch": 0.84, "learning_rate": 0.00013342387442734282, "loss": 1.9068, "step": 31208 }, { "epoch": 0.84, "learning_rate": 0.00013338044124369165, "loss": 2.506, "step": 31209 }, { "epoch": 0.84, "learning_rate": 0.0001333370146253955, "loss": 2.7703, "step": 31210 }, { "epoch": 0.84, "learning_rate": 0.0001332935945727829, "loss": 2.68, "step": 31211 }, { "epoch": 0.84, "learning_rate": 0.00013325018108618336, "loss": 2.5883, "step": 31212 }, { "epoch": 0.84, "learning_rate": 0.00013320677416592518, "loss": 2.2999, "step": 31213 }, { "epoch": 0.84, "learning_rate": 0.00013316337381233756, "loss": 2.7542, "step": 31214 }, { "epoch": 0.84, "learning_rate": 0.0001331199800257492, "loss": 2.5004, "step": 31215 }, { "epoch": 0.84, "learning_rate": 0.000133076592806489, "loss": 2.7669, "step": 31216 }, { "epoch": 0.84, "learning_rate": 0.0001330332121548855, "loss": 2.7611, "step": 31217 }, { "epoch": 0.84, "learning_rate": 0.00013298983807126752, "loss": 2.5974, "step": 31218 }, { "epoch": 0.84, "learning_rate": 0.00013294647055596344, "loss": 2.7279, "step": 31219 }, { "epoch": 0.84, "learning_rate": 0.00013290310960930175, "loss": 2.5474, "step": 31220 }, { "epoch": 0.84, "learning_rate": 0.0001328597552316111, "loss": 2.1313, "step": 31221 }, { "epoch": 0.84, "learning_rate": 0.00013281640742321998, "loss": 2.6843, "step": 31222 }, { "epoch": 0.84, "learning_rate": 0.00013277306618445696, "loss": 1.9942, "step": 31223 }, { "epoch": 0.84, "learning_rate": 0.0001327297315156498, "loss": 2.2237, "step": 31224 }, { "epoch": 0.84, "learning_rate": 0.00013268640341712723, "loss": 2.4808, "step": 31225 }, { "epoch": 0.84, "learning_rate": 0.0001326430818892176, "loss": 2.2169, "step": 31226 }, { "epoch": 0.84, "learning_rate": 0.00013259976693224873, "loss": 2.3917, "step": 31227 }, { "epoch": 0.84, "learning_rate": 0.00013255645854654875, "loss": 2.613, "step": 31228 }, { "epoch": 0.84, "learning_rate": 0.00013251315673244634, "loss": 2.1417, "step": 31229 }, { "epoch": 0.84, "learning_rate": 0.00013246986149026896, "loss": 2.7507, "step": 31230 }, { "epoch": 0.84, "learning_rate": 0.00013242657282034497, "loss": 2.5987, "step": 31231 }, { "epoch": 0.84, "learning_rate": 0.00013238329072300204, "loss": 2.041, "step": 31232 }, { "epoch": 0.84, "learning_rate": 0.0001323400151985681, "loss": 2.3533, "step": 31233 }, { "epoch": 0.84, "learning_rate": 0.0001322967462473711, "loss": 2.3691, "step": 31234 }, { "epoch": 0.84, "learning_rate": 0.0001322534838697388, "loss": 2.1667, "step": 31235 }, { "epoch": 0.84, "learning_rate": 0.00013221022806599904, "loss": 2.6772, "step": 31236 }, { "epoch": 0.84, "learning_rate": 0.00013216697883647967, "loss": 2.5113, "step": 31237 }, { "epoch": 0.84, "learning_rate": 0.00013212373618150787, "loss": 2.5657, "step": 31238 }, { "epoch": 0.84, "learning_rate": 0.00013208050010141159, "loss": 2.3328, "step": 31239 }, { "epoch": 0.84, "learning_rate": 0.00013203727059651814, "loss": 2.9189, "step": 31240 }, { "epoch": 0.84, "learning_rate": 0.00013199404766715494, "loss": 2.2639, "step": 31241 }, { "epoch": 0.84, "learning_rate": 0.00013195083131365014, "loss": 2.763, "step": 31242 }, { "epoch": 0.84, "learning_rate": 0.00013190762153633041, "loss": 2.5518, "step": 31243 }, { "epoch": 0.84, "learning_rate": 0.00013186441833552321, "loss": 2.4809, "step": 31244 }, { "epoch": 0.84, "learning_rate": 0.0001318212217115563, "loss": 2.3892, "step": 31245 }, { "epoch": 0.84, "learning_rate": 0.00013177803166475644, "loss": 2.3691, "step": 31246 }, { "epoch": 0.84, "learning_rate": 0.00013173484819545088, "loss": 2.5254, "step": 31247 }, { "epoch": 0.84, "learning_rate": 0.00013169167130396687, "loss": 2.3573, "step": 31248 }, { "epoch": 0.84, "learning_rate": 0.00013164850099063152, "loss": 2.4319, "step": 31249 }, { "epoch": 0.84, "learning_rate": 0.00013160533725577216, "loss": 2.6766, "step": 31250 }, { "epoch": 0.84, "learning_rate": 0.00013156218009971533, "loss": 2.6855, "step": 31251 }, { "epoch": 0.84, "learning_rate": 0.00013151902952278805, "loss": 2.7425, "step": 31252 }, { "epoch": 0.84, "learning_rate": 0.00013147588552531763, "loss": 2.7261, "step": 31253 }, { "epoch": 0.84, "learning_rate": 0.00013143274810763016, "loss": 2.6286, "step": 31254 }, { "epoch": 0.84, "learning_rate": 0.0001313896172700534, "loss": 2.7292, "step": 31255 }, { "epoch": 0.84, "learning_rate": 0.00013134649301291325, "loss": 2.7077, "step": 31256 }, { "epoch": 0.84, "learning_rate": 0.0001313033753365369, "loss": 2.226, "step": 31257 }, { "epoch": 0.84, "learning_rate": 0.00013126026424125105, "loss": 2.2287, "step": 31258 }, { "epoch": 0.84, "learning_rate": 0.0001312171597273818, "loss": 2.0119, "step": 31259 }, { "epoch": 0.84, "learning_rate": 0.00013117406179525616, "loss": 2.5881, "step": 31260 }, { "epoch": 0.84, "learning_rate": 0.00013113097044520038, "loss": 2.2166, "step": 31261 }, { "epoch": 0.84, "learning_rate": 0.00013108788567754115, "loss": 2.4912, "step": 31262 }, { "epoch": 0.84, "learning_rate": 0.0001310448074926047, "loss": 2.3209, "step": 31263 }, { "epoch": 0.84, "learning_rate": 0.0001310017358907176, "loss": 2.1097, "step": 31264 }, { "epoch": 0.84, "learning_rate": 0.0001309586708722059, "loss": 2.598, "step": 31265 }, { "epoch": 0.84, "learning_rate": 0.00013091561243739602, "loss": 2.605, "step": 31266 }, { "epoch": 0.84, "learning_rate": 0.00013087256058661378, "loss": 2.5364, "step": 31267 }, { "epoch": 0.84, "learning_rate": 0.00013082951532018572, "loss": 2.5455, "step": 31268 }, { "epoch": 0.84, "learning_rate": 0.00013078647663843811, "loss": 2.7009, "step": 31269 }, { "epoch": 0.84, "learning_rate": 0.00013074344454169662, "loss": 2.4733, "step": 31270 }, { "epoch": 0.84, "learning_rate": 0.00013070041903028728, "loss": 2.3431, "step": 31271 }, { "epoch": 0.84, "learning_rate": 0.00013065740010453642, "loss": 2.3865, "step": 31272 }, { "epoch": 0.84, "learning_rate": 0.0001306143877647694, "loss": 2.535, "step": 31273 }, { "epoch": 0.84, "learning_rate": 0.00013057138201131246, "loss": 2.4661, "step": 31274 }, { "epoch": 0.84, "learning_rate": 0.0001305283828444912, "loss": 2.5385, "step": 31275 }, { "epoch": 0.84, "learning_rate": 0.00013048539026463147, "loss": 2.4927, "step": 31276 }, { "epoch": 0.84, "learning_rate": 0.00013044240427205922, "loss": 2.4578, "step": 31277 }, { "epoch": 0.84, "learning_rate": 0.00013039942486709966, "loss": 2.2024, "step": 31278 }, { "epoch": 0.84, "learning_rate": 0.0001303564520500785, "loss": 2.1462, "step": 31279 }, { "epoch": 0.84, "learning_rate": 0.00013031348582132142, "loss": 3.0409, "step": 31280 }, { "epoch": 0.84, "learning_rate": 0.00013027052618115386, "loss": 2.3602, "step": 31281 }, { "epoch": 0.84, "learning_rate": 0.00013022757312990162, "loss": 2.7857, "step": 31282 }, { "epoch": 0.84, "learning_rate": 0.00013018462666788944, "loss": 2.3869, "step": 31283 }, { "epoch": 0.84, "learning_rate": 0.00013014168679544315, "loss": 2.63, "step": 31284 }, { "epoch": 0.84, "learning_rate": 0.00013009875351288803, "loss": 1.9846, "step": 31285 }, { "epoch": 0.84, "learning_rate": 0.00013005582682054905, "loss": 2.8253, "step": 31286 }, { "epoch": 0.84, "learning_rate": 0.00013001290671875166, "loss": 2.4206, "step": 31287 }, { "epoch": 0.84, "learning_rate": 0.00012996999320782088, "loss": 2.4959, "step": 31288 }, { "epoch": 0.84, "learning_rate": 0.0001299270862880818, "loss": 2.3189, "step": 31289 }, { "epoch": 0.84, "learning_rate": 0.00012988418595985996, "loss": 2.6095, "step": 31290 }, { "epoch": 0.84, "learning_rate": 0.00012984129222347963, "loss": 2.4626, "step": 31291 }, { "epoch": 0.84, "learning_rate": 0.0001297984050792661, "loss": 2.9586, "step": 31292 }, { "epoch": 0.84, "learning_rate": 0.00012975552452754434, "loss": 2.4873, "step": 31293 }, { "epoch": 0.84, "learning_rate": 0.00012971265056863912, "loss": 2.4091, "step": 31294 }, { "epoch": 0.84, "learning_rate": 0.00012966978320287526, "loss": 2.7247, "step": 31295 }, { "epoch": 0.84, "learning_rate": 0.00012962692243057773, "loss": 2.2418, "step": 31296 }, { "epoch": 0.84, "learning_rate": 0.0001295840682520708, "loss": 2.3787, "step": 31297 }, { "epoch": 0.84, "learning_rate": 0.00012954122066767936, "loss": 2.6019, "step": 31298 }, { "epoch": 0.84, "learning_rate": 0.00012949837967772825, "loss": 2.6356, "step": 31299 }, { "epoch": 0.84, "learning_rate": 0.00012945554528254156, "loss": 2.5089, "step": 31300 }, { "epoch": 0.84, "learning_rate": 0.00012941271748244398, "loss": 2.1157, "step": 31301 }, { "epoch": 0.84, "learning_rate": 0.00012936989627775996, "loss": 2.4153, "step": 31302 }, { "epoch": 0.84, "learning_rate": 0.00012932708166881412, "loss": 2.3369, "step": 31303 }, { "epoch": 0.84, "learning_rate": 0.00012928427365593075, "loss": 2.3939, "step": 31304 }, { "epoch": 0.84, "learning_rate": 0.00012924147223943383, "loss": 2.5254, "step": 31305 }, { "epoch": 0.84, "learning_rate": 0.00012919867741964785, "loss": 1.7814, "step": 31306 }, { "epoch": 0.84, "learning_rate": 0.00012915588919689701, "loss": 2.4327, "step": 31307 }, { "epoch": 0.84, "learning_rate": 0.0001291131075715055, "loss": 2.5682, "step": 31308 }, { "epoch": 0.84, "learning_rate": 0.00012907033254379763, "loss": 2.4492, "step": 31309 }, { "epoch": 0.84, "learning_rate": 0.0001290275641140969, "loss": 2.2744, "step": 31310 }, { "epoch": 0.84, "learning_rate": 0.00012898480228272768, "loss": 2.616, "step": 31311 }, { "epoch": 0.84, "learning_rate": 0.0001289420470500141, "loss": 2.3044, "step": 31312 }, { "epoch": 0.84, "learning_rate": 0.00012889929841627956, "loss": 2.3115, "step": 31313 }, { "epoch": 0.84, "learning_rate": 0.000128856556381848, "loss": 2.5184, "step": 31314 }, { "epoch": 0.84, "learning_rate": 0.00012881382094704396, "loss": 2.447, "step": 31315 }, { "epoch": 0.84, "learning_rate": 0.0001287710921121903, "loss": 2.3798, "step": 31316 }, { "epoch": 0.84, "learning_rate": 0.00012872836987761139, "loss": 2.2493, "step": 31317 }, { "epoch": 0.84, "learning_rate": 0.00012868565424363032, "loss": 2.7065, "step": 31318 }, { "epoch": 0.84, "learning_rate": 0.00012864294521057097, "loss": 2.5053, "step": 31319 }, { "epoch": 0.84, "learning_rate": 0.00012860024277875693, "loss": 2.5366, "step": 31320 }, { "epoch": 0.84, "learning_rate": 0.00012855754694851164, "loss": 2.6683, "step": 31321 }, { "epoch": 0.84, "learning_rate": 0.00012851485772015858, "loss": 2.3288, "step": 31322 }, { "epoch": 0.84, "learning_rate": 0.0001284721750940213, "loss": 2.207, "step": 31323 }, { "epoch": 0.84, "learning_rate": 0.0001284294990704228, "loss": 2.2105, "step": 31324 }, { "epoch": 0.84, "learning_rate": 0.00012838682964968684, "loss": 2.6076, "step": 31325 }, { "epoch": 0.84, "learning_rate": 0.00012834416683213623, "loss": 2.5809, "step": 31326 }, { "epoch": 0.84, "learning_rate": 0.00012830151061809413, "loss": 2.7886, "step": 31327 }, { "epoch": 0.84, "learning_rate": 0.00012825886100788442, "loss": 2.6907, "step": 31328 }, { "epoch": 0.84, "learning_rate": 0.00012821621800182949, "loss": 2.6538, "step": 31329 }, { "epoch": 0.84, "learning_rate": 0.0001281735816002526, "loss": 2.6106, "step": 31330 }, { "epoch": 0.84, "learning_rate": 0.000128130951803477, "loss": 2.7499, "step": 31331 }, { "epoch": 0.84, "learning_rate": 0.00012808832861182528, "loss": 2.3747, "step": 31332 }, { "epoch": 0.84, "learning_rate": 0.00012804571202562043, "loss": 2.8046, "step": 31333 }, { "epoch": 0.84, "learning_rate": 0.00012800310204518539, "loss": 2.3082, "step": 31334 }, { "epoch": 0.84, "learning_rate": 0.00012796049867084302, "loss": 2.7697, "step": 31335 }, { "epoch": 0.84, "learning_rate": 0.0001279179019029162, "loss": 2.512, "step": 31336 }, { "epoch": 0.84, "learning_rate": 0.00012787531174172716, "loss": 2.0584, "step": 31337 }, { "epoch": 0.84, "learning_rate": 0.00012783272818759885, "loss": 2.2161, "step": 31338 }, { "epoch": 0.84, "learning_rate": 0.00012779015124085414, "loss": 2.7676, "step": 31339 }, { "epoch": 0.84, "learning_rate": 0.00012774758090181482, "loss": 2.6036, "step": 31340 }, { "epoch": 0.84, "learning_rate": 0.00012770501717080407, "loss": 2.4106, "step": 31341 }, { "epoch": 0.84, "learning_rate": 0.00012766246004814442, "loss": 2.7001, "step": 31342 }, { "epoch": 0.84, "learning_rate": 0.0001276199095341578, "loss": 2.8757, "step": 31343 }, { "epoch": 0.84, "learning_rate": 0.000127577365629167, "loss": 2.7349, "step": 31344 }, { "epoch": 0.84, "learning_rate": 0.00012753482833349384, "loss": 2.378, "step": 31345 }, { "epoch": 0.84, "learning_rate": 0.00012749229764746084, "loss": 2.6421, "step": 31346 }, { "epoch": 0.84, "learning_rate": 0.0001274497735713903, "loss": 2.2357, "step": 31347 }, { "epoch": 0.84, "learning_rate": 0.0001274072561056042, "loss": 2.0273, "step": 31348 }, { "epoch": 0.84, "learning_rate": 0.00012736474525042475, "loss": 2.8052, "step": 31349 }, { "epoch": 0.84, "learning_rate": 0.0001273222410061742, "loss": 2.5969, "step": 31350 }, { "epoch": 0.84, "learning_rate": 0.00012727974337317405, "loss": 2.6763, "step": 31351 }, { "epoch": 0.84, "learning_rate": 0.00012723725235174688, "loss": 2.4589, "step": 31352 }, { "epoch": 0.84, "learning_rate": 0.00012719476794221363, "loss": 2.5103, "step": 31353 }, { "epoch": 0.84, "learning_rate": 0.00012715229014489715, "loss": 2.7078, "step": 31354 }, { "epoch": 0.84, "learning_rate": 0.00012710981896011907, "loss": 2.4361, "step": 31355 }, { "epoch": 0.84, "learning_rate": 0.0001270673543882006, "loss": 2.1323, "step": 31356 }, { "epoch": 0.84, "learning_rate": 0.0001270248964294639, "loss": 3.0758, "step": 31357 }, { "epoch": 0.84, "learning_rate": 0.00012698244508423074, "loss": 2.7143, "step": 31358 }, { "epoch": 0.84, "learning_rate": 0.00012694000035282226, "loss": 2.3575, "step": 31359 }, { "epoch": 0.84, "learning_rate": 0.00012689756223556025, "loss": 2.2723, "step": 31360 }, { "epoch": 0.84, "learning_rate": 0.0001268551307327662, "loss": 2.7249, "step": 31361 }, { "epoch": 0.84, "learning_rate": 0.00012681270584476156, "loss": 2.5267, "step": 31362 }, { "epoch": 0.84, "learning_rate": 0.00012677028757186794, "loss": 2.5545, "step": 31363 }, { "epoch": 0.84, "learning_rate": 0.00012672787591440636, "loss": 2.1636, "step": 31364 }, { "epoch": 0.84, "learning_rate": 0.00012668547087269822, "loss": 2.4583, "step": 31365 }, { "epoch": 0.84, "learning_rate": 0.00012664307244706485, "loss": 2.4408, "step": 31366 }, { "epoch": 0.84, "learning_rate": 0.00012660068063782736, "loss": 2.6222, "step": 31367 }, { "epoch": 0.84, "learning_rate": 0.00012655829544530727, "loss": 2.3035, "step": 31368 }, { "epoch": 0.84, "learning_rate": 0.0001265159168698251, "loss": 2.5594, "step": 31369 }, { "epoch": 0.84, "learning_rate": 0.00012647354491170215, "loss": 2.1791, "step": 31370 }, { "epoch": 0.84, "learning_rate": 0.0001264311795712597, "loss": 2.7115, "step": 31371 }, { "epoch": 0.84, "learning_rate": 0.00012638882084881832, "loss": 2.4596, "step": 31372 }, { "epoch": 0.84, "learning_rate": 0.00012634646874469868, "loss": 2.0089, "step": 31373 }, { "epoch": 0.84, "learning_rate": 0.0001263041232592226, "loss": 2.3248, "step": 31374 }, { "epoch": 0.84, "learning_rate": 0.00012626178439270995, "loss": 2.364, "step": 31375 }, { "epoch": 0.84, "learning_rate": 0.00012621945214548181, "loss": 2.4034, "step": 31376 }, { "epoch": 0.84, "learning_rate": 0.00012617712651785917, "loss": 2.7256, "step": 31377 }, { "epoch": 0.84, "learning_rate": 0.00012613480751016203, "loss": 2.8992, "step": 31378 }, { "epoch": 0.84, "learning_rate": 0.00012609249512271148, "loss": 2.4166, "step": 31379 }, { "epoch": 0.84, "learning_rate": 0.000126050189355828, "loss": 2.3118, "step": 31380 }, { "epoch": 0.84, "learning_rate": 0.00012600789020983193, "loss": 2.1884, "step": 31381 }, { "epoch": 0.84, "learning_rate": 0.0001259655976850441, "loss": 2.1765, "step": 31382 }, { "epoch": 0.84, "learning_rate": 0.0001259233117817844, "loss": 2.2335, "step": 31383 }, { "epoch": 0.84, "learning_rate": 0.00012588103250037343, "loss": 2.8219, "step": 31384 }, { "epoch": 0.84, "learning_rate": 0.0001258387598411317, "loss": 2.0664, "step": 31385 }, { "epoch": 0.84, "learning_rate": 0.00012579649380437875, "loss": 2.6537, "step": 31386 }, { "epoch": 0.84, "learning_rate": 0.00012575423439043577, "loss": 2.668, "step": 31387 }, { "epoch": 0.84, "learning_rate": 0.00012571198159962217, "loss": 2.8931, "step": 31388 }, { "epoch": 0.84, "learning_rate": 0.00012566973543225824, "loss": 2.7454, "step": 31389 }, { "epoch": 0.84, "learning_rate": 0.0001256274958886644, "loss": 3.1288, "step": 31390 }, { "epoch": 0.84, "learning_rate": 0.00012558526296916006, "loss": 1.9453, "step": 31391 }, { "epoch": 0.84, "learning_rate": 0.0001255430366740654, "loss": 2.6793, "step": 31392 }, { "epoch": 0.84, "learning_rate": 0.0001255008170037004, "loss": 2.2229, "step": 31393 }, { "epoch": 0.84, "learning_rate": 0.00012545860395838483, "loss": 2.2143, "step": 31394 }, { "epoch": 0.84, "learning_rate": 0.00012541639753843882, "loss": 2.1537, "step": 31395 }, { "epoch": 0.84, "learning_rate": 0.00012537419774418147, "loss": 2.4599, "step": 31396 }, { "epoch": 0.84, "learning_rate": 0.00012533200457593297, "loss": 2.1541, "step": 31397 }, { "epoch": 0.84, "learning_rate": 0.00012528981803401295, "loss": 2.5034, "step": 31398 }, { "epoch": 0.84, "learning_rate": 0.0001252476381187405, "loss": 2.376, "step": 31399 }, { "epoch": 0.84, "learning_rate": 0.0001252054648304357, "loss": 2.7297, "step": 31400 }, { "epoch": 0.84, "learning_rate": 0.00012516329816941819, "loss": 2.5112, "step": 31401 }, { "epoch": 0.84, "learning_rate": 0.0001251211381360069, "loss": 2.8508, "step": 31402 }, { "epoch": 0.84, "learning_rate": 0.00012507898473052172, "loss": 1.919, "step": 31403 }, { "epoch": 0.84, "learning_rate": 0.00012503683795328136, "loss": 2.4626, "step": 31404 }, { "epoch": 0.84, "learning_rate": 0.0001249946978046056, "loss": 2.3958, "step": 31405 }, { "epoch": 0.84, "learning_rate": 0.0001249525642848136, "loss": 3.0031, "step": 31406 }, { "epoch": 0.84, "learning_rate": 0.00012491043739422449, "loss": 2.6089, "step": 31407 }, { "epoch": 0.84, "learning_rate": 0.0001248683171331574, "loss": 2.4211, "step": 31408 }, { "epoch": 0.84, "learning_rate": 0.00012482620350193175, "loss": 2.5827, "step": 31409 }, { "epoch": 0.84, "learning_rate": 0.00012478409650086607, "loss": 2.9221, "step": 31410 }, { "epoch": 0.84, "learning_rate": 0.0001247419961302796, "loss": 2.7138, "step": 31411 }, { "epoch": 0.84, "learning_rate": 0.00012469990239049133, "loss": 2.7333, "step": 31412 }, { "epoch": 0.84, "learning_rate": 0.00012465781528182008, "loss": 2.5407, "step": 31413 }, { "epoch": 0.84, "learning_rate": 0.000124615734804585, "loss": 2.5356, "step": 31414 }, { "epoch": 0.84, "learning_rate": 0.00012457366095910426, "loss": 2.805, "step": 31415 }, { "epoch": 0.84, "learning_rate": 0.0001245315937456971, "loss": 2.1733, "step": 31416 }, { "epoch": 0.84, "learning_rate": 0.00012448953316468225, "loss": 2.3451, "step": 31417 }, { "epoch": 0.84, "learning_rate": 0.0001244474792163779, "loss": 2.6615, "step": 31418 }, { "epoch": 0.84, "learning_rate": 0.00012440543190110297, "loss": 1.9385, "step": 31419 }, { "epoch": 0.84, "learning_rate": 0.00012436339121917584, "loss": 2.4625, "step": 31420 }, { "epoch": 0.84, "learning_rate": 0.0001243213571709152, "loss": 2.7112, "step": 31421 }, { "epoch": 0.84, "learning_rate": 0.0001242793297566396, "loss": 2.3214, "step": 31422 }, { "epoch": 0.84, "learning_rate": 0.00012423730897666708, "loss": 2.7779, "step": 31423 }, { "epoch": 0.84, "learning_rate": 0.00012419529483131609, "loss": 2.6673, "step": 31424 }, { "epoch": 0.84, "learning_rate": 0.00012415328732090492, "loss": 1.9684, "step": 31425 }, { "epoch": 0.84, "learning_rate": 0.00012411128644575187, "loss": 2.624, "step": 31426 }, { "epoch": 0.84, "learning_rate": 0.00012406929220617514, "loss": 2.2898, "step": 31427 }, { "epoch": 0.84, "learning_rate": 0.00012402730460249313, "loss": 2.216, "step": 31428 }, { "epoch": 0.84, "learning_rate": 0.00012398532363502336, "loss": 2.0445, "step": 31429 }, { "epoch": 0.84, "learning_rate": 0.00012394334930408436, "loss": 2.7382, "step": 31430 }, { "epoch": 0.84, "learning_rate": 0.00012390138160999376, "loss": 2.6403, "step": 31431 }, { "epoch": 0.84, "learning_rate": 0.00012385942055306954, "loss": 2.5135, "step": 31432 }, { "epoch": 0.84, "learning_rate": 0.00012381746613362987, "loss": 2.2535, "step": 31433 }, { "epoch": 0.84, "learning_rate": 0.0001237755183519923, "loss": 2.1488, "step": 31434 }, { "epoch": 0.84, "learning_rate": 0.0001237335772084749, "loss": 2.0691, "step": 31435 }, { "epoch": 0.84, "learning_rate": 0.00012369164270339538, "loss": 2.2366, "step": 31436 }, { "epoch": 0.84, "learning_rate": 0.0001236497148370711, "loss": 2.8033, "step": 31437 }, { "epoch": 0.84, "learning_rate": 0.0001236077936098199, "loss": 2.2553, "step": 31438 }, { "epoch": 0.84, "learning_rate": 0.00012356587902195937, "loss": 2.3985, "step": 31439 }, { "epoch": 0.84, "learning_rate": 0.00012352397107380698, "loss": 2.8104, "step": 31440 }, { "epoch": 0.84, "learning_rate": 0.00012348206976568065, "loss": 2.3238, "step": 31441 }, { "epoch": 0.84, "learning_rate": 0.00012344017509789706, "loss": 2.2784, "step": 31442 }, { "epoch": 0.84, "learning_rate": 0.00012339828707077418, "loss": 2.5733, "step": 31443 }, { "epoch": 0.85, "learning_rate": 0.00012335640568462926, "loss": 2.5312, "step": 31444 }, { "epoch": 0.85, "learning_rate": 0.0001233145309397793, "loss": 2.6247, "step": 31445 }, { "epoch": 0.85, "learning_rate": 0.0001232726628365415, "loss": 2.3518, "step": 31446 }, { "epoch": 0.85, "learning_rate": 0.0001232308013752337, "loss": 2.5952, "step": 31447 }, { "epoch": 0.85, "learning_rate": 0.0001231889465561723, "loss": 2.1322, "step": 31448 }, { "epoch": 0.85, "learning_rate": 0.00012314709837967498, "loss": 2.4333, "step": 31449 }, { "epoch": 0.85, "learning_rate": 0.0001231052568460582, "loss": 2.1691, "step": 31450 }, { "epoch": 0.85, "learning_rate": 0.00012306342195563924, "loss": 2.5979, "step": 31451 }, { "epoch": 0.85, "learning_rate": 0.0001230215937087351, "loss": 2.3442, "step": 31452 }, { "epoch": 0.85, "learning_rate": 0.00012297977210566248, "loss": 2.0486, "step": 31453 }, { "epoch": 0.85, "learning_rate": 0.00012293795714673838, "loss": 2.6448, "step": 31454 }, { "epoch": 0.85, "learning_rate": 0.00012289614883227961, "loss": 2.2444, "step": 31455 }, { "epoch": 0.85, "learning_rate": 0.0001228543471626027, "loss": 2.4888, "step": 31456 }, { "epoch": 0.85, "learning_rate": 0.00012281255213802468, "loss": 2.7441, "step": 31457 }, { "epoch": 0.85, "learning_rate": 0.00012277076375886165, "loss": 2.3387, "step": 31458 }, { "epoch": 0.85, "learning_rate": 0.00012272898202543025, "loss": 2.472, "step": 31459 }, { "epoch": 0.85, "learning_rate": 0.00012268720693804768, "loss": 2.4329, "step": 31460 }, { "epoch": 0.85, "learning_rate": 0.0001226454384970298, "loss": 2.9495, "step": 31461 }, { "epoch": 0.85, "learning_rate": 0.00012260367670269322, "loss": 2.1455, "step": 31462 }, { "epoch": 0.85, "learning_rate": 0.0001225619215553545, "loss": 2.5775, "step": 31463 }, { "epoch": 0.85, "learning_rate": 0.00012252017305532957, "loss": 2.2811, "step": 31464 }, { "epoch": 0.85, "learning_rate": 0.00012247843120293501, "loss": 2.7981, "step": 31465 }, { "epoch": 0.85, "learning_rate": 0.00012243669599848694, "loss": 2.4923, "step": 31466 }, { "epoch": 0.85, "learning_rate": 0.0001223949674423015, "loss": 2.2859, "step": 31467 }, { "epoch": 0.85, "learning_rate": 0.00012235324553469518, "loss": 2.6048, "step": 31468 }, { "epoch": 0.85, "learning_rate": 0.00012231153027598353, "loss": 2.6258, "step": 31469 }, { "epoch": 0.85, "learning_rate": 0.0001222698216664827, "loss": 2.7438, "step": 31470 }, { "epoch": 0.85, "learning_rate": 0.00012222811970650916, "loss": 2.2577, "step": 31471 }, { "epoch": 0.85, "learning_rate": 0.00012218642439637794, "loss": 2.4046, "step": 31472 }, { "epoch": 0.85, "learning_rate": 0.00012214473573640583, "loss": 2.3747, "step": 31473 }, { "epoch": 0.85, "learning_rate": 0.0001221030537269081, "loss": 2.543, "step": 31474 }, { "epoch": 0.85, "learning_rate": 0.00012206137836820063, "loss": 2.6129, "step": 31475 }, { "epoch": 0.85, "learning_rate": 0.0001220197096605995, "loss": 2.484, "step": 31476 }, { "epoch": 0.85, "learning_rate": 0.00012197804760441977, "loss": 2.9165, "step": 31477 }, { "epoch": 0.85, "learning_rate": 0.00012193639219997743, "loss": 2.6318, "step": 31478 }, { "epoch": 0.85, "learning_rate": 0.00012189474344758799, "loss": 2.6, "step": 31479 }, { "epoch": 0.85, "learning_rate": 0.000121853101347567, "loss": 2.7206, "step": 31480 }, { "epoch": 0.85, "learning_rate": 0.00012181146590022995, "loss": 1.9435, "step": 31481 }, { "epoch": 0.85, "learning_rate": 0.0001217698371058924, "loss": 2.4442, "step": 31482 }, { "epoch": 0.85, "learning_rate": 0.0001217282149648693, "loss": 2.0643, "step": 31483 }, { "epoch": 0.85, "learning_rate": 0.00012168659947747652, "loss": 2.534, "step": 31484 }, { "epoch": 0.85, "learning_rate": 0.00012164499064402845, "loss": 2.3813, "step": 31485 }, { "epoch": 0.85, "learning_rate": 0.00012160338846484132, "loss": 2.3708, "step": 31486 }, { "epoch": 0.85, "learning_rate": 0.00012156179294022995, "loss": 2.5723, "step": 31487 }, { "epoch": 0.85, "learning_rate": 0.00012152020407050923, "loss": 2.5592, "step": 31488 }, { "epoch": 0.85, "learning_rate": 0.00012147862185599434, "loss": 2.6669, "step": 31489 }, { "epoch": 0.85, "learning_rate": 0.00012143704629700059, "loss": 2.2752, "step": 31490 }, { "epoch": 0.85, "learning_rate": 0.00012139547739384249, "loss": 2.627, "step": 31491 }, { "epoch": 0.85, "learning_rate": 0.00012135391514683513, "loss": 2.1132, "step": 31492 }, { "epoch": 0.85, "learning_rate": 0.00012131235955629349, "loss": 2.1939, "step": 31493 }, { "epoch": 0.85, "learning_rate": 0.0001212708106225322, "loss": 2.6197, "step": 31494 }, { "epoch": 0.85, "learning_rate": 0.00012122926834586646, "loss": 2.4595, "step": 31495 }, { "epoch": 0.85, "learning_rate": 0.00012118773272661043, "loss": 2.2469, "step": 31496 }, { "epoch": 0.85, "learning_rate": 0.00012114620376507912, "loss": 2.6339, "step": 31497 }, { "epoch": 0.85, "learning_rate": 0.00012110468146158693, "loss": 2.4548, "step": 31498 }, { "epoch": 0.85, "learning_rate": 0.0001210631658164486, "loss": 2.754, "step": 31499 }, { "epoch": 0.85, "learning_rate": 0.00012102165682997879, "loss": 2.3763, "step": 31500 }, { "epoch": 0.85, "learning_rate": 0.00012098015450249155, "loss": 2.3596, "step": 31501 }, { "epoch": 0.85, "learning_rate": 0.00012093865883430145, "loss": 2.1125, "step": 31502 }, { "epoch": 0.85, "learning_rate": 0.00012089716982572319, "loss": 2.3004, "step": 31503 }, { "epoch": 0.85, "learning_rate": 0.00012085568747707055, "loss": 2.6537, "step": 31504 }, { "epoch": 0.85, "learning_rate": 0.00012081421178865803, "loss": 2.291, "step": 31505 }, { "epoch": 0.85, "learning_rate": 0.00012077274276079986, "loss": 2.6006, "step": 31506 }, { "epoch": 0.85, "learning_rate": 0.0001207312803938102, "loss": 2.6005, "step": 31507 }, { "epoch": 0.85, "learning_rate": 0.0001206898246880035, "loss": 2.6554, "step": 31508 }, { "epoch": 0.85, "learning_rate": 0.00012064837564369313, "loss": 2.2389, "step": 31509 }, { "epoch": 0.85, "learning_rate": 0.00012060693326119343, "loss": 2.6305, "step": 31510 }, { "epoch": 0.85, "learning_rate": 0.00012056549754081846, "loss": 2.439, "step": 31511 }, { "epoch": 0.85, "learning_rate": 0.00012052406848288211, "loss": 2.3109, "step": 31512 }, { "epoch": 0.85, "learning_rate": 0.0001204826460876981, "loss": 2.6319, "step": 31513 }, { "epoch": 0.85, "learning_rate": 0.00012044123035558052, "loss": 2.4347, "step": 31514 }, { "epoch": 0.85, "learning_rate": 0.00012039982128684268, "loss": 2.2478, "step": 31515 }, { "epoch": 0.85, "learning_rate": 0.00012035841888179888, "loss": 2.5153, "step": 31516 }, { "epoch": 0.85, "learning_rate": 0.0001203170231407621, "loss": 2.8637, "step": 31517 }, { "epoch": 0.85, "learning_rate": 0.00012027563406404629, "loss": 2.9767, "step": 31518 }, { "epoch": 0.85, "learning_rate": 0.00012023425165196511, "loss": 2.6965, "step": 31519 }, { "epoch": 0.85, "learning_rate": 0.00012019287590483185, "loss": 2.834, "step": 31520 }, { "epoch": 0.85, "learning_rate": 0.00012015150682296006, "loss": 2.6871, "step": 31521 }, { "epoch": 0.85, "learning_rate": 0.00012011014440666345, "loss": 2.6248, "step": 31522 }, { "epoch": 0.85, "learning_rate": 0.00012006878865625481, "loss": 2.641, "step": 31523 }, { "epoch": 0.85, "learning_rate": 0.00012002743957204765, "loss": 2.1967, "step": 31524 }, { "epoch": 0.85, "learning_rate": 0.00011998609715435537, "loss": 2.6923, "step": 31525 }, { "epoch": 0.85, "learning_rate": 0.00011994476140349108, "loss": 2.238, "step": 31526 }, { "epoch": 0.85, "learning_rate": 0.00011990343231976809, "loss": 2.2391, "step": 31527 }, { "epoch": 0.85, "learning_rate": 0.00011986210990349922, "loss": 2.4358, "step": 31528 }, { "epoch": 0.85, "learning_rate": 0.00011982079415499758, "loss": 1.8352, "step": 31529 }, { "epoch": 0.85, "learning_rate": 0.00011977948507457647, "loss": 2.5793, "step": 31530 }, { "epoch": 0.85, "learning_rate": 0.00011973818266254821, "loss": 2.6358, "step": 31531 }, { "epoch": 0.85, "learning_rate": 0.00011969688691922631, "loss": 2.1511, "step": 31532 }, { "epoch": 0.85, "learning_rate": 0.00011965559784492364, "loss": 2.2152, "step": 31533 }, { "epoch": 0.85, "learning_rate": 0.00011961431543995249, "loss": 2.4518, "step": 31534 }, { "epoch": 0.85, "learning_rate": 0.00011957303970462619, "loss": 2.8019, "step": 31535 }, { "epoch": 0.85, "learning_rate": 0.00011953177063925691, "loss": 2.7549, "step": 31536 }, { "epoch": 0.85, "learning_rate": 0.00011949050824415741, "loss": 2.4729, "step": 31537 }, { "epoch": 0.85, "learning_rate": 0.00011944925251964056, "loss": 2.5036, "step": 31538 }, { "epoch": 0.85, "learning_rate": 0.00011940800346601866, "loss": 2.2656, "step": 31539 }, { "epoch": 0.85, "learning_rate": 0.00011936676108360423, "loss": 1.9723, "step": 31540 }, { "epoch": 0.85, "learning_rate": 0.00011932552537271013, "loss": 2.5434, "step": 31541 }, { "epoch": 0.85, "learning_rate": 0.00011928429633364812, "loss": 2.1575, "step": 31542 }, { "epoch": 0.85, "learning_rate": 0.00011924307396673096, "loss": 2.437, "step": 31543 }, { "epoch": 0.85, "learning_rate": 0.00011920185827227047, "loss": 2.3793, "step": 31544 }, { "epoch": 0.85, "learning_rate": 0.00011916064925057945, "loss": 2.7883, "step": 31545 }, { "epoch": 0.85, "learning_rate": 0.00011911944690197007, "loss": 2.4643, "step": 31546 }, { "epoch": 0.85, "learning_rate": 0.00011907825122675408, "loss": 2.5989, "step": 31547 }, { "epoch": 0.85, "learning_rate": 0.00011903706222524368, "loss": 2.8575, "step": 31548 }, { "epoch": 0.85, "learning_rate": 0.0001189958798977513, "loss": 2.6852, "step": 31549 }, { "epoch": 0.85, "learning_rate": 0.00011895470424458832, "loss": 2.4451, "step": 31550 }, { "epoch": 0.85, "learning_rate": 0.00011891353526606707, "loss": 2.3026, "step": 31551 }, { "epoch": 0.85, "learning_rate": 0.00011887237296249931, "loss": 2.343, "step": 31552 }, { "epoch": 0.85, "learning_rate": 0.000118831217334197, "loss": 2.5789, "step": 31553 }, { "epoch": 0.85, "learning_rate": 0.00011879006838147188, "loss": 2.2118, "step": 31554 }, { "epoch": 0.85, "learning_rate": 0.00011874892610463561, "loss": 2.6418, "step": 31555 }, { "epoch": 0.85, "learning_rate": 0.00011870779050399993, "loss": 2.7144, "step": 31556 }, { "epoch": 0.85, "learning_rate": 0.00011866666157987638, "loss": 2.6414, "step": 31557 }, { "epoch": 0.85, "learning_rate": 0.0001186255393325767, "loss": 2.6154, "step": 31558 }, { "epoch": 0.85, "learning_rate": 0.0001185844237624123, "loss": 2.5798, "step": 31559 }, { "epoch": 0.85, "learning_rate": 0.00011854331486969494, "loss": 2.4452, "step": 31560 }, { "epoch": 0.85, "learning_rate": 0.0001185022126547356, "loss": 2.7766, "step": 31561 }, { "epoch": 0.85, "learning_rate": 0.00011846111711784624, "loss": 2.6782, "step": 31562 }, { "epoch": 0.85, "learning_rate": 0.0001184200282593375, "loss": 2.6626, "step": 31563 }, { "epoch": 0.85, "learning_rate": 0.00011837894607952104, "loss": 2.2937, "step": 31564 }, { "epoch": 0.85, "learning_rate": 0.00011833787057870815, "loss": 2.8139, "step": 31565 }, { "epoch": 0.85, "learning_rate": 0.00011829680175720992, "loss": 2.5174, "step": 31566 }, { "epoch": 0.85, "learning_rate": 0.00011825573961533743, "loss": 1.9893, "step": 31567 }, { "epoch": 0.85, "learning_rate": 0.00011821468415340197, "loss": 2.3886, "step": 31568 }, { "epoch": 0.85, "learning_rate": 0.00011817363537171433, "loss": 2.7004, "step": 31569 }, { "epoch": 0.85, "learning_rate": 0.00011813259327058545, "loss": 2.7364, "step": 31570 }, { "epoch": 0.85, "learning_rate": 0.00011809155785032643, "loss": 2.4428, "step": 31571 }, { "epoch": 0.85, "learning_rate": 0.00011805052911124814, "loss": 2.4044, "step": 31572 }, { "epoch": 0.85, "learning_rate": 0.00011800950705366154, "loss": 2.2158, "step": 31573 }, { "epoch": 0.85, "learning_rate": 0.00011796849167787705, "loss": 2.6524, "step": 31574 }, { "epoch": 0.85, "learning_rate": 0.00011792748298420552, "loss": 2.2633, "step": 31575 }, { "epoch": 0.85, "learning_rate": 0.00011788648097295796, "loss": 2.3947, "step": 31576 }, { "epoch": 0.85, "learning_rate": 0.00011784548564444441, "loss": 2.4425, "step": 31577 }, { "epoch": 0.85, "learning_rate": 0.00011780449699897577, "loss": 2.7611, "step": 31578 }, { "epoch": 0.85, "learning_rate": 0.00011776351503686266, "loss": 2.6831, "step": 31579 }, { "epoch": 0.85, "learning_rate": 0.00011772253975841529, "loss": 2.3247, "step": 31580 }, { "epoch": 0.85, "learning_rate": 0.00011768157116394451, "loss": 2.5658, "step": 31581 }, { "epoch": 0.85, "learning_rate": 0.00011764060925376008, "loss": 2.369, "step": 31582 }, { "epoch": 0.85, "learning_rate": 0.00011759965402817275, "loss": 2.4101, "step": 31583 }, { "epoch": 0.85, "learning_rate": 0.0001175587054874927, "loss": 2.2613, "step": 31584 }, { "epoch": 0.85, "learning_rate": 0.00011751776363203004, "loss": 2.5379, "step": 31585 }, { "epoch": 0.85, "learning_rate": 0.00011747682846209528, "loss": 2.7182, "step": 31586 }, { "epoch": 0.85, "learning_rate": 0.00011743589997799808, "loss": 2.6176, "step": 31587 }, { "epoch": 0.85, "learning_rate": 0.00011739497818004874, "loss": 2.275, "step": 31588 }, { "epoch": 0.85, "learning_rate": 0.00011735406306855744, "loss": 2.375, "step": 31589 }, { "epoch": 0.85, "learning_rate": 0.00011731315464383374, "loss": 2.5243, "step": 31590 }, { "epoch": 0.85, "learning_rate": 0.0001172722529061876, "loss": 2.5703, "step": 31591 }, { "epoch": 0.85, "learning_rate": 0.00011723135785592942, "loss": 2.4825, "step": 31592 }, { "epoch": 0.85, "learning_rate": 0.00011719046949336853, "loss": 2.4036, "step": 31593 }, { "epoch": 0.85, "learning_rate": 0.00011714958781881469, "loss": 2.2441, "step": 31594 }, { "epoch": 0.85, "learning_rate": 0.00011710871283257796, "loss": 2.1774, "step": 31595 }, { "epoch": 0.85, "learning_rate": 0.00011706784453496766, "loss": 3.0421, "step": 31596 }, { "epoch": 0.85, "learning_rate": 0.00011702698292629343, "loss": 2.4836, "step": 31597 }, { "epoch": 0.85, "learning_rate": 0.00011698612800686492, "loss": 2.2156, "step": 31598 }, { "epoch": 0.85, "learning_rate": 0.00011694527977699165, "loss": 2.7628, "step": 31599 }, { "epoch": 0.85, "learning_rate": 0.00011690443823698338, "loss": 2.1465, "step": 31600 }, { "epoch": 0.85, "learning_rate": 0.00011686360338714885, "loss": 2.7592, "step": 31601 }, { "epoch": 0.85, "learning_rate": 0.00011682277522779782, "loss": 2.3926, "step": 31602 }, { "epoch": 0.85, "learning_rate": 0.00011678195375923972, "loss": 2.2418, "step": 31603 }, { "epoch": 0.85, "learning_rate": 0.00011674113898178329, "loss": 2.1997, "step": 31604 }, { "epoch": 0.85, "learning_rate": 0.00011670033089573851, "loss": 2.5184, "step": 31605 }, { "epoch": 0.85, "learning_rate": 0.00011665952950141378, "loss": 2.4161, "step": 31606 }, { "epoch": 0.85, "learning_rate": 0.00011661873479911855, "loss": 2.1086, "step": 31607 }, { "epoch": 0.85, "learning_rate": 0.00011657794678916212, "loss": 2.5134, "step": 31608 }, { "epoch": 0.85, "learning_rate": 0.000116537165471853, "loss": 2.8248, "step": 31609 }, { "epoch": 0.85, "learning_rate": 0.0001164963908475004, "loss": 2.8096, "step": 31610 }, { "epoch": 0.85, "learning_rate": 0.0001164556229164131, "loss": 2.3514, "step": 31611 }, { "epoch": 0.85, "learning_rate": 0.00011641486167890014, "loss": 2.1678, "step": 31612 }, { "epoch": 0.85, "learning_rate": 0.00011637410713527042, "loss": 2.0894, "step": 31613 }, { "epoch": 0.85, "learning_rate": 0.00011633335928583222, "loss": 2.2797, "step": 31614 }, { "epoch": 0.85, "learning_rate": 0.00011629261813089454, "loss": 2.8189, "step": 31615 }, { "epoch": 0.85, "learning_rate": 0.00011625188367076611, "loss": 2.1793, "step": 31616 }, { "epoch": 0.85, "learning_rate": 0.00011621115590575504, "loss": 2.4324, "step": 31617 }, { "epoch": 0.85, "learning_rate": 0.00011617043483617051, "loss": 2.2653, "step": 31618 }, { "epoch": 0.85, "learning_rate": 0.00011612972046232096, "loss": 2.3306, "step": 31619 }, { "epoch": 0.85, "learning_rate": 0.00011608901278451434, "loss": 2.7977, "step": 31620 }, { "epoch": 0.85, "learning_rate": 0.00011604831180305963, "loss": 2.2368, "step": 31621 }, { "epoch": 0.85, "learning_rate": 0.00011600761751826461, "loss": 2.3941, "step": 31622 }, { "epoch": 0.85, "learning_rate": 0.00011596692993043778, "loss": 2.3444, "step": 31623 }, { "epoch": 0.85, "learning_rate": 0.00011592624903988758, "loss": 2.9741, "step": 31624 }, { "epoch": 0.85, "learning_rate": 0.00011588557484692197, "loss": 2.4777, "step": 31625 }, { "epoch": 0.85, "learning_rate": 0.00011584490735184916, "loss": 2.6092, "step": 31626 }, { "epoch": 0.85, "learning_rate": 0.00011580424655497757, "loss": 2.0109, "step": 31627 }, { "epoch": 0.85, "learning_rate": 0.0001157635924566146, "loss": 2.5252, "step": 31628 }, { "epoch": 0.85, "learning_rate": 0.00011572294505706882, "loss": 2.1871, "step": 31629 }, { "epoch": 0.85, "learning_rate": 0.0001156823043566475, "loss": 2.6415, "step": 31630 }, { "epoch": 0.85, "learning_rate": 0.0001156416703556592, "loss": 2.8887, "step": 31631 }, { "epoch": 0.85, "learning_rate": 0.00011560104305441166, "loss": 2.5593, "step": 31632 }, { "epoch": 0.85, "learning_rate": 0.0001155604224532123, "loss": 2.6131, "step": 31633 }, { "epoch": 0.85, "learning_rate": 0.00011551980855236898, "loss": 2.2489, "step": 31634 }, { "epoch": 0.85, "learning_rate": 0.00011547920135218981, "loss": 2.9964, "step": 31635 }, { "epoch": 0.85, "learning_rate": 0.00011543860085298175, "loss": 2.2648, "step": 31636 }, { "epoch": 0.85, "learning_rate": 0.00011539800705505277, "loss": 2.1671, "step": 31637 }, { "epoch": 0.85, "learning_rate": 0.00011535741995871029, "loss": 2.6645, "step": 31638 }, { "epoch": 0.85, "learning_rate": 0.00011531683956426187, "loss": 2.5601, "step": 31639 }, { "epoch": 0.85, "learning_rate": 0.00011527626587201512, "loss": 2.7994, "step": 31640 }, { "epoch": 0.85, "learning_rate": 0.00011523569888227703, "loss": 2.4826, "step": 31641 }, { "epoch": 0.85, "learning_rate": 0.00011519513859535503, "loss": 3.0877, "step": 31642 }, { "epoch": 0.85, "learning_rate": 0.00011515458501155651, "loss": 2.435, "step": 31643 }, { "epoch": 0.85, "learning_rate": 0.0001151140381311887, "loss": 2.5348, "step": 31644 }, { "epoch": 0.85, "learning_rate": 0.00011507349795455868, "loss": 2.6104, "step": 31645 }, { "epoch": 0.85, "learning_rate": 0.00011503296448197376, "loss": 2.4492, "step": 31646 }, { "epoch": 0.85, "learning_rate": 0.0001149924377137408, "loss": 2.7217, "step": 31647 }, { "epoch": 0.85, "learning_rate": 0.00011495191765016711, "loss": 2.4982, "step": 31648 }, { "epoch": 0.85, "learning_rate": 0.00011491140429155921, "loss": 2.6337, "step": 31649 }, { "epoch": 0.85, "learning_rate": 0.00011487089763822422, "loss": 2.2033, "step": 31650 }, { "epoch": 0.85, "learning_rate": 0.00011483039769046911, "loss": 2.4423, "step": 31651 }, { "epoch": 0.85, "learning_rate": 0.00011478990444860072, "loss": 2.7491, "step": 31652 }, { "epoch": 0.85, "learning_rate": 0.0001147494179129257, "loss": 2.112, "step": 31653 }, { "epoch": 0.85, "learning_rate": 0.00011470893808375105, "loss": 2.7063, "step": 31654 }, { "epoch": 0.85, "learning_rate": 0.00011466846496138295, "loss": 2.3711, "step": 31655 }, { "epoch": 0.85, "learning_rate": 0.00011462799854612827, "loss": 2.5178, "step": 31656 }, { "epoch": 0.85, "learning_rate": 0.00011458753883829365, "loss": 2.5928, "step": 31657 }, { "epoch": 0.85, "learning_rate": 0.00011454708583818552, "loss": 2.2628, "step": 31658 }, { "epoch": 0.85, "learning_rate": 0.00011450663954611052, "loss": 2.9173, "step": 31659 }, { "epoch": 0.85, "learning_rate": 0.00011446619996237473, "loss": 2.4371, "step": 31660 }, { "epoch": 0.85, "learning_rate": 0.00011442576708728481, "loss": 2.2648, "step": 31661 }, { "epoch": 0.85, "learning_rate": 0.00011438534092114694, "loss": 2.9209, "step": 31662 }, { "epoch": 0.85, "learning_rate": 0.00011434492146426733, "loss": 2.4668, "step": 31663 }, { "epoch": 0.85, "learning_rate": 0.0001143045087169522, "loss": 2.5439, "step": 31664 }, { "epoch": 0.85, "learning_rate": 0.00011426410267950782, "loss": 2.5175, "step": 31665 }, { "epoch": 0.85, "learning_rate": 0.0001142237033522402, "loss": 2.6531, "step": 31666 }, { "epoch": 0.85, "learning_rate": 0.00011418331073545562, "loss": 2.1537, "step": 31667 }, { "epoch": 0.85, "learning_rate": 0.00011414292482945976, "loss": 2.6544, "step": 31668 }, { "epoch": 0.85, "learning_rate": 0.0001141025456345588, "loss": 2.3478, "step": 31669 }, { "epoch": 0.85, "learning_rate": 0.00011406217315105839, "loss": 2.5694, "step": 31670 }, { "epoch": 0.85, "learning_rate": 0.0001140218073792647, "loss": 2.5261, "step": 31671 }, { "epoch": 0.85, "learning_rate": 0.00011398144831948332, "loss": 2.5257, "step": 31672 }, { "epoch": 0.85, "learning_rate": 0.00011394109597202029, "loss": 2.5072, "step": 31673 }, { "epoch": 0.85, "learning_rate": 0.00011390075033718094, "loss": 2.3108, "step": 31674 }, { "epoch": 0.85, "learning_rate": 0.00011386041141527126, "loss": 2.3423, "step": 31675 }, { "epoch": 0.85, "learning_rate": 0.00011382007920659654, "loss": 2.1537, "step": 31676 }, { "epoch": 0.85, "learning_rate": 0.0001137797537114622, "loss": 2.6574, "step": 31677 }, { "epoch": 0.85, "learning_rate": 0.00011373943493017447, "loss": 2.4245, "step": 31678 }, { "epoch": 0.85, "learning_rate": 0.00011369912286303807, "loss": 2.518, "step": 31679 }, { "epoch": 0.85, "learning_rate": 0.00011365881751035867, "loss": 2.4066, "step": 31680 }, { "epoch": 0.85, "learning_rate": 0.0001136185188724418, "loss": 2.4386, "step": 31681 }, { "epoch": 0.85, "learning_rate": 0.00011357822694959241, "loss": 2.4902, "step": 31682 }, { "epoch": 0.85, "learning_rate": 0.00011353794174211584, "loss": 2.4719, "step": 31683 }, { "epoch": 0.85, "learning_rate": 0.0001134976632503173, "loss": 2.9838, "step": 31684 }, { "epoch": 0.85, "learning_rate": 0.00011345739147450207, "loss": 2.3102, "step": 31685 }, { "epoch": 0.85, "learning_rate": 0.00011341712641497526, "loss": 2.6395, "step": 31686 }, { "epoch": 0.85, "learning_rate": 0.00011337686807204161, "loss": 2.3824, "step": 31687 }, { "epoch": 0.85, "learning_rate": 0.00011333661644600634, "loss": 2.4986, "step": 31688 }, { "epoch": 0.85, "learning_rate": 0.00011329637153717454, "loss": 2.3922, "step": 31689 }, { "epoch": 0.85, "learning_rate": 0.0001132561333458505, "loss": 2.8424, "step": 31690 }, { "epoch": 0.85, "learning_rate": 0.00011321590187233977, "loss": 2.2583, "step": 31691 }, { "epoch": 0.85, "learning_rate": 0.00011317567711694677, "loss": 2.2863, "step": 31692 }, { "epoch": 0.85, "learning_rate": 0.00011313545907997614, "loss": 2.6832, "step": 31693 }, { "epoch": 0.85, "learning_rate": 0.00011309524776173307, "loss": 2.0254, "step": 31694 }, { "epoch": 0.85, "learning_rate": 0.00011305504316252158, "loss": 2.5104, "step": 31695 }, { "epoch": 0.85, "learning_rate": 0.00011301484528264649, "loss": 2.582, "step": 31696 }, { "epoch": 0.85, "learning_rate": 0.00011297465412241226, "loss": 2.2997, "step": 31697 }, { "epoch": 0.85, "learning_rate": 0.00011293446968212362, "loss": 2.5694, "step": 31698 }, { "epoch": 0.85, "learning_rate": 0.00011289429196208501, "loss": 2.6284, "step": 31699 }, { "epoch": 0.85, "learning_rate": 0.0001128541209626004, "loss": 2.367, "step": 31700 }, { "epoch": 0.85, "learning_rate": 0.00011281395668397442, "loss": 2.5211, "step": 31701 }, { "epoch": 0.85, "learning_rate": 0.0001127737991265112, "loss": 2.7008, "step": 31702 }, { "epoch": 0.85, "learning_rate": 0.00011273364829051514, "loss": 2.3966, "step": 31703 }, { "epoch": 0.85, "learning_rate": 0.00011269350417629032, "loss": 2.2936, "step": 31704 }, { "epoch": 0.85, "learning_rate": 0.00011265336678414107, "loss": 2.8839, "step": 31705 }, { "epoch": 0.85, "learning_rate": 0.00011261323611437102, "loss": 2.6666, "step": 31706 }, { "epoch": 0.85, "learning_rate": 0.0001125731121672845, "loss": 2.2409, "step": 31707 }, { "epoch": 0.85, "learning_rate": 0.00011253299494318559, "loss": 2.4461, "step": 31708 }, { "epoch": 0.85, "learning_rate": 0.00011249288444237782, "loss": 2.1148, "step": 31709 }, { "epoch": 0.85, "learning_rate": 0.0001124527806651654, "loss": 2.257, "step": 31710 }, { "epoch": 0.85, "learning_rate": 0.00011241268361185197, "loss": 2.0711, "step": 31711 }, { "epoch": 0.85, "learning_rate": 0.0001123725932827413, "loss": 2.5577, "step": 31712 }, { "epoch": 0.85, "learning_rate": 0.00011233250967813746, "loss": 2.4384, "step": 31713 }, { "epoch": 0.85, "learning_rate": 0.00011229243279834355, "loss": 2.3842, "step": 31714 }, { "epoch": 0.85, "learning_rate": 0.00011225236264366356, "loss": 2.5009, "step": 31715 }, { "epoch": 0.85, "learning_rate": 0.0001122122992144009, "loss": 2.2221, "step": 31716 }, { "epoch": 0.85, "learning_rate": 0.00011217224251085911, "loss": 2.454, "step": 31717 }, { "epoch": 0.85, "learning_rate": 0.00011213219253334195, "loss": 2.1382, "step": 31718 }, { "epoch": 0.85, "learning_rate": 0.00011209214928215239, "loss": 2.7865, "step": 31719 }, { "epoch": 0.85, "learning_rate": 0.00011205211275759386, "loss": 2.2673, "step": 31720 }, { "epoch": 0.85, "learning_rate": 0.00011201208295997001, "loss": 2.3044, "step": 31721 }, { "epoch": 0.85, "learning_rate": 0.0001119720598895837, "loss": 2.5269, "step": 31722 }, { "epoch": 0.85, "learning_rate": 0.00011193204354673803, "loss": 2.5926, "step": 31723 }, { "epoch": 0.85, "learning_rate": 0.00011189203393173686, "loss": 2.1398, "step": 31724 }, { "epoch": 0.85, "learning_rate": 0.00011185203104488273, "loss": 2.292, "step": 31725 }, { "epoch": 0.85, "learning_rate": 0.00011181203488647895, "loss": 2.1861, "step": 31726 }, { "epoch": 0.85, "learning_rate": 0.00011177204545682817, "loss": 2.6896, "step": 31727 }, { "epoch": 0.85, "learning_rate": 0.0001117320627562336, "loss": 2.412, "step": 31728 }, { "epoch": 0.85, "learning_rate": 0.0001116920867849982, "loss": 2.4283, "step": 31729 }, { "epoch": 0.85, "learning_rate": 0.00011165211754342464, "loss": 2.6236, "step": 31730 }, { "epoch": 0.85, "learning_rate": 0.00011161215503181588, "loss": 1.9597, "step": 31731 }, { "epoch": 0.85, "learning_rate": 0.00011157219925047468, "loss": 2.4248, "step": 31732 }, { "epoch": 0.85, "learning_rate": 0.0001115322501997036, "loss": 2.4599, "step": 31733 }, { "epoch": 0.85, "learning_rate": 0.00011149230787980547, "loss": 2.841, "step": 31734 }, { "epoch": 0.85, "learning_rate": 0.00011145237229108262, "loss": 2.9043, "step": 31735 }, { "epoch": 0.85, "learning_rate": 0.0001114124434338375, "loss": 2.0959, "step": 31736 }, { "epoch": 0.85, "learning_rate": 0.00011137252130837328, "loss": 2.3434, "step": 31737 }, { "epoch": 0.85, "learning_rate": 0.00011133260591499172, "loss": 2.5303, "step": 31738 }, { "epoch": 0.85, "learning_rate": 0.00011129269725399548, "loss": 2.6556, "step": 31739 }, { "epoch": 0.85, "learning_rate": 0.0001112527953256871, "loss": 2.4698, "step": 31740 }, { "epoch": 0.85, "learning_rate": 0.00011121290013036844, "loss": 2.1045, "step": 31741 }, { "epoch": 0.85, "learning_rate": 0.00011117301166834193, "loss": 2.3715, "step": 31742 }, { "epoch": 0.85, "learning_rate": 0.00011113312993990987, "loss": 2.2528, "step": 31743 }, { "epoch": 0.85, "learning_rate": 0.00011109325494537414, "loss": 2.3778, "step": 31744 }, { "epoch": 0.85, "learning_rate": 0.00011105338668503728, "loss": 2.6463, "step": 31745 }, { "epoch": 0.85, "learning_rate": 0.00011101352515920082, "loss": 2.0485, "step": 31746 }, { "epoch": 0.85, "learning_rate": 0.00011097367036816697, "loss": 2.9012, "step": 31747 }, { "epoch": 0.85, "learning_rate": 0.00011093382231223792, "loss": 2.6954, "step": 31748 }, { "epoch": 0.85, "learning_rate": 0.00011089398099171476, "loss": 2.3989, "step": 31749 }, { "epoch": 0.85, "learning_rate": 0.00011085414640690006, "loss": 2.2958, "step": 31750 }, { "epoch": 0.85, "learning_rate": 0.00011081431855809565, "loss": 2.472, "step": 31751 }, { "epoch": 0.85, "learning_rate": 0.00011077449744560276, "loss": 2.6499, "step": 31752 }, { "epoch": 0.85, "learning_rate": 0.00011073468306972345, "loss": 2.2295, "step": 31753 }, { "epoch": 0.85, "learning_rate": 0.00011069487543075907, "loss": 2.4886, "step": 31754 }, { "epoch": 0.85, "learning_rate": 0.00011065507452901125, "loss": 2.2343, "step": 31755 }, { "epoch": 0.85, "learning_rate": 0.00011061528036478164, "loss": 2.0851, "step": 31756 }, { "epoch": 0.85, "learning_rate": 0.00011057549293837166, "loss": 2.1785, "step": 31757 }, { "epoch": 0.85, "learning_rate": 0.00011053571225008274, "loss": 2.5852, "step": 31758 }, { "epoch": 0.85, "learning_rate": 0.00011049593830021642, "loss": 2.3384, "step": 31759 }, { "epoch": 0.85, "learning_rate": 0.00011045617108907357, "loss": 2.7674, "step": 31760 }, { "epoch": 0.85, "learning_rate": 0.00011041641061695607, "loss": 2.1455, "step": 31761 }, { "epoch": 0.85, "learning_rate": 0.00011037665688416432, "loss": 2.8292, "step": 31762 }, { "epoch": 0.85, "learning_rate": 0.0001103369098910002, "loss": 2.3359, "step": 31763 }, { "epoch": 0.85, "learning_rate": 0.00011029716963776471, "loss": 2.5061, "step": 31764 }, { "epoch": 0.85, "learning_rate": 0.00011025743612475869, "loss": 2.9475, "step": 31765 }, { "epoch": 0.85, "learning_rate": 0.00011021770935228326, "loss": 1.976, "step": 31766 }, { "epoch": 0.85, "learning_rate": 0.00011017798932063949, "loss": 2.2126, "step": 31767 }, { "epoch": 0.85, "learning_rate": 0.00011013827603012804, "loss": 2.6365, "step": 31768 }, { "epoch": 0.85, "learning_rate": 0.00011009856948105002, "loss": 2.4001, "step": 31769 }, { "epoch": 0.85, "learning_rate": 0.00011005886967370604, "loss": 2.5781, "step": 31770 }, { "epoch": 0.85, "learning_rate": 0.00011001917660839699, "loss": 2.6348, "step": 31771 }, { "epoch": 0.85, "learning_rate": 0.00010997949028542364, "loss": 2.5003, "step": 31772 }, { "epoch": 0.85, "learning_rate": 0.00010993981070508652, "loss": 2.5331, "step": 31773 }, { "epoch": 0.85, "learning_rate": 0.00010990013786768615, "loss": 2.2489, "step": 31774 }, { "epoch": 0.85, "learning_rate": 0.00010986047177352321, "loss": 2.1141, "step": 31775 }, { "epoch": 0.85, "learning_rate": 0.0001098208124228982, "loss": 2.3958, "step": 31776 }, { "epoch": 0.85, "learning_rate": 0.00010978115981611181, "loss": 2.3411, "step": 31777 }, { "epoch": 0.85, "learning_rate": 0.000109741513953464, "loss": 2.2213, "step": 31778 }, { "epoch": 0.85, "learning_rate": 0.00010970187483525529, "loss": 2.6123, "step": 31779 }, { "epoch": 0.85, "learning_rate": 0.00010966224246178613, "loss": 2.406, "step": 31780 }, { "epoch": 0.85, "learning_rate": 0.00010962261683335661, "loss": 2.8159, "step": 31781 }, { "epoch": 0.85, "learning_rate": 0.00010958299795026683, "loss": 2.2003, "step": 31782 }, { "epoch": 0.85, "learning_rate": 0.00010954338581281708, "loss": 2.592, "step": 31783 }, { "epoch": 0.85, "learning_rate": 0.00010950378042130749, "loss": 2.5117, "step": 31784 }, { "epoch": 0.85, "learning_rate": 0.00010946418177603801, "loss": 2.1598, "step": 31785 }, { "epoch": 0.85, "learning_rate": 0.00010942458987730885, "loss": 2.7954, "step": 31786 }, { "epoch": 0.85, "learning_rate": 0.00010938500472541968, "loss": 2.3683, "step": 31787 }, { "epoch": 0.85, "learning_rate": 0.00010934542632067046, "loss": 2.3263, "step": 31788 }, { "epoch": 0.85, "learning_rate": 0.00010930585466336095, "loss": 2.2372, "step": 31789 }, { "epoch": 0.85, "learning_rate": 0.00010926628975379116, "loss": 2.6346, "step": 31790 }, { "epoch": 0.85, "learning_rate": 0.00010922673159226083, "loss": 2.7114, "step": 31791 }, { "epoch": 0.85, "learning_rate": 0.00010918718017906936, "loss": 1.9801, "step": 31792 }, { "epoch": 0.85, "learning_rate": 0.00010914763551451656, "loss": 3.0465, "step": 31793 }, { "epoch": 0.85, "learning_rate": 0.00010910809759890228, "loss": 2.3446, "step": 31794 }, { "epoch": 0.85, "learning_rate": 0.00010906856643252539, "loss": 2.2249, "step": 31795 }, { "epoch": 0.85, "learning_rate": 0.00010902904201568587, "loss": 2.6175, "step": 31796 }, { "epoch": 0.85, "learning_rate": 0.00010898952434868304, "loss": 2.5302, "step": 31797 }, { "epoch": 0.85, "learning_rate": 0.00010895001343181632, "loss": 2.2364, "step": 31798 }, { "epoch": 0.85, "learning_rate": 0.00010891050926538515, "loss": 2.4896, "step": 31799 }, { "epoch": 0.85, "learning_rate": 0.0001088710118496884, "loss": 2.9379, "step": 31800 }, { "epoch": 0.85, "learning_rate": 0.0001088315211850256, "loss": 2.3708, "step": 31801 }, { "epoch": 0.85, "learning_rate": 0.00010879203727169585, "loss": 2.353, "step": 31802 }, { "epoch": 0.85, "learning_rate": 0.00010875256010999824, "loss": 2.8805, "step": 31803 }, { "epoch": 0.85, "learning_rate": 0.00010871308970023219, "loss": 2.9703, "step": 31804 }, { "epoch": 0.85, "learning_rate": 0.00010867362604269615, "loss": 2.4733, "step": 31805 }, { "epoch": 0.85, "learning_rate": 0.00010863416913768943, "loss": 2.504, "step": 31806 }, { "epoch": 0.85, "learning_rate": 0.0001085947189855111, "loss": 2.324, "step": 31807 }, { "epoch": 0.85, "learning_rate": 0.0001085552755864595, "loss": 2.2163, "step": 31808 }, { "epoch": 0.85, "learning_rate": 0.0001085158389408336, "loss": 2.6076, "step": 31809 }, { "epoch": 0.85, "learning_rate": 0.00010847640904893274, "loss": 2.4391, "step": 31810 }, { "epoch": 0.85, "learning_rate": 0.00010843698591105511, "loss": 2.6064, "step": 31811 }, { "epoch": 0.85, "learning_rate": 0.00010839756952749957, "loss": 2.1979, "step": 31812 }, { "epoch": 0.85, "learning_rate": 0.00010835815989856446, "loss": 2.2521, "step": 31813 }, { "epoch": 0.85, "learning_rate": 0.00010831875702454852, "loss": 2.7625, "step": 31814 }, { "epoch": 0.85, "learning_rate": 0.00010827936090575019, "loss": 2.0511, "step": 31815 }, { "epoch": 0.86, "learning_rate": 0.00010823997154246812, "loss": 2.629, "step": 31816 }, { "epoch": 0.86, "learning_rate": 0.00010820058893500051, "loss": 2.4208, "step": 31817 }, { "epoch": 0.86, "learning_rate": 0.00010816121308364602, "loss": 2.6025, "step": 31818 }, { "epoch": 0.86, "learning_rate": 0.00010812184398870251, "loss": 2.5977, "step": 31819 }, { "epoch": 0.86, "learning_rate": 0.00010808248165046852, "loss": 2.6481, "step": 31820 }, { "epoch": 0.86, "learning_rate": 0.00010804312606924238, "loss": 2.6236, "step": 31821 }, { "epoch": 0.86, "learning_rate": 0.00010800377724532163, "loss": 2.8254, "step": 31822 }, { "epoch": 0.86, "learning_rate": 0.00010796443517900512, "loss": 2.5998, "step": 31823 }, { "epoch": 0.86, "learning_rate": 0.0001079250998705904, "loss": 2.2986, "step": 31824 }, { "epoch": 0.86, "learning_rate": 0.0001078857713203757, "loss": 2.6763, "step": 31825 }, { "epoch": 0.86, "learning_rate": 0.00010784644952865907, "loss": 2.3871, "step": 31826 }, { "epoch": 0.86, "learning_rate": 0.0001078071344957381, "loss": 2.422, "step": 31827 }, { "epoch": 0.86, "learning_rate": 0.00010776782622191062, "loss": 2.4887, "step": 31828 }, { "epoch": 0.86, "learning_rate": 0.00010772852470747474, "loss": 2.4608, "step": 31829 }, { "epoch": 0.86, "learning_rate": 0.0001076892299527279, "loss": 2.3725, "step": 31830 }, { "epoch": 0.86, "learning_rate": 0.00010764994195796818, "loss": 2.8526, "step": 31831 }, { "epoch": 0.86, "learning_rate": 0.0001076106607234928, "loss": 2.8107, "step": 31832 }, { "epoch": 0.86, "learning_rate": 0.00010757138624959939, "loss": 2.7724, "step": 31833 }, { "epoch": 0.86, "learning_rate": 0.00010753211853658596, "loss": 2.5482, "step": 31834 }, { "epoch": 0.86, "learning_rate": 0.00010749285758474914, "loss": 2.3977, "step": 31835 }, { "epoch": 0.86, "learning_rate": 0.00010745360339438703, "loss": 2.5331, "step": 31836 }, { "epoch": 0.86, "learning_rate": 0.00010741435596579719, "loss": 2.3315, "step": 31837 }, { "epoch": 0.86, "learning_rate": 0.00010737511529927624, "loss": 2.4761, "step": 31838 }, { "epoch": 0.86, "learning_rate": 0.00010733588139512219, "loss": 2.5414, "step": 31839 }, { "epoch": 0.86, "learning_rate": 0.00010729665425363167, "loss": 2.3764, "step": 31840 }, { "epoch": 0.86, "learning_rate": 0.000107257433875102, "loss": 2.6342, "step": 31841 }, { "epoch": 0.86, "learning_rate": 0.00010721822025983052, "loss": 2.5586, "step": 31842 }, { "epoch": 0.86, "learning_rate": 0.0001071790134081141, "loss": 2.4627, "step": 31843 }, { "epoch": 0.86, "learning_rate": 0.00010713981332024991, "loss": 2.4758, "step": 31844 }, { "epoch": 0.86, "learning_rate": 0.00010710061999653498, "loss": 2.5953, "step": 31845 }, { "epoch": 0.86, "learning_rate": 0.00010706143343726604, "loss": 2.3325, "step": 31846 }, { "epoch": 0.86, "learning_rate": 0.00010702225364274021, "loss": 2.7842, "step": 31847 }, { "epoch": 0.86, "learning_rate": 0.00010698308061325368, "loss": 2.5378, "step": 31848 }, { "epoch": 0.86, "learning_rate": 0.00010694391434910389, "loss": 2.7127, "step": 31849 }, { "epoch": 0.86, "learning_rate": 0.0001069047548505876, "loss": 2.0931, "step": 31850 }, { "epoch": 0.86, "learning_rate": 0.0001068656021180009, "loss": 2.7429, "step": 31851 }, { "epoch": 0.86, "learning_rate": 0.00010682645615164088, "loss": 2.7482, "step": 31852 }, { "epoch": 0.86, "learning_rate": 0.00010678731695180399, "loss": 2.4284, "step": 31853 }, { "epoch": 0.86, "learning_rate": 0.00010674818451878654, "loss": 2.8808, "step": 31854 }, { "epoch": 0.86, "learning_rate": 0.00010670905885288518, "loss": 2.7229, "step": 31855 }, { "epoch": 0.86, "learning_rate": 0.00010666993995439633, "loss": 2.6705, "step": 31856 }, { "epoch": 0.86, "learning_rate": 0.00010663082782361622, "loss": 2.4364, "step": 31857 }, { "epoch": 0.86, "learning_rate": 0.00010659172246084147, "loss": 2.8017, "step": 31858 }, { "epoch": 0.86, "learning_rate": 0.00010655262386636789, "loss": 2.4178, "step": 31859 }, { "epoch": 0.86, "learning_rate": 0.00010651353204049185, "loss": 2.4467, "step": 31860 }, { "epoch": 0.86, "learning_rate": 0.00010647444698350961, "loss": 2.436, "step": 31861 }, { "epoch": 0.86, "learning_rate": 0.00010643536869571723, "loss": 2.273, "step": 31862 }, { "epoch": 0.86, "learning_rate": 0.00010639629717741073, "loss": 2.3577, "step": 31863 }, { "epoch": 0.86, "learning_rate": 0.00010635723242888629, "loss": 2.3416, "step": 31864 }, { "epoch": 0.86, "learning_rate": 0.00010631817445043956, "loss": 2.714, "step": 31865 }, { "epoch": 0.86, "learning_rate": 0.00010627912324236666, "loss": 2.8134, "step": 31866 }, { "epoch": 0.86, "learning_rate": 0.00010624007880496322, "loss": 2.333, "step": 31867 }, { "epoch": 0.86, "learning_rate": 0.00010620104113852491, "loss": 2.6525, "step": 31868 }, { "epoch": 0.86, "learning_rate": 0.00010616201024334815, "loss": 2.3518, "step": 31869 }, { "epoch": 0.86, "learning_rate": 0.00010612298611972804, "loss": 2.5801, "step": 31870 }, { "epoch": 0.86, "learning_rate": 0.00010608396876796034, "loss": 2.3456, "step": 31871 }, { "epoch": 0.86, "learning_rate": 0.00010604495818834081, "loss": 2.8386, "step": 31872 }, { "epoch": 0.86, "learning_rate": 0.00010600595438116467, "loss": 2.5041, "step": 31873 }, { "epoch": 0.86, "learning_rate": 0.00010596695734672767, "loss": 2.4032, "step": 31874 }, { "epoch": 0.86, "learning_rate": 0.00010592796708532503, "loss": 2.5906, "step": 31875 }, { "epoch": 0.86, "learning_rate": 0.0001058889835972524, "loss": 2.2587, "step": 31876 }, { "epoch": 0.86, "learning_rate": 0.0001058500068828051, "loss": 2.5217, "step": 31877 }, { "epoch": 0.86, "learning_rate": 0.00010581103694227811, "loss": 2.4142, "step": 31878 }, { "epoch": 0.86, "learning_rate": 0.00010577207377596687, "loss": 2.263, "step": 31879 }, { "epoch": 0.86, "learning_rate": 0.00010573311738416669, "loss": 2.5312, "step": 31880 }, { "epoch": 0.86, "learning_rate": 0.00010569416776717211, "loss": 2.565, "step": 31881 }, { "epoch": 0.86, "learning_rate": 0.00010565522492527913, "loss": 2.2828, "step": 31882 }, { "epoch": 0.86, "learning_rate": 0.00010561628885878195, "loss": 2.2574, "step": 31883 }, { "epoch": 0.86, "learning_rate": 0.00010557735956797599, "loss": 2.0749, "step": 31884 }, { "epoch": 0.86, "learning_rate": 0.00010553843705315614, "loss": 2.6584, "step": 31885 }, { "epoch": 0.86, "learning_rate": 0.00010549952131461694, "loss": 2.7923, "step": 31886 }, { "epoch": 0.86, "learning_rate": 0.00010546061235265358, "loss": 2.5969, "step": 31887 }, { "epoch": 0.86, "learning_rate": 0.00010542171016756064, "loss": 2.5684, "step": 31888 }, { "epoch": 0.86, "learning_rate": 0.00010538281475963285, "loss": 2.3152, "step": 31889 }, { "epoch": 0.86, "learning_rate": 0.00010534392612916488, "loss": 2.6451, "step": 31890 }, { "epoch": 0.86, "learning_rate": 0.00010530504427645171, "loss": 2.6457, "step": 31891 }, { "epoch": 0.86, "learning_rate": 0.00010526616920178722, "loss": 2.5849, "step": 31892 }, { "epoch": 0.86, "learning_rate": 0.0001052273009054665, "loss": 2.6952, "step": 31893 }, { "epoch": 0.86, "learning_rate": 0.00010518843938778344, "loss": 2.5199, "step": 31894 }, { "epoch": 0.86, "learning_rate": 0.00010514958464903301, "loss": 2.8968, "step": 31895 }, { "epoch": 0.86, "learning_rate": 0.00010511073668950943, "loss": 2.3101, "step": 31896 }, { "epoch": 0.86, "learning_rate": 0.0001050718955095068, "loss": 2.6133, "step": 31897 }, { "epoch": 0.86, "learning_rate": 0.00010503306110931954, "loss": 2.4468, "step": 31898 }, { "epoch": 0.86, "learning_rate": 0.00010499423348924186, "loss": 2.2526, "step": 31899 }, { "epoch": 0.86, "learning_rate": 0.00010495541264956776, "loss": 2.2368, "step": 31900 }, { "epoch": 0.86, "learning_rate": 0.00010491659859059144, "loss": 2.568, "step": 31901 }, { "epoch": 0.86, "learning_rate": 0.00010487779131260689, "loss": 2.6259, "step": 31902 }, { "epoch": 0.86, "learning_rate": 0.0001048389908159082, "loss": 2.6135, "step": 31903 }, { "epoch": 0.86, "learning_rate": 0.00010480019710078948, "loss": 2.601, "step": 31904 }, { "epoch": 0.86, "learning_rate": 0.00010476141016754414, "loss": 2.5779, "step": 31905 }, { "epoch": 0.86, "learning_rate": 0.00010472263001646642, "loss": 2.1833, "step": 31906 }, { "epoch": 0.86, "learning_rate": 0.00010468385664784985, "loss": 2.476, "step": 31907 }, { "epoch": 0.86, "learning_rate": 0.00010464509006198841, "loss": 2.5293, "step": 31908 }, { "epoch": 0.86, "learning_rate": 0.00010460633025917588, "loss": 2.3071, "step": 31909 }, { "epoch": 0.86, "learning_rate": 0.00010456757723970556, "loss": 2.4149, "step": 31910 }, { "epoch": 0.86, "learning_rate": 0.00010452883100387112, "loss": 2.3845, "step": 31911 }, { "epoch": 0.86, "learning_rate": 0.00010449009155196643, "loss": 2.235, "step": 31912 }, { "epoch": 0.86, "learning_rate": 0.00010445135888428436, "loss": 2.4399, "step": 31913 }, { "epoch": 0.86, "learning_rate": 0.00010441263300111881, "loss": 2.3996, "step": 31914 }, { "epoch": 0.86, "learning_rate": 0.00010437391390276308, "loss": 2.1861, "step": 31915 }, { "epoch": 0.86, "learning_rate": 0.00010433520158951038, "loss": 2.2256, "step": 31916 }, { "epoch": 0.86, "learning_rate": 0.00010429649606165426, "loss": 2.7459, "step": 31917 }, { "epoch": 0.86, "learning_rate": 0.00010425779731948748, "loss": 2.6533, "step": 31918 }, { "epoch": 0.86, "learning_rate": 0.00010421910536330358, "loss": 2.2923, "step": 31919 }, { "epoch": 0.86, "learning_rate": 0.00010418042019339558, "loss": 3.1466, "step": 31920 }, { "epoch": 0.86, "learning_rate": 0.00010414174181005653, "loss": 2.4232, "step": 31921 }, { "epoch": 0.86, "learning_rate": 0.00010410307021357946, "loss": 3.1774, "step": 31922 }, { "epoch": 0.86, "learning_rate": 0.00010406440540425766, "loss": 1.8788, "step": 31923 }, { "epoch": 0.86, "learning_rate": 0.00010402574738238346, "loss": 2.7711, "step": 31924 }, { "epoch": 0.86, "learning_rate": 0.00010398709614825019, "loss": 2.2831, "step": 31925 }, { "epoch": 0.86, "learning_rate": 0.00010394845170215039, "loss": 2.3542, "step": 31926 }, { "epoch": 0.86, "learning_rate": 0.00010390981404437683, "loss": 2.4572, "step": 31927 }, { "epoch": 0.86, "learning_rate": 0.00010387118317522237, "loss": 2.6182, "step": 31928 }, { "epoch": 0.86, "learning_rate": 0.00010383255909497957, "loss": 2.4408, "step": 31929 }, { "epoch": 0.86, "learning_rate": 0.00010379394180394108, "loss": 2.2159, "step": 31930 }, { "epoch": 0.86, "learning_rate": 0.00010375533130239967, "loss": 2.6979, "step": 31931 }, { "epoch": 0.86, "learning_rate": 0.00010371672759064743, "loss": 2.5684, "step": 31932 }, { "epoch": 0.86, "learning_rate": 0.00010367813066897703, "loss": 2.4584, "step": 31933 }, { "epoch": 0.86, "learning_rate": 0.00010363954053768087, "loss": 2.2308, "step": 31934 }, { "epoch": 0.86, "learning_rate": 0.00010360095719705131, "loss": 2.5392, "step": 31935 }, { "epoch": 0.86, "learning_rate": 0.00010356238064738088, "loss": 2.3543, "step": 31936 }, { "epoch": 0.86, "learning_rate": 0.00010352381088896123, "loss": 2.11, "step": 31937 }, { "epoch": 0.86, "learning_rate": 0.00010348524792208502, "loss": 2.3167, "step": 31938 }, { "epoch": 0.86, "learning_rate": 0.00010344669174704457, "loss": 2.8235, "step": 31939 }, { "epoch": 0.86, "learning_rate": 0.00010340814236413132, "loss": 2.9043, "step": 31940 }, { "epoch": 0.86, "learning_rate": 0.00010336959977363758, "loss": 2.3011, "step": 31941 }, { "epoch": 0.86, "learning_rate": 0.0001033310639758559, "loss": 2.4341, "step": 31942 }, { "epoch": 0.86, "learning_rate": 0.00010329253497107749, "loss": 2.4749, "step": 31943 }, { "epoch": 0.86, "learning_rate": 0.00010325401275959478, "loss": 2.6583, "step": 31944 }, { "epoch": 0.86, "learning_rate": 0.00010321549734169911, "loss": 2.2396, "step": 31945 }, { "epoch": 0.86, "learning_rate": 0.00010317698871768244, "loss": 2.4561, "step": 31946 }, { "epoch": 0.86, "learning_rate": 0.00010313848688783666, "loss": 1.9819, "step": 31947 }, { "epoch": 0.86, "learning_rate": 0.00010309999185245333, "loss": 2.2867, "step": 31948 }, { "epoch": 0.86, "learning_rate": 0.00010306150361182409, "loss": 2.768, "step": 31949 }, { "epoch": 0.86, "learning_rate": 0.00010302302216624083, "loss": 2.3409, "step": 31950 }, { "epoch": 0.86, "learning_rate": 0.00010298454751599451, "loss": 2.1525, "step": 31951 }, { "epoch": 0.86, "learning_rate": 0.00010294607966137704, "loss": 2.3086, "step": 31952 }, { "epoch": 0.86, "learning_rate": 0.00010290761860267962, "loss": 2.3462, "step": 31953 }, { "epoch": 0.86, "learning_rate": 0.00010286916434019344, "loss": 2.7243, "step": 31954 }, { "epoch": 0.86, "learning_rate": 0.00010283071687421041, "loss": 2.5481, "step": 31955 }, { "epoch": 0.86, "learning_rate": 0.0001027922762050213, "loss": 2.0259, "step": 31956 }, { "epoch": 0.86, "learning_rate": 0.00010275384233291762, "loss": 2.54, "step": 31957 }, { "epoch": 0.86, "learning_rate": 0.0001027154152581905, "loss": 2.6765, "step": 31958 }, { "epoch": 0.86, "learning_rate": 0.00010267699498113082, "loss": 2.08, "step": 31959 }, { "epoch": 0.86, "learning_rate": 0.00010263858150202976, "loss": 2.5713, "step": 31960 }, { "epoch": 0.86, "learning_rate": 0.00010260017482117834, "loss": 2.6809, "step": 31961 }, { "epoch": 0.86, "learning_rate": 0.00010256177493886764, "loss": 2.1918, "step": 31962 }, { "epoch": 0.86, "learning_rate": 0.00010252338185538868, "loss": 2.3861, "step": 31963 }, { "epoch": 0.86, "learning_rate": 0.00010248499557103185, "loss": 2.4543, "step": 31964 }, { "epoch": 0.86, "learning_rate": 0.0001024466160860883, "loss": 2.3428, "step": 31965 }, { "epoch": 0.86, "learning_rate": 0.00010240824340084886, "loss": 1.9846, "step": 31966 }, { "epoch": 0.86, "learning_rate": 0.00010236987751560378, "loss": 2.226, "step": 31967 }, { "epoch": 0.86, "learning_rate": 0.00010233151843064414, "loss": 1.6795, "step": 31968 }, { "epoch": 0.86, "learning_rate": 0.00010229316614626072, "loss": 2.5032, "step": 31969 }, { "epoch": 0.86, "learning_rate": 0.00010225482066274349, "loss": 2.5131, "step": 31970 }, { "epoch": 0.86, "learning_rate": 0.00010221648198038347, "loss": 2.21, "step": 31971 }, { "epoch": 0.86, "learning_rate": 0.00010217815009947073, "loss": 2.0121, "step": 31972 }, { "epoch": 0.86, "learning_rate": 0.00010213982502029573, "loss": 2.8015, "step": 31973 }, { "epoch": 0.86, "learning_rate": 0.00010210150674314888, "loss": 2.3953, "step": 31974 }, { "epoch": 0.86, "learning_rate": 0.00010206319526832053, "loss": 2.0041, "step": 31975 }, { "epoch": 0.86, "learning_rate": 0.00010202489059610088, "loss": 2.6022, "step": 31976 }, { "epoch": 0.86, "learning_rate": 0.00010198659272678035, "loss": 2.431, "step": 31977 }, { "epoch": 0.86, "learning_rate": 0.00010194830166064862, "loss": 2.9167, "step": 31978 }, { "epoch": 0.86, "learning_rate": 0.00010191001739799611, "loss": 2.6384, "step": 31979 }, { "epoch": 0.86, "learning_rate": 0.00010187173993911248, "loss": 2.4838, "step": 31980 }, { "epoch": 0.86, "learning_rate": 0.00010183346928428805, "loss": 2.7892, "step": 31981 }, { "epoch": 0.86, "learning_rate": 0.00010179520543381293, "loss": 2.5974, "step": 31982 }, { "epoch": 0.86, "learning_rate": 0.00010175694838797656, "loss": 2.391, "step": 31983 }, { "epoch": 0.86, "learning_rate": 0.00010171869814706902, "loss": 2.7348, "step": 31984 }, { "epoch": 0.86, "learning_rate": 0.0001016804547113801, "loss": 2.2581, "step": 31985 }, { "epoch": 0.86, "learning_rate": 0.00010164221808119934, "loss": 2.2079, "step": 31986 }, { "epoch": 0.86, "learning_rate": 0.00010160398825681649, "loss": 2.137, "step": 31987 }, { "epoch": 0.86, "learning_rate": 0.00010156576523852124, "loss": 2.6602, "step": 31988 }, { "epoch": 0.86, "learning_rate": 0.0001015275490266031, "loss": 2.8111, "step": 31989 }, { "epoch": 0.86, "learning_rate": 0.00010148933962135188, "loss": 2.6047, "step": 31990 }, { "epoch": 0.86, "learning_rate": 0.00010145113702305653, "loss": 2.5037, "step": 31991 }, { "epoch": 0.86, "learning_rate": 0.00010141294123200673, "loss": 2.5126, "step": 31992 }, { "epoch": 0.86, "learning_rate": 0.00010137475224849179, "loss": 2.7262, "step": 31993 }, { "epoch": 0.86, "learning_rate": 0.00010133657007280106, "loss": 1.8998, "step": 31994 }, { "epoch": 0.86, "learning_rate": 0.00010129839470522406, "loss": 2.8741, "step": 31995 }, { "epoch": 0.86, "learning_rate": 0.00010126022614604958, "loss": 2.5368, "step": 31996 }, { "epoch": 0.86, "learning_rate": 0.00010122206439556691, "loss": 2.489, "step": 31997 }, { "epoch": 0.86, "learning_rate": 0.00010118390945406541, "loss": 2.607, "step": 31998 }, { "epoch": 0.86, "learning_rate": 0.00010114576132183361, "loss": 2.5047, "step": 31999 }, { "epoch": 0.86, "learning_rate": 0.00010110761999916096, "loss": 2.3443, "step": 32000 }, { "epoch": 0.86, "learning_rate": 0.00010106948548633621, "loss": 2.3182, "step": 32001 }, { "epoch": 0.86, "learning_rate": 0.00010103135778364836, "loss": 2.8, "step": 32002 }, { "epoch": 0.86, "learning_rate": 0.00010099323689138617, "loss": 2.3814, "step": 32003 }, { "epoch": 0.86, "learning_rate": 0.00010095512280983877, "loss": 2.3998, "step": 32004 }, { "epoch": 0.86, "learning_rate": 0.00010091701553929433, "loss": 2.3422, "step": 32005 }, { "epoch": 0.86, "learning_rate": 0.00010087891508004187, "loss": 2.6176, "step": 32006 }, { "epoch": 0.86, "learning_rate": 0.00010084082143237006, "loss": 2.5254, "step": 32007 }, { "epoch": 0.86, "learning_rate": 0.00010080273459656741, "loss": 3.2415, "step": 32008 }, { "epoch": 0.86, "learning_rate": 0.00010076465457292261, "loss": 2.2218, "step": 32009 }, { "epoch": 0.86, "learning_rate": 0.00010072658136172386, "loss": 2.9661, "step": 32010 }, { "epoch": 0.86, "learning_rate": 0.00010068851496325981, "loss": 2.1978, "step": 32011 }, { "epoch": 0.86, "learning_rate": 0.00010065045537781892, "loss": 2.307, "step": 32012 }, { "epoch": 0.86, "learning_rate": 0.00010061240260568927, "loss": 2.0758, "step": 32013 }, { "epoch": 0.86, "learning_rate": 0.0001005743566471592, "loss": 2.6567, "step": 32014 }, { "epoch": 0.86, "learning_rate": 0.00010053631750251702, "loss": 2.2939, "step": 32015 }, { "epoch": 0.86, "learning_rate": 0.00010049828517205084, "loss": 2.3386, "step": 32016 }, { "epoch": 0.86, "learning_rate": 0.0001004602596560491, "loss": 2.3492, "step": 32017 }, { "epoch": 0.86, "learning_rate": 0.00010042224095479935, "loss": 2.2877, "step": 32018 }, { "epoch": 0.86, "learning_rate": 0.00010038422906858991, "loss": 2.1522, "step": 32019 }, { "epoch": 0.86, "learning_rate": 0.00010034622399770876, "loss": 2.7029, "step": 32020 }, { "epoch": 0.86, "learning_rate": 0.00010030822574244369, "loss": 2.6033, "step": 32021 }, { "epoch": 0.86, "learning_rate": 0.0001002702343030829, "loss": 2.0527, "step": 32022 }, { "epoch": 0.86, "learning_rate": 0.00010023224967991373, "loss": 2.1174, "step": 32023 }, { "epoch": 0.86, "learning_rate": 0.00010019427187322417, "loss": 2.748, "step": 32024 }, { "epoch": 0.86, "learning_rate": 0.00010015630088330218, "loss": 2.7095, "step": 32025 }, { "epoch": 0.86, "learning_rate": 0.0001001183367104349, "loss": 2.1881, "step": 32026 }, { "epoch": 0.86, "learning_rate": 0.0001000803793549101, "loss": 2.3403, "step": 32027 }, { "epoch": 0.86, "learning_rate": 0.00010004242881701586, "loss": 2.3501, "step": 32028 }, { "epoch": 0.86, "learning_rate": 0.00010000448509703908, "loss": 2.4412, "step": 32029 }, { "epoch": 0.86, "learning_rate": 9.996654819526751e-05, "loss": 2.6385, "step": 32030 }, { "epoch": 0.86, "learning_rate": 9.992861811198839e-05, "loss": 2.8929, "step": 32031 }, { "epoch": 0.86, "learning_rate": 9.989069484748903e-05, "loss": 2.0074, "step": 32032 }, { "epoch": 0.86, "learning_rate": 9.985277840205698e-05, "loss": 2.7231, "step": 32033 }, { "epoch": 0.86, "learning_rate": 9.981486877597923e-05, "loss": 2.2786, "step": 32034 }, { "epoch": 0.86, "learning_rate": 9.977696596954311e-05, "loss": 2.6906, "step": 32035 }, { "epoch": 0.86, "learning_rate": 9.973906998303594e-05, "loss": 2.592, "step": 32036 }, { "epoch": 0.86, "learning_rate": 9.970118081674451e-05, "loss": 2.7246, "step": 32037 }, { "epoch": 0.86, "learning_rate": 9.966329847095612e-05, "loss": 2.4427, "step": 32038 }, { "epoch": 0.86, "learning_rate": 9.962542294595722e-05, "loss": 2.4333, "step": 32039 }, { "epoch": 0.86, "learning_rate": 9.958755424203536e-05, "loss": 2.472, "step": 32040 }, { "epoch": 0.86, "learning_rate": 9.954969235947741e-05, "loss": 2.6119, "step": 32041 }, { "epoch": 0.86, "learning_rate": 9.951183729856971e-05, "loss": 2.3165, "step": 32042 }, { "epoch": 0.86, "learning_rate": 9.947398905959948e-05, "loss": 2.5746, "step": 32043 }, { "epoch": 0.86, "learning_rate": 9.943614764285347e-05, "loss": 2.6946, "step": 32044 }, { "epoch": 0.86, "learning_rate": 9.939831304861791e-05, "loss": 1.9116, "step": 32045 }, { "epoch": 0.86, "learning_rate": 9.936048527717978e-05, "loss": 2.3199, "step": 32046 }, { "epoch": 0.86, "learning_rate": 9.932266432882564e-05, "loss": 2.5981, "step": 32047 }, { "epoch": 0.86, "learning_rate": 9.928485020384192e-05, "loss": 2.249, "step": 32048 }, { "epoch": 0.86, "learning_rate": 9.924704290251541e-05, "loss": 2.0871, "step": 32049 }, { "epoch": 0.86, "learning_rate": 9.920924242513196e-05, "loss": 2.8059, "step": 32050 }, { "epoch": 0.86, "learning_rate": 9.917144877197825e-05, "loss": 2.3539, "step": 32051 }, { "epoch": 0.86, "learning_rate": 9.913366194334061e-05, "loss": 2.5343, "step": 32052 }, { "epoch": 0.86, "learning_rate": 9.909588193950537e-05, "loss": 2.225, "step": 32053 }, { "epoch": 0.86, "learning_rate": 9.90581087607586e-05, "loss": 2.6114, "step": 32054 }, { "epoch": 0.86, "learning_rate": 9.902034240738666e-05, "loss": 2.4246, "step": 32055 }, { "epoch": 0.86, "learning_rate": 9.898258287967543e-05, "loss": 2.1125, "step": 32056 }, { "epoch": 0.86, "learning_rate": 9.894483017791123e-05, "loss": 2.4902, "step": 32057 }, { "epoch": 0.86, "learning_rate": 9.890708430237971e-05, "loss": 2.3145, "step": 32058 }, { "epoch": 0.86, "learning_rate": 9.8869345253367e-05, "loss": 2.7456, "step": 32059 }, { "epoch": 0.86, "learning_rate": 9.883161303115907e-05, "loss": 2.54, "step": 32060 }, { "epoch": 0.86, "learning_rate": 9.879388763604157e-05, "loss": 2.8947, "step": 32061 }, { "epoch": 0.86, "learning_rate": 9.875616906830065e-05, "loss": 2.5941, "step": 32062 }, { "epoch": 0.86, "learning_rate": 9.871845732822194e-05, "loss": 2.5254, "step": 32063 }, { "epoch": 0.86, "learning_rate": 9.868075241609098e-05, "loss": 2.5249, "step": 32064 }, { "epoch": 0.86, "learning_rate": 9.864305433219334e-05, "loss": 2.7788, "step": 32065 }, { "epoch": 0.86, "learning_rate": 9.860536307681489e-05, "loss": 2.9272, "step": 32066 }, { "epoch": 0.86, "learning_rate": 9.856767865024107e-05, "loss": 2.4933, "step": 32067 }, { "epoch": 0.86, "learning_rate": 9.853000105275744e-05, "loss": 2.6825, "step": 32068 }, { "epoch": 0.86, "learning_rate": 9.849233028464933e-05, "loss": 2.5211, "step": 32069 }, { "epoch": 0.86, "learning_rate": 9.845466634620204e-05, "loss": 2.4957, "step": 32070 }, { "epoch": 0.86, "learning_rate": 9.841700923770114e-05, "loss": 3.0954, "step": 32071 }, { "epoch": 0.86, "learning_rate": 9.837935895943173e-05, "loss": 2.777, "step": 32072 }, { "epoch": 0.86, "learning_rate": 9.834171551167903e-05, "loss": 2.5282, "step": 32073 }, { "epoch": 0.86, "learning_rate": 9.830407889472837e-05, "loss": 2.7755, "step": 32074 }, { "epoch": 0.86, "learning_rate": 9.826644910886473e-05, "loss": 2.602, "step": 32075 }, { "epoch": 0.86, "learning_rate": 9.822882615437345e-05, "loss": 2.3763, "step": 32076 }, { "epoch": 0.86, "learning_rate": 9.81912100315392e-05, "loss": 2.561, "step": 32077 }, { "epoch": 0.86, "learning_rate": 9.815360074064705e-05, "loss": 2.1759, "step": 32078 }, { "epoch": 0.86, "learning_rate": 9.811599828198203e-05, "loss": 2.1582, "step": 32079 }, { "epoch": 0.86, "learning_rate": 9.80784026558289e-05, "loss": 2.221, "step": 32080 }, { "epoch": 0.86, "learning_rate": 9.804081386247266e-05, "loss": 2.2271, "step": 32081 }, { "epoch": 0.86, "learning_rate": 9.800323190219806e-05, "loss": 2.0287, "step": 32082 }, { "epoch": 0.86, "learning_rate": 9.796565677528956e-05, "loss": 2.6026, "step": 32083 }, { "epoch": 0.86, "learning_rate": 9.792808848203217e-05, "loss": 2.3805, "step": 32084 }, { "epoch": 0.86, "learning_rate": 9.789052702271017e-05, "loss": 2.7676, "step": 32085 }, { "epoch": 0.86, "learning_rate": 9.785297239760793e-05, "loss": 2.672, "step": 32086 }, { "epoch": 0.86, "learning_rate": 9.781542460701076e-05, "loss": 1.9716, "step": 32087 }, { "epoch": 0.86, "learning_rate": 9.777788365120243e-05, "loss": 2.5225, "step": 32088 }, { "epoch": 0.86, "learning_rate": 9.774034953046762e-05, "loss": 2.4471, "step": 32089 }, { "epoch": 0.86, "learning_rate": 9.770282224509064e-05, "loss": 2.7577, "step": 32090 }, { "epoch": 0.86, "learning_rate": 9.766530179535571e-05, "loss": 2.2263, "step": 32091 }, { "epoch": 0.86, "learning_rate": 9.762778818154705e-05, "loss": 2.0503, "step": 32092 }, { "epoch": 0.86, "learning_rate": 9.759028140394899e-05, "loss": 2.9771, "step": 32093 }, { "epoch": 0.86, "learning_rate": 9.755278146284564e-05, "loss": 2.4613, "step": 32094 }, { "epoch": 0.86, "learning_rate": 9.751528835852119e-05, "loss": 2.4588, "step": 32095 }, { "epoch": 0.86, "learning_rate": 9.747780209125945e-05, "loss": 2.3599, "step": 32096 }, { "epoch": 0.86, "learning_rate": 9.74403226613445e-05, "loss": 1.9724, "step": 32097 }, { "epoch": 0.86, "learning_rate": 9.740285006906047e-05, "loss": 2.4247, "step": 32098 }, { "epoch": 0.86, "learning_rate": 9.736538431469067e-05, "loss": 2.2564, "step": 32099 }, { "epoch": 0.86, "learning_rate": 9.732792539851976e-05, "loss": 2.2501, "step": 32100 }, { "epoch": 0.86, "learning_rate": 9.729047332083096e-05, "loss": 2.5511, "step": 32101 }, { "epoch": 0.86, "learning_rate": 9.725302808190816e-05, "loss": 2.3511, "step": 32102 }, { "epoch": 0.86, "learning_rate": 9.721558968203515e-05, "loss": 2.3787, "step": 32103 }, { "epoch": 0.86, "learning_rate": 9.717815812149522e-05, "loss": 2.3911, "step": 32104 }, { "epoch": 0.86, "learning_rate": 9.714073340057217e-05, "loss": 2.2195, "step": 32105 }, { "epoch": 0.86, "learning_rate": 9.710331551954954e-05, "loss": 2.2056, "step": 32106 }, { "epoch": 0.86, "learning_rate": 9.706590447871078e-05, "loss": 2.7039, "step": 32107 }, { "epoch": 0.86, "learning_rate": 9.702850027833943e-05, "loss": 2.468, "step": 32108 }, { "epoch": 0.86, "learning_rate": 9.69911029187186e-05, "loss": 2.5179, "step": 32109 }, { "epoch": 0.86, "learning_rate": 9.695371240013162e-05, "loss": 2.4648, "step": 32110 }, { "epoch": 0.86, "learning_rate": 9.691632872286215e-05, "loss": 2.5432, "step": 32111 }, { "epoch": 0.86, "learning_rate": 9.687895188719276e-05, "loss": 2.6512, "step": 32112 }, { "epoch": 0.86, "learning_rate": 9.684158189340708e-05, "loss": 2.0896, "step": 32113 }, { "epoch": 0.86, "learning_rate": 9.680421874178836e-05, "loss": 2.4466, "step": 32114 }, { "epoch": 0.86, "learning_rate": 9.676686243261912e-05, "loss": 2.9835, "step": 32115 }, { "epoch": 0.86, "learning_rate": 9.67295129661827e-05, "loss": 2.1211, "step": 32116 }, { "epoch": 0.86, "learning_rate": 9.669217034276224e-05, "loss": 2.4139, "step": 32117 }, { "epoch": 0.86, "learning_rate": 9.665483456264024e-05, "loss": 2.7864, "step": 32118 }, { "epoch": 0.86, "learning_rate": 9.661750562609961e-05, "loss": 2.5416, "step": 32119 }, { "epoch": 0.86, "learning_rate": 9.658018353342324e-05, "loss": 2.3715, "step": 32120 }, { "epoch": 0.86, "learning_rate": 9.65428682848939e-05, "loss": 2.5093, "step": 32121 }, { "epoch": 0.86, "learning_rate": 9.650555988079457e-05, "loss": 2.4148, "step": 32122 }, { "epoch": 0.86, "learning_rate": 9.646825832140726e-05, "loss": 2.3678, "step": 32123 }, { "epoch": 0.86, "learning_rate": 9.643096360701498e-05, "loss": 2.508, "step": 32124 }, { "epoch": 0.86, "learning_rate": 9.639367573790015e-05, "loss": 2.2892, "step": 32125 }, { "epoch": 0.86, "learning_rate": 9.63563947143452e-05, "loss": 2.4999, "step": 32126 }, { "epoch": 0.86, "learning_rate": 9.631912053663295e-05, "loss": 2.2012, "step": 32127 }, { "epoch": 0.86, "learning_rate": 9.628185320504524e-05, "loss": 2.4255, "step": 32128 }, { "epoch": 0.86, "learning_rate": 9.624459271986463e-05, "loss": 2.5959, "step": 32129 }, { "epoch": 0.86, "learning_rate": 9.620733908137358e-05, "loss": 2.7729, "step": 32130 }, { "epoch": 0.86, "learning_rate": 9.617009228985407e-05, "loss": 2.3538, "step": 32131 }, { "epoch": 0.86, "learning_rate": 9.613285234558821e-05, "loss": 2.9215, "step": 32132 }, { "epoch": 0.86, "learning_rate": 9.609561924885835e-05, "loss": 2.2008, "step": 32133 }, { "epoch": 0.86, "learning_rate": 9.605839299994645e-05, "loss": 2.4759, "step": 32134 }, { "epoch": 0.86, "learning_rate": 9.602117359913476e-05, "loss": 2.4687, "step": 32135 }, { "epoch": 0.86, "learning_rate": 9.598396104670482e-05, "loss": 2.121, "step": 32136 }, { "epoch": 0.86, "learning_rate": 9.594675534293873e-05, "loss": 2.6081, "step": 32137 }, { "epoch": 0.86, "learning_rate": 9.59095564881185e-05, "loss": 2.6097, "step": 32138 }, { "epoch": 0.86, "learning_rate": 9.587236448252579e-05, "loss": 2.2924, "step": 32139 }, { "epoch": 0.86, "learning_rate": 9.583517932644237e-05, "loss": 2.6119, "step": 32140 }, { "epoch": 0.86, "learning_rate": 9.579800102015024e-05, "loss": 2.0806, "step": 32141 }, { "epoch": 0.86, "learning_rate": 9.57608295639305e-05, "loss": 2.4521, "step": 32142 }, { "epoch": 0.86, "learning_rate": 9.57236649580654e-05, "loss": 2.3002, "step": 32143 }, { "epoch": 0.86, "learning_rate": 9.568650720283578e-05, "loss": 2.6749, "step": 32144 }, { "epoch": 0.86, "learning_rate": 9.564935629852368e-05, "loss": 2.3366, "step": 32145 }, { "epoch": 0.86, "learning_rate": 9.561221224541029e-05, "loss": 2.382, "step": 32146 }, { "epoch": 0.86, "learning_rate": 9.557507504377705e-05, "loss": 2.1155, "step": 32147 }, { "epoch": 0.86, "learning_rate": 9.553794469390531e-05, "loss": 2.6373, "step": 32148 }, { "epoch": 0.86, "learning_rate": 9.550082119607673e-05, "loss": 2.4248, "step": 32149 }, { "epoch": 0.86, "learning_rate": 9.546370455057197e-05, "loss": 3.1239, "step": 32150 }, { "epoch": 0.86, "learning_rate": 9.542659475767246e-05, "loss": 2.8491, "step": 32151 }, { "epoch": 0.86, "learning_rate": 9.538949181765933e-05, "loss": 2.2941, "step": 32152 }, { "epoch": 0.86, "learning_rate": 9.535239573081367e-05, "loss": 3.0111, "step": 32153 }, { "epoch": 0.86, "learning_rate": 9.531530649741671e-05, "loss": 2.3164, "step": 32154 }, { "epoch": 0.86, "learning_rate": 9.527822411774912e-05, "loss": 2.3554, "step": 32155 }, { "epoch": 0.86, "learning_rate": 9.524114859209187e-05, "loss": 2.6105, "step": 32156 }, { "epoch": 0.86, "learning_rate": 9.520407992072621e-05, "loss": 2.9243, "step": 32157 }, { "epoch": 0.86, "learning_rate": 9.516701810393246e-05, "loss": 2.7322, "step": 32158 }, { "epoch": 0.86, "learning_rate": 9.51299631419914e-05, "loss": 2.3517, "step": 32159 }, { "epoch": 0.86, "learning_rate": 9.509291503518425e-05, "loss": 2.6405, "step": 32160 }, { "epoch": 0.86, "learning_rate": 9.505587378379132e-05, "loss": 2.545, "step": 32161 }, { "epoch": 0.86, "learning_rate": 9.501883938809353e-05, "loss": 2.5091, "step": 32162 }, { "epoch": 0.86, "learning_rate": 9.498181184837096e-05, "loss": 2.1141, "step": 32163 }, { "epoch": 0.86, "learning_rate": 9.49447911649044e-05, "loss": 3.3166, "step": 32164 }, { "epoch": 0.86, "learning_rate": 9.49077773379743e-05, "loss": 2.2826, "step": 32165 }, { "epoch": 0.86, "learning_rate": 9.487077036786097e-05, "loss": 2.6662, "step": 32166 }, { "epoch": 0.86, "learning_rate": 9.483377025484496e-05, "loss": 2.2169, "step": 32167 }, { "epoch": 0.86, "learning_rate": 9.479677699920664e-05, "loss": 2.4788, "step": 32168 }, { "epoch": 0.86, "learning_rate": 9.475979060122586e-05, "loss": 2.5328, "step": 32169 }, { "epoch": 0.86, "learning_rate": 9.47228110611833e-05, "loss": 2.9418, "step": 32170 }, { "epoch": 0.86, "learning_rate": 9.468583837935874e-05, "loss": 3.0595, "step": 32171 }, { "epoch": 0.86, "learning_rate": 9.464887255603217e-05, "loss": 2.6548, "step": 32172 }, { "epoch": 0.86, "learning_rate": 9.461191359148425e-05, "loss": 2.362, "step": 32173 }, { "epoch": 0.86, "learning_rate": 9.457496148599443e-05, "loss": 2.4636, "step": 32174 }, { "epoch": 0.86, "learning_rate": 9.453801623984281e-05, "loss": 2.7967, "step": 32175 }, { "epoch": 0.86, "learning_rate": 9.450107785330953e-05, "loss": 2.9897, "step": 32176 }, { "epoch": 0.86, "learning_rate": 9.4464146326674e-05, "loss": 2.3719, "step": 32177 }, { "epoch": 0.86, "learning_rate": 9.442722166021622e-05, "loss": 2.4733, "step": 32178 }, { "epoch": 0.86, "learning_rate": 9.439030385421587e-05, "loss": 2.2598, "step": 32179 }, { "epoch": 0.86, "learning_rate": 9.435339290895262e-05, "loss": 2.5851, "step": 32180 }, { "epoch": 0.86, "learning_rate": 9.431648882470644e-05, "loss": 2.4804, "step": 32181 }, { "epoch": 0.86, "learning_rate": 9.427959160175636e-05, "loss": 2.109, "step": 32182 }, { "epoch": 0.86, "learning_rate": 9.424270124038226e-05, "loss": 2.6429, "step": 32183 }, { "epoch": 0.86, "learning_rate": 9.420581774086356e-05, "loss": 2.3366, "step": 32184 }, { "epoch": 0.86, "learning_rate": 9.41689411034794e-05, "loss": 2.1905, "step": 32185 }, { "epoch": 0.86, "learning_rate": 9.413207132850965e-05, "loss": 2.6262, "step": 32186 }, { "epoch": 0.86, "learning_rate": 9.409520841623331e-05, "loss": 2.5437, "step": 32187 }, { "epoch": 0.87, "learning_rate": 9.40583523669296e-05, "loss": 2.409, "step": 32188 }, { "epoch": 0.87, "learning_rate": 9.40215031808781e-05, "loss": 2.4633, "step": 32189 }, { "epoch": 0.87, "learning_rate": 9.398466085835755e-05, "loss": 2.5896, "step": 32190 }, { "epoch": 0.87, "learning_rate": 9.394782539964719e-05, "loss": 2.1461, "step": 32191 }, { "epoch": 0.87, "learning_rate": 9.391099680502612e-05, "loss": 2.4987, "step": 32192 }, { "epoch": 0.87, "learning_rate": 9.387417507477337e-05, "loss": 2.0263, "step": 32193 }, { "epoch": 0.87, "learning_rate": 9.383736020916789e-05, "loss": 2.5263, "step": 32194 }, { "epoch": 0.87, "learning_rate": 9.380055220848871e-05, "loss": 2.5995, "step": 32195 }, { "epoch": 0.87, "learning_rate": 9.376375107301426e-05, "loss": 2.6957, "step": 32196 }, { "epoch": 0.87, "learning_rate": 9.37269568030239e-05, "loss": 2.5421, "step": 32197 }, { "epoch": 0.87, "learning_rate": 9.369016939879571e-05, "loss": 2.4355, "step": 32198 }, { "epoch": 0.87, "learning_rate": 9.365338886060892e-05, "loss": 2.3421, "step": 32199 }, { "epoch": 0.87, "learning_rate": 9.361661518874232e-05, "loss": 2.5303, "step": 32200 }, { "epoch": 0.87, "learning_rate": 9.357984838347388e-05, "loss": 2.5951, "step": 32201 }, { "epoch": 0.87, "learning_rate": 9.354308844508242e-05, "loss": 2.3069, "step": 32202 }, { "epoch": 0.87, "learning_rate": 9.350633537384679e-05, "loss": 2.3286, "step": 32203 }, { "epoch": 0.87, "learning_rate": 9.346958917004478e-05, "loss": 1.9593, "step": 32204 }, { "epoch": 0.87, "learning_rate": 9.343284983395517e-05, "loss": 2.6239, "step": 32205 }, { "epoch": 0.87, "learning_rate": 9.339611736585618e-05, "loss": 3.0211, "step": 32206 }, { "epoch": 0.87, "learning_rate": 9.335939176602615e-05, "loss": 2.9569, "step": 32207 }, { "epoch": 0.87, "learning_rate": 9.33226730347434e-05, "loss": 2.7105, "step": 32208 }, { "epoch": 0.87, "learning_rate": 9.328596117228583e-05, "loss": 2.0809, "step": 32209 }, { "epoch": 0.87, "learning_rate": 9.324925617893176e-05, "loss": 2.447, "step": 32210 }, { "epoch": 0.87, "learning_rate": 9.32125580549592e-05, "loss": 2.7125, "step": 32211 }, { "epoch": 0.87, "learning_rate": 9.317586680064615e-05, "loss": 2.8942, "step": 32212 }, { "epoch": 0.87, "learning_rate": 9.313918241627073e-05, "loss": 2.3817, "step": 32213 }, { "epoch": 0.87, "learning_rate": 9.31025049021107e-05, "loss": 2.4215, "step": 32214 }, { "epoch": 0.87, "learning_rate": 9.306583425844384e-05, "loss": 2.309, "step": 32215 }, { "epoch": 0.87, "learning_rate": 9.302917048554827e-05, "loss": 2.4937, "step": 32216 }, { "epoch": 0.87, "learning_rate": 9.299251358370143e-05, "loss": 2.5227, "step": 32217 }, { "epoch": 0.87, "learning_rate": 9.295586355318086e-05, "loss": 2.0491, "step": 32218 }, { "epoch": 0.87, "learning_rate": 9.291922039426493e-05, "loss": 2.4541, "step": 32219 }, { "epoch": 0.87, "learning_rate": 9.288258410723072e-05, "loss": 2.5044, "step": 32220 }, { "epoch": 0.87, "learning_rate": 9.28459546923559e-05, "loss": 2.6062, "step": 32221 }, { "epoch": 0.87, "learning_rate": 9.280933214991783e-05, "loss": 2.6126, "step": 32222 }, { "epoch": 0.87, "learning_rate": 9.277271648019414e-05, "loss": 2.3872, "step": 32223 }, { "epoch": 0.87, "learning_rate": 9.273610768346208e-05, "loss": 2.6519, "step": 32224 }, { "epoch": 0.87, "learning_rate": 9.269950575999908e-05, "loss": 2.6743, "step": 32225 }, { "epoch": 0.87, "learning_rate": 9.266291071008237e-05, "loss": 2.6729, "step": 32226 }, { "epoch": 0.87, "learning_rate": 9.262632253398939e-05, "loss": 2.5804, "step": 32227 }, { "epoch": 0.87, "learning_rate": 9.258974123199714e-05, "loss": 2.2089, "step": 32228 }, { "epoch": 0.87, "learning_rate": 9.255316680438264e-05, "loss": 2.6018, "step": 32229 }, { "epoch": 0.87, "learning_rate": 9.251659925142331e-05, "loss": 2.1845, "step": 32230 }, { "epoch": 0.87, "learning_rate": 9.248003857339571e-05, "loss": 2.1819, "step": 32231 }, { "epoch": 0.87, "learning_rate": 9.244348477057741e-05, "loss": 2.3507, "step": 32232 }, { "epoch": 0.87, "learning_rate": 9.240693784324472e-05, "loss": 2.4016, "step": 32233 }, { "epoch": 0.87, "learning_rate": 9.237039779167488e-05, "loss": 2.4952, "step": 32234 }, { "epoch": 0.87, "learning_rate": 9.23338646161449e-05, "loss": 2.0328, "step": 32235 }, { "epoch": 0.87, "learning_rate": 9.229733831693099e-05, "loss": 2.1078, "step": 32236 }, { "epoch": 0.87, "learning_rate": 9.226081889431026e-05, "loss": 2.2555, "step": 32237 }, { "epoch": 0.87, "learning_rate": 9.222430634855928e-05, "loss": 2.5572, "step": 32238 }, { "epoch": 0.87, "learning_rate": 9.218780067995458e-05, "loss": 2.2277, "step": 32239 }, { "epoch": 0.87, "learning_rate": 9.215130188877296e-05, "loss": 2.6402, "step": 32240 }, { "epoch": 0.87, "learning_rate": 9.211480997529065e-05, "loss": 2.6626, "step": 32241 }, { "epoch": 0.87, "learning_rate": 9.207832493978418e-05, "loss": 2.3292, "step": 32242 }, { "epoch": 0.87, "learning_rate": 9.204184678253025e-05, "loss": 2.7952, "step": 32243 }, { "epoch": 0.87, "learning_rate": 9.200537550380462e-05, "loss": 2.3712, "step": 32244 }, { "epoch": 0.87, "learning_rate": 9.196891110388405e-05, "loss": 2.9512, "step": 32245 }, { "epoch": 0.87, "learning_rate": 9.193245358304481e-05, "loss": 2.7877, "step": 32246 }, { "epoch": 0.87, "learning_rate": 9.189600294156286e-05, "loss": 2.3831, "step": 32247 }, { "epoch": 0.87, "learning_rate": 9.185955917971455e-05, "loss": 2.7746, "step": 32248 }, { "epoch": 0.87, "learning_rate": 9.182312229777567e-05, "loss": 2.6943, "step": 32249 }, { "epoch": 0.87, "learning_rate": 9.178669229602254e-05, "loss": 2.8285, "step": 32250 }, { "epoch": 0.87, "learning_rate": 9.175026917473095e-05, "loss": 2.3932, "step": 32251 }, { "epoch": 0.87, "learning_rate": 9.1713852934177e-05, "loss": 2.2354, "step": 32252 }, { "epoch": 0.87, "learning_rate": 9.167744357463659e-05, "loss": 2.4234, "step": 32253 }, { "epoch": 0.87, "learning_rate": 9.164104109638549e-05, "loss": 2.2558, "step": 32254 }, { "epoch": 0.87, "learning_rate": 9.160464549969939e-05, "loss": 2.6657, "step": 32255 }, { "epoch": 0.87, "learning_rate": 9.156825678485426e-05, "loss": 2.4644, "step": 32256 }, { "epoch": 0.87, "learning_rate": 9.153187495212523e-05, "loss": 2.4952, "step": 32257 }, { "epoch": 0.87, "learning_rate": 9.149550000178842e-05, "loss": 2.427, "step": 32258 }, { "epoch": 0.87, "learning_rate": 9.145913193411959e-05, "loss": 2.3479, "step": 32259 }, { "epoch": 0.87, "learning_rate": 9.142277074939365e-05, "loss": 2.8165, "step": 32260 }, { "epoch": 0.87, "learning_rate": 9.138641644788637e-05, "loss": 2.8698, "step": 32261 }, { "epoch": 0.87, "learning_rate": 9.135006902987342e-05, "loss": 2.3462, "step": 32262 }, { "epoch": 0.87, "learning_rate": 9.131372849562958e-05, "loss": 2.2664, "step": 32263 }, { "epoch": 0.87, "learning_rate": 9.127739484543063e-05, "loss": 2.6393, "step": 32264 }, { "epoch": 0.87, "learning_rate": 9.124106807955157e-05, "loss": 2.8007, "step": 32265 }, { "epoch": 0.87, "learning_rate": 9.120474819826774e-05, "loss": 2.8114, "step": 32266 }, { "epoch": 0.87, "learning_rate": 9.116843520185436e-05, "loss": 2.8375, "step": 32267 }, { "epoch": 0.87, "learning_rate": 9.113212909058632e-05, "loss": 2.6034, "step": 32268 }, { "epoch": 0.87, "learning_rate": 9.109582986473885e-05, "loss": 2.5419, "step": 32269 }, { "epoch": 0.87, "learning_rate": 9.105953752458685e-05, "loss": 2.4888, "step": 32270 }, { "epoch": 0.87, "learning_rate": 9.102325207040518e-05, "loss": 2.5777, "step": 32271 }, { "epoch": 0.87, "learning_rate": 9.098697350246888e-05, "loss": 2.2722, "step": 32272 }, { "epoch": 0.87, "learning_rate": 9.095070182105303e-05, "loss": 2.3317, "step": 32273 }, { "epoch": 0.87, "learning_rate": 9.091443702643188e-05, "loss": 2.4937, "step": 32274 }, { "epoch": 0.87, "learning_rate": 9.087817911888064e-05, "loss": 2.7674, "step": 32275 }, { "epoch": 0.87, "learning_rate": 9.084192809867354e-05, "loss": 2.4358, "step": 32276 }, { "epoch": 0.87, "learning_rate": 9.080568396608546e-05, "loss": 2.7518, "step": 32277 }, { "epoch": 0.87, "learning_rate": 9.076944672139098e-05, "loss": 2.276, "step": 32278 }, { "epoch": 0.87, "learning_rate": 9.073321636486465e-05, "loss": 2.298, "step": 32279 }, { "epoch": 0.87, "learning_rate": 9.069699289678091e-05, "loss": 2.2523, "step": 32280 }, { "epoch": 0.87, "learning_rate": 9.066077631741431e-05, "loss": 2.5971, "step": 32281 }, { "epoch": 0.87, "learning_rate": 9.0624566627039e-05, "loss": 2.3495, "step": 32282 }, { "epoch": 0.87, "learning_rate": 9.058836382592939e-05, "loss": 2.4591, "step": 32283 }, { "epoch": 0.87, "learning_rate": 9.055216791435971e-05, "loss": 2.3321, "step": 32284 }, { "epoch": 0.87, "learning_rate": 9.05159788926042e-05, "loss": 2.7129, "step": 32285 }, { "epoch": 0.87, "learning_rate": 9.04797967609372e-05, "loss": 2.5968, "step": 32286 }, { "epoch": 0.87, "learning_rate": 9.044362151963247e-05, "loss": 2.5912, "step": 32287 }, { "epoch": 0.87, "learning_rate": 9.040745316896426e-05, "loss": 2.7904, "step": 32288 }, { "epoch": 0.87, "learning_rate": 9.037129170920678e-05, "loss": 2.4063, "step": 32289 }, { "epoch": 0.87, "learning_rate": 9.033513714063357e-05, "loss": 2.3764, "step": 32290 }, { "epoch": 0.87, "learning_rate": 9.029898946351867e-05, "loss": 2.0646, "step": 32291 }, { "epoch": 0.87, "learning_rate": 9.026284867813605e-05, "loss": 2.554, "step": 32292 }, { "epoch": 0.87, "learning_rate": 9.022671478475942e-05, "loss": 2.5084, "step": 32293 }, { "epoch": 0.87, "learning_rate": 9.019058778366274e-05, "loss": 2.6286, "step": 32294 }, { "epoch": 0.87, "learning_rate": 9.015446767511937e-05, "loss": 2.6997, "step": 32295 }, { "epoch": 0.87, "learning_rate": 9.011835445940308e-05, "loss": 2.8414, "step": 32296 }, { "epoch": 0.87, "learning_rate": 9.008224813678745e-05, "loss": 2.4432, "step": 32297 }, { "epoch": 0.87, "learning_rate": 9.004614870754591e-05, "loss": 2.2077, "step": 32298 }, { "epoch": 0.87, "learning_rate": 9.001005617195234e-05, "loss": 2.5444, "step": 32299 }, { "epoch": 0.87, "learning_rate": 8.997397053027979e-05, "loss": 2.0798, "step": 32300 }, { "epoch": 0.87, "learning_rate": 8.993789178280165e-05, "loss": 2.2924, "step": 32301 }, { "epoch": 0.87, "learning_rate": 8.990181992979152e-05, "loss": 2.4164, "step": 32302 }, { "epoch": 0.87, "learning_rate": 8.986575497152239e-05, "loss": 2.7101, "step": 32303 }, { "epoch": 0.87, "learning_rate": 8.982969690826726e-05, "loss": 2.5841, "step": 32304 }, { "epoch": 0.87, "learning_rate": 8.979364574030014e-05, "loss": 2.7509, "step": 32305 }, { "epoch": 0.87, "learning_rate": 8.975760146789336e-05, "loss": 2.5002, "step": 32306 }, { "epoch": 0.87, "learning_rate": 8.972156409132026e-05, "loss": 1.7256, "step": 32307 }, { "epoch": 0.87, "learning_rate": 8.968553361085397e-05, "loss": 2.1859, "step": 32308 }, { "epoch": 0.87, "learning_rate": 8.964951002676725e-05, "loss": 2.4457, "step": 32309 }, { "epoch": 0.87, "learning_rate": 8.961349333933311e-05, "loss": 2.7762, "step": 32310 }, { "epoch": 0.87, "learning_rate": 8.957748354882422e-05, "loss": 2.1012, "step": 32311 }, { "epoch": 0.87, "learning_rate": 8.954148065551371e-05, "loss": 2.835, "step": 32312 }, { "epoch": 0.87, "learning_rate": 8.950548465967423e-05, "loss": 2.7314, "step": 32313 }, { "epoch": 0.87, "learning_rate": 8.946949556157835e-05, "loss": 2.2859, "step": 32314 }, { "epoch": 0.87, "learning_rate": 8.943351336149875e-05, "loss": 2.5787, "step": 32315 }, { "epoch": 0.87, "learning_rate": 8.939753805970818e-05, "loss": 2.3404, "step": 32316 }, { "epoch": 0.87, "learning_rate": 8.93615696564788e-05, "loss": 2.4833, "step": 32317 }, { "epoch": 0.87, "learning_rate": 8.932560815208357e-05, "loss": 2.1808, "step": 32318 }, { "epoch": 0.87, "learning_rate": 8.928965354679464e-05, "loss": 2.7147, "step": 32319 }, { "epoch": 0.87, "learning_rate": 8.925370584088454e-05, "loss": 2.2814, "step": 32320 }, { "epoch": 0.87, "learning_rate": 8.921776503462564e-05, "loss": 2.3769, "step": 32321 }, { "epoch": 0.87, "learning_rate": 8.918183112828993e-05, "loss": 2.5646, "step": 32322 }, { "epoch": 0.87, "learning_rate": 8.914590412214984e-05, "loss": 2.4304, "step": 32323 }, { "epoch": 0.87, "learning_rate": 8.910998401647752e-05, "loss": 2.6443, "step": 32324 }, { "epoch": 0.87, "learning_rate": 8.907407081154517e-05, "loss": 2.3123, "step": 32325 }, { "epoch": 0.87, "learning_rate": 8.903816450762491e-05, "loss": 2.5651, "step": 32326 }, { "epoch": 0.87, "learning_rate": 8.900226510498843e-05, "loss": 2.4227, "step": 32327 }, { "epoch": 0.87, "learning_rate": 8.896637260390806e-05, "loss": 1.9736, "step": 32328 }, { "epoch": 0.87, "learning_rate": 8.893048700465567e-05, "loss": 2.3983, "step": 32329 }, { "epoch": 0.87, "learning_rate": 8.889460830750262e-05, "loss": 2.5886, "step": 32330 }, { "epoch": 0.87, "learning_rate": 8.885873651272136e-05, "loss": 2.4107, "step": 32331 }, { "epoch": 0.87, "learning_rate": 8.882287162058366e-05, "loss": 2.6225, "step": 32332 }, { "epoch": 0.87, "learning_rate": 8.878701363136077e-05, "loss": 2.5117, "step": 32333 }, { "epoch": 0.87, "learning_rate": 8.875116254532467e-05, "loss": 2.5089, "step": 32334 }, { "epoch": 0.87, "learning_rate": 8.871531836274671e-05, "loss": 2.504, "step": 32335 }, { "epoch": 0.87, "learning_rate": 8.867948108389856e-05, "loss": 2.3515, "step": 32336 }, { "epoch": 0.87, "learning_rate": 8.864365070905178e-05, "loss": 2.5847, "step": 32337 }, { "epoch": 0.87, "learning_rate": 8.860782723847771e-05, "loss": 2.5858, "step": 32338 }, { "epoch": 0.87, "learning_rate": 8.85720106724478e-05, "loss": 2.7133, "step": 32339 }, { "epoch": 0.87, "learning_rate": 8.853620101123361e-05, "loss": 2.4767, "step": 32340 }, { "epoch": 0.87, "learning_rate": 8.850039825510592e-05, "loss": 2.3436, "step": 32341 }, { "epoch": 0.87, "learning_rate": 8.84646024043364e-05, "loss": 2.1104, "step": 32342 }, { "epoch": 0.87, "learning_rate": 8.842881345919596e-05, "loss": 2.4497, "step": 32343 }, { "epoch": 0.87, "learning_rate": 8.839303141995592e-05, "loss": 1.7332, "step": 32344 }, { "epoch": 0.87, "learning_rate": 8.835725628688751e-05, "loss": 2.5693, "step": 32345 }, { "epoch": 0.87, "learning_rate": 8.83214880602613e-05, "loss": 2.4005, "step": 32346 }, { "epoch": 0.87, "learning_rate": 8.828572674034851e-05, "loss": 2.3272, "step": 32347 }, { "epoch": 0.87, "learning_rate": 8.824997232742027e-05, "loss": 2.7428, "step": 32348 }, { "epoch": 0.87, "learning_rate": 8.821422482174701e-05, "loss": 2.1795, "step": 32349 }, { "epoch": 0.87, "learning_rate": 8.817848422359986e-05, "loss": 2.684, "step": 32350 }, { "epoch": 0.87, "learning_rate": 8.814275053324938e-05, "loss": 2.854, "step": 32351 }, { "epoch": 0.87, "learning_rate": 8.810702375096646e-05, "loss": 2.4749, "step": 32352 }, { "epoch": 0.87, "learning_rate": 8.80713038770219e-05, "loss": 2.2213, "step": 32353 }, { "epoch": 0.87, "learning_rate": 8.803559091168579e-05, "loss": 2.3065, "step": 32354 }, { "epoch": 0.87, "learning_rate": 8.799988485522914e-05, "loss": 2.6029, "step": 32355 }, { "epoch": 0.87, "learning_rate": 8.79641857079223e-05, "loss": 2.8176, "step": 32356 }, { "epoch": 0.87, "learning_rate": 8.792849347003562e-05, "loss": 2.2154, "step": 32357 }, { "epoch": 0.87, "learning_rate": 8.789280814183975e-05, "loss": 2.4301, "step": 32358 }, { "epoch": 0.87, "learning_rate": 8.785712972360505e-05, "loss": 2.4988, "step": 32359 }, { "epoch": 0.87, "learning_rate": 8.782145821560139e-05, "loss": 2.683, "step": 32360 }, { "epoch": 0.87, "learning_rate": 8.778579361809946e-05, "loss": 2.9411, "step": 32361 }, { "epoch": 0.87, "learning_rate": 8.775013593136915e-05, "loss": 2.5099, "step": 32362 }, { "epoch": 0.87, "learning_rate": 8.771448515568081e-05, "loss": 2.3804, "step": 32363 }, { "epoch": 0.87, "learning_rate": 8.767884129130432e-05, "loss": 2.4943, "step": 32364 }, { "epoch": 0.87, "learning_rate": 8.76432043385098e-05, "loss": 2.2878, "step": 32365 }, { "epoch": 0.87, "learning_rate": 8.760757429756727e-05, "loss": 2.5931, "step": 32366 }, { "epoch": 0.87, "learning_rate": 8.757195116874684e-05, "loss": 3.0454, "step": 32367 }, { "epoch": 0.87, "learning_rate": 8.753633495231794e-05, "loss": 2.5877, "step": 32368 }, { "epoch": 0.87, "learning_rate": 8.750072564855071e-05, "loss": 2.5339, "step": 32369 }, { "epoch": 0.87, "learning_rate": 8.746512325771483e-05, "loss": 2.5992, "step": 32370 }, { "epoch": 0.87, "learning_rate": 8.742952778007995e-05, "loss": 2.7409, "step": 32371 }, { "epoch": 0.87, "learning_rate": 8.73939392159161e-05, "loss": 2.4356, "step": 32372 }, { "epoch": 0.87, "learning_rate": 8.735835756549238e-05, "loss": 2.6002, "step": 32373 }, { "epoch": 0.87, "learning_rate": 8.732278282907857e-05, "loss": 2.4356, "step": 32374 }, { "epoch": 0.87, "learning_rate": 8.728721500694437e-05, "loss": 2.5509, "step": 32375 }, { "epoch": 0.87, "learning_rate": 8.725165409935875e-05, "loss": 2.7243, "step": 32376 }, { "epoch": 0.87, "learning_rate": 8.721610010659153e-05, "loss": 2.6875, "step": 32377 }, { "epoch": 0.87, "learning_rate": 8.718055302891215e-05, "loss": 2.1475, "step": 32378 }, { "epoch": 0.87, "learning_rate": 8.714501286658949e-05, "loss": 2.5145, "step": 32379 }, { "epoch": 0.87, "learning_rate": 8.710947961989324e-05, "loss": 2.5275, "step": 32380 }, { "epoch": 0.87, "learning_rate": 8.707395328909218e-05, "loss": 2.5785, "step": 32381 }, { "epoch": 0.87, "learning_rate": 8.703843387445553e-05, "loss": 2.3863, "step": 32382 }, { "epoch": 0.87, "learning_rate": 8.700292137625266e-05, "loss": 2.7208, "step": 32383 }, { "epoch": 0.87, "learning_rate": 8.696741579475232e-05, "loss": 2.4666, "step": 32384 }, { "epoch": 0.87, "learning_rate": 8.693191713022353e-05, "loss": 2.6909, "step": 32385 }, { "epoch": 0.87, "learning_rate": 8.689642538293563e-05, "loss": 2.4913, "step": 32386 }, { "epoch": 0.87, "learning_rate": 8.686094055315685e-05, "loss": 2.4068, "step": 32387 }, { "epoch": 0.87, "learning_rate": 8.682546264115665e-05, "loss": 2.3631, "step": 32388 }, { "epoch": 0.87, "learning_rate": 8.678999164720303e-05, "loss": 2.5804, "step": 32389 }, { "epoch": 0.87, "learning_rate": 8.675452757156532e-05, "loss": 2.854, "step": 32390 }, { "epoch": 0.87, "learning_rate": 8.671907041451232e-05, "loss": 2.4963, "step": 32391 }, { "epoch": 0.87, "learning_rate": 8.668362017631204e-05, "loss": 2.3259, "step": 32392 }, { "epoch": 0.87, "learning_rate": 8.664817685723348e-05, "loss": 2.3494, "step": 32393 }, { "epoch": 0.87, "learning_rate": 8.661274045754519e-05, "loss": 2.3682, "step": 32394 }, { "epoch": 0.87, "learning_rate": 8.657731097751531e-05, "loss": 2.5958, "step": 32395 }, { "epoch": 0.87, "learning_rate": 8.65418884174124e-05, "loss": 2.5212, "step": 32396 }, { "epoch": 0.87, "learning_rate": 8.650647277750489e-05, "loss": 2.6864, "step": 32397 }, { "epoch": 0.87, "learning_rate": 8.647106405806093e-05, "loss": 2.4749, "step": 32398 }, { "epoch": 0.87, "learning_rate": 8.643566225934907e-05, "loss": 2.4928, "step": 32399 }, { "epoch": 0.87, "learning_rate": 8.64002673816372e-05, "loss": 2.2482, "step": 32400 }, { "epoch": 0.87, "learning_rate": 8.636487942519345e-05, "loss": 2.4399, "step": 32401 }, { "epoch": 0.87, "learning_rate": 8.632949839028615e-05, "loss": 2.1957, "step": 32402 }, { "epoch": 0.87, "learning_rate": 8.62941242771832e-05, "loss": 2.2527, "step": 32403 }, { "epoch": 0.87, "learning_rate": 8.625875708615272e-05, "loss": 2.7611, "step": 32404 }, { "epoch": 0.87, "learning_rate": 8.622339681746238e-05, "loss": 2.6037, "step": 32405 }, { "epoch": 0.87, "learning_rate": 8.61880434713802e-05, "loss": 2.6642, "step": 32406 }, { "epoch": 0.87, "learning_rate": 8.61526970481743e-05, "loss": 2.6056, "step": 32407 }, { "epoch": 0.87, "learning_rate": 8.61173575481119e-05, "loss": 2.1883, "step": 32408 }, { "epoch": 0.87, "learning_rate": 8.608202497146101e-05, "loss": 2.2327, "step": 32409 }, { "epoch": 0.87, "learning_rate": 8.604669931848941e-05, "loss": 2.5973, "step": 32410 }, { "epoch": 0.87, "learning_rate": 8.601138058946457e-05, "loss": 2.216, "step": 32411 }, { "epoch": 0.87, "learning_rate": 8.597606878465403e-05, "loss": 2.3494, "step": 32412 }, { "epoch": 0.87, "learning_rate": 8.594076390432571e-05, "loss": 2.3108, "step": 32413 }, { "epoch": 0.87, "learning_rate": 8.590546594874638e-05, "loss": 2.3922, "step": 32414 }, { "epoch": 0.87, "learning_rate": 8.587017491818394e-05, "loss": 2.6223, "step": 32415 }, { "epoch": 0.87, "learning_rate": 8.583489081290564e-05, "loss": 2.3251, "step": 32416 }, { "epoch": 0.87, "learning_rate": 8.579961363317868e-05, "loss": 2.2092, "step": 32417 }, { "epoch": 0.87, "learning_rate": 8.576434337927064e-05, "loss": 2.6966, "step": 32418 }, { "epoch": 0.87, "learning_rate": 8.57290800514483e-05, "loss": 2.5043, "step": 32419 }, { "epoch": 0.87, "learning_rate": 8.569382364997903e-05, "loss": 2.1114, "step": 32420 }, { "epoch": 0.87, "learning_rate": 8.565857417513001e-05, "loss": 2.1794, "step": 32421 }, { "epoch": 0.87, "learning_rate": 8.562333162716795e-05, "loss": 2.0391, "step": 32422 }, { "epoch": 0.87, "learning_rate": 8.558809600636008e-05, "loss": 2.9677, "step": 32423 }, { "epoch": 0.87, "learning_rate": 8.55528673129734e-05, "loss": 2.9203, "step": 32424 }, { "epoch": 0.87, "learning_rate": 8.551764554727459e-05, "loss": 2.7094, "step": 32425 }, { "epoch": 0.87, "learning_rate": 8.548243070953087e-05, "loss": 2.8672, "step": 32426 }, { "epoch": 0.87, "learning_rate": 8.54472228000085e-05, "loss": 1.9541, "step": 32427 }, { "epoch": 0.87, "learning_rate": 8.541202181897457e-05, "loss": 3.1184, "step": 32428 }, { "epoch": 0.87, "learning_rate": 8.537682776669552e-05, "loss": 2.0097, "step": 32429 }, { "epoch": 0.87, "learning_rate": 8.53416406434382e-05, "loss": 2.3446, "step": 32430 }, { "epoch": 0.87, "learning_rate": 8.530646044946922e-05, "loss": 2.1854, "step": 32431 }, { "epoch": 0.87, "learning_rate": 8.527128718505483e-05, "loss": 2.1464, "step": 32432 }, { "epoch": 0.87, "learning_rate": 8.523612085046162e-05, "loss": 2.5148, "step": 32433 }, { "epoch": 0.87, "learning_rate": 8.520096144595613e-05, "loss": 2.4788, "step": 32434 }, { "epoch": 0.87, "learning_rate": 8.516580897180448e-05, "loss": 2.4814, "step": 32435 }, { "epoch": 0.87, "learning_rate": 8.513066342827291e-05, "loss": 2.381, "step": 32436 }, { "epoch": 0.87, "learning_rate": 8.509552481562821e-05, "loss": 2.6113, "step": 32437 }, { "epoch": 0.87, "learning_rate": 8.506039313413605e-05, "loss": 2.5197, "step": 32438 }, { "epoch": 0.87, "learning_rate": 8.502526838406299e-05, "loss": 2.868, "step": 32439 }, { "epoch": 0.87, "learning_rate": 8.499015056567471e-05, "loss": 2.324, "step": 32440 }, { "epoch": 0.87, "learning_rate": 8.495503967923757e-05, "loss": 2.4814, "step": 32441 }, { "epoch": 0.87, "learning_rate": 8.491993572501733e-05, "loss": 2.4349, "step": 32442 }, { "epoch": 0.87, "learning_rate": 8.488483870328012e-05, "loss": 1.9928, "step": 32443 }, { "epoch": 0.87, "learning_rate": 8.484974861429173e-05, "loss": 2.1672, "step": 32444 }, { "epoch": 0.87, "learning_rate": 8.481466545831828e-05, "loss": 2.1169, "step": 32445 }, { "epoch": 0.87, "learning_rate": 8.477958923562501e-05, "loss": 2.5452, "step": 32446 }, { "epoch": 0.87, "learning_rate": 8.474451994647825e-05, "loss": 2.0252, "step": 32447 }, { "epoch": 0.87, "learning_rate": 8.470945759114312e-05, "loss": 2.6607, "step": 32448 }, { "epoch": 0.87, "learning_rate": 8.467440216988531e-05, "loss": 2.1354, "step": 32449 }, { "epoch": 0.87, "learning_rate": 8.463935368297093e-05, "loss": 2.2302, "step": 32450 }, { "epoch": 0.87, "learning_rate": 8.4604312130665e-05, "loss": 2.6945, "step": 32451 }, { "epoch": 0.87, "learning_rate": 8.456927751323317e-05, "loss": 2.4099, "step": 32452 }, { "epoch": 0.87, "learning_rate": 8.453424983094105e-05, "loss": 2.276, "step": 32453 }, { "epoch": 0.87, "learning_rate": 8.44992290840535e-05, "loss": 2.3974, "step": 32454 }, { "epoch": 0.87, "learning_rate": 8.446421527283609e-05, "loss": 2.5697, "step": 32455 }, { "epoch": 0.87, "learning_rate": 8.442920839755419e-05, "loss": 2.721, "step": 32456 }, { "epoch": 0.87, "learning_rate": 8.43942084584729e-05, "loss": 2.267, "step": 32457 }, { "epoch": 0.87, "learning_rate": 8.435921545585757e-05, "loss": 2.3009, "step": 32458 }, { "epoch": 0.87, "learning_rate": 8.432422938997297e-05, "loss": 2.9931, "step": 32459 }, { "epoch": 0.87, "learning_rate": 8.428925026108425e-05, "loss": 2.6423, "step": 32460 }, { "epoch": 0.87, "learning_rate": 8.425427806945674e-05, "loss": 2.8226, "step": 32461 }, { "epoch": 0.87, "learning_rate": 8.421931281535466e-05, "loss": 2.8218, "step": 32462 }, { "epoch": 0.87, "learning_rate": 8.418435449904349e-05, "loss": 2.7576, "step": 32463 }, { "epoch": 0.87, "learning_rate": 8.414940312078812e-05, "loss": 2.02, "step": 32464 }, { "epoch": 0.87, "learning_rate": 8.411445868085299e-05, "loss": 2.4716, "step": 32465 }, { "epoch": 0.87, "learning_rate": 8.407952117950312e-05, "loss": 2.7328, "step": 32466 }, { "epoch": 0.87, "learning_rate": 8.404459061700287e-05, "loss": 2.5192, "step": 32467 }, { "epoch": 0.87, "learning_rate": 8.400966699361701e-05, "loss": 2.7426, "step": 32468 }, { "epoch": 0.87, "learning_rate": 8.397475030961021e-05, "loss": 2.9666, "step": 32469 }, { "epoch": 0.87, "learning_rate": 8.393984056524695e-05, "loss": 2.3649, "step": 32470 }, { "epoch": 0.87, "learning_rate": 8.390493776079167e-05, "loss": 2.6738, "step": 32471 }, { "epoch": 0.87, "learning_rate": 8.387004189650894e-05, "loss": 2.2897, "step": 32472 }, { "epoch": 0.87, "learning_rate": 8.383515297266275e-05, "loss": 2.5952, "step": 32473 }, { "epoch": 0.87, "learning_rate": 8.380027098951793e-05, "loss": 2.7299, "step": 32474 }, { "epoch": 0.87, "learning_rate": 8.376539594733801e-05, "loss": 2.6881, "step": 32475 }, { "epoch": 0.87, "learning_rate": 8.373052784638791e-05, "loss": 2.338, "step": 32476 }, { "epoch": 0.87, "learning_rate": 8.369566668693163e-05, "loss": 2.5309, "step": 32477 }, { "epoch": 0.87, "learning_rate": 8.366081246923307e-05, "loss": 2.5202, "step": 32478 }, { "epoch": 0.87, "learning_rate": 8.362596519355625e-05, "loss": 2.5466, "step": 32479 }, { "epoch": 0.87, "learning_rate": 8.359112486016551e-05, "loss": 2.4236, "step": 32480 }, { "epoch": 0.87, "learning_rate": 8.355629146932442e-05, "loss": 2.646, "step": 32481 }, { "epoch": 0.87, "learning_rate": 8.352146502129698e-05, "loss": 2.5305, "step": 32482 }, { "epoch": 0.87, "learning_rate": 8.34866455163471e-05, "loss": 2.7486, "step": 32483 }, { "epoch": 0.87, "learning_rate": 8.345183295473857e-05, "loss": 2.5899, "step": 32484 }, { "epoch": 0.87, "learning_rate": 8.341702733673517e-05, "loss": 2.6807, "step": 32485 }, { "epoch": 0.87, "learning_rate": 8.338222866260037e-05, "loss": 2.5399, "step": 32486 }, { "epoch": 0.87, "learning_rate": 8.334743693259794e-05, "loss": 2.1507, "step": 32487 }, { "epoch": 0.87, "learning_rate": 8.331265214699147e-05, "loss": 2.2935, "step": 32488 }, { "epoch": 0.87, "learning_rate": 8.327787430604439e-05, "loss": 2.5747, "step": 32489 }, { "epoch": 0.87, "learning_rate": 8.324310341002028e-05, "loss": 2.5098, "step": 32490 }, { "epoch": 0.87, "learning_rate": 8.320833945918271e-05, "loss": 2.4876, "step": 32491 }, { "epoch": 0.87, "learning_rate": 8.317358245379469e-05, "loss": 3.0422, "step": 32492 }, { "epoch": 0.87, "learning_rate": 8.31388323941199e-05, "loss": 2.4098, "step": 32493 }, { "epoch": 0.87, "learning_rate": 8.310408928042112e-05, "loss": 2.1166, "step": 32494 }, { "epoch": 0.87, "learning_rate": 8.306935311296193e-05, "loss": 2.2475, "step": 32495 }, { "epoch": 0.87, "learning_rate": 8.303462389200534e-05, "loss": 2.2929, "step": 32496 }, { "epoch": 0.87, "learning_rate": 8.299990161781445e-05, "loss": 2.6736, "step": 32497 }, { "epoch": 0.87, "learning_rate": 8.296518629065242e-05, "loss": 2.0154, "step": 32498 }, { "epoch": 0.87, "learning_rate": 8.293047791078234e-05, "loss": 2.3641, "step": 32499 }, { "epoch": 0.87, "learning_rate": 8.28957764784668e-05, "loss": 2.4344, "step": 32500 }, { "epoch": 0.87, "learning_rate": 8.286108199396902e-05, "loss": 2.641, "step": 32501 }, { "epoch": 0.87, "learning_rate": 8.282639445755158e-05, "loss": 2.391, "step": 32502 }, { "epoch": 0.87, "learning_rate": 8.279171386947747e-05, "loss": 2.3858, "step": 32503 }, { "epoch": 0.87, "learning_rate": 8.275704023000952e-05, "loss": 2.4372, "step": 32504 }, { "epoch": 0.87, "learning_rate": 8.272237353941003e-05, "loss": 2.4602, "step": 32505 }, { "epoch": 0.87, "learning_rate": 8.268771379794193e-05, "loss": 2.3359, "step": 32506 }, { "epoch": 0.87, "learning_rate": 8.265306100586778e-05, "loss": 2.7844, "step": 32507 }, { "epoch": 0.87, "learning_rate": 8.261841516344992e-05, "loss": 2.2855, "step": 32508 }, { "epoch": 0.87, "learning_rate": 8.258377627095093e-05, "loss": 2.9648, "step": 32509 }, { "epoch": 0.87, "learning_rate": 8.254914432863326e-05, "loss": 2.242, "step": 32510 }, { "epoch": 0.87, "learning_rate": 8.251451933675913e-05, "loss": 2.2892, "step": 32511 }, { "epoch": 0.87, "learning_rate": 8.247990129559124e-05, "loss": 2.0681, "step": 32512 }, { "epoch": 0.87, "learning_rate": 8.244529020539148e-05, "loss": 2.3163, "step": 32513 }, { "epoch": 0.87, "learning_rate": 8.2410686066422e-05, "loss": 2.57, "step": 32514 }, { "epoch": 0.87, "learning_rate": 8.23760888789452e-05, "loss": 2.5472, "step": 32515 }, { "epoch": 0.87, "learning_rate": 8.234149864322304e-05, "loss": 2.3083, "step": 32516 }, { "epoch": 0.87, "learning_rate": 8.230691535951795e-05, "loss": 2.1372, "step": 32517 }, { "epoch": 0.87, "learning_rate": 8.227233902809129e-05, "loss": 3.0416, "step": 32518 }, { "epoch": 0.87, "learning_rate": 8.223776964920527e-05, "loss": 2.4808, "step": 32519 }, { "epoch": 0.87, "learning_rate": 8.220320722312214e-05, "loss": 2.192, "step": 32520 }, { "epoch": 0.87, "learning_rate": 8.216865175010314e-05, "loss": 2.002, "step": 32521 }, { "epoch": 0.87, "learning_rate": 8.213410323041026e-05, "loss": 2.5767, "step": 32522 }, { "epoch": 0.87, "learning_rate": 8.209956166430555e-05, "loss": 2.5242, "step": 32523 }, { "epoch": 0.87, "learning_rate": 8.206502705205044e-05, "loss": 2.7383, "step": 32524 }, { "epoch": 0.87, "learning_rate": 8.20304993939064e-05, "loss": 2.5826, "step": 32525 }, { "epoch": 0.87, "learning_rate": 8.199597869013542e-05, "loss": 2.3349, "step": 32526 }, { "epoch": 0.87, "learning_rate": 8.196146494099865e-05, "loss": 2.3898, "step": 32527 }, { "epoch": 0.87, "learning_rate": 8.192695814675766e-05, "loss": 2.5358, "step": 32528 }, { "epoch": 0.87, "learning_rate": 8.189245830767388e-05, "loss": 2.4842, "step": 32529 }, { "epoch": 0.87, "learning_rate": 8.18579654240087e-05, "loss": 2.733, "step": 32530 }, { "epoch": 0.87, "learning_rate": 8.182347949602365e-05, "loss": 2.3934, "step": 32531 }, { "epoch": 0.87, "learning_rate": 8.178900052397953e-05, "loss": 2.8055, "step": 32532 }, { "epoch": 0.87, "learning_rate": 8.175452850813781e-05, "loss": 2.0437, "step": 32533 }, { "epoch": 0.87, "learning_rate": 8.172006344875959e-05, "loss": 2.6705, "step": 32534 }, { "epoch": 0.87, "learning_rate": 8.168560534610603e-05, "loss": 2.1425, "step": 32535 }, { "epoch": 0.87, "learning_rate": 8.165115420043834e-05, "loss": 2.6266, "step": 32536 }, { "epoch": 0.87, "learning_rate": 8.161671001201709e-05, "loss": 2.1376, "step": 32537 }, { "epoch": 0.87, "learning_rate": 8.158227278110352e-05, "loss": 2.5874, "step": 32538 }, { "epoch": 0.87, "learning_rate": 8.154784250795855e-05, "loss": 2.6412, "step": 32539 }, { "epoch": 0.87, "learning_rate": 8.151341919284284e-05, "loss": 2.6325, "step": 32540 }, { "epoch": 0.87, "learning_rate": 8.147900283601717e-05, "loss": 2.2696, "step": 32541 }, { "epoch": 0.87, "learning_rate": 8.144459343774235e-05, "loss": 2.5734, "step": 32542 }, { "epoch": 0.87, "learning_rate": 8.141019099827906e-05, "loss": 2.9119, "step": 32543 }, { "epoch": 0.87, "learning_rate": 8.13757955178882e-05, "loss": 2.3767, "step": 32544 }, { "epoch": 0.87, "learning_rate": 8.134140699682991e-05, "loss": 2.6792, "step": 32545 }, { "epoch": 0.87, "learning_rate": 8.130702543536472e-05, "loss": 2.0643, "step": 32546 }, { "epoch": 0.87, "learning_rate": 8.127265083375346e-05, "loss": 2.2573, "step": 32547 }, { "epoch": 0.87, "learning_rate": 8.123828319225624e-05, "loss": 2.8788, "step": 32548 }, { "epoch": 0.87, "learning_rate": 8.120392251113351e-05, "loss": 2.6953, "step": 32549 }, { "epoch": 0.87, "learning_rate": 8.116956879064575e-05, "loss": 2.2219, "step": 32550 }, { "epoch": 0.87, "learning_rate": 8.113522203105294e-05, "loss": 2.6621, "step": 32551 }, { "epoch": 0.87, "learning_rate": 8.110088223261558e-05, "loss": 2.6128, "step": 32552 }, { "epoch": 0.87, "learning_rate": 8.106654939559355e-05, "loss": 2.3238, "step": 32553 }, { "epoch": 0.87, "learning_rate": 8.103222352024697e-05, "loss": 2.6785, "step": 32554 }, { "epoch": 0.87, "learning_rate": 8.099790460683598e-05, "loss": 2.3964, "step": 32555 }, { "epoch": 0.87, "learning_rate": 8.096359265562059e-05, "loss": 2.2783, "step": 32556 }, { "epoch": 0.87, "learning_rate": 8.092928766686058e-05, "loss": 2.599, "step": 32557 }, { "epoch": 0.87, "learning_rate": 8.089498964081632e-05, "loss": 2.4603, "step": 32558 }, { "epoch": 0.87, "learning_rate": 8.086069857774702e-05, "loss": 2.81, "step": 32559 }, { "epoch": 0.88, "learning_rate": 8.082641447791284e-05, "loss": 2.932, "step": 32560 }, { "epoch": 0.88, "learning_rate": 8.079213734157332e-05, "loss": 2.8927, "step": 32561 }, { "epoch": 0.88, "learning_rate": 8.075786716898825e-05, "loss": 2.4224, "step": 32562 }, { "epoch": 0.88, "learning_rate": 8.072360396041745e-05, "loss": 2.5413, "step": 32563 }, { "epoch": 0.88, "learning_rate": 8.068934771612002e-05, "loss": 2.4194, "step": 32564 }, { "epoch": 0.88, "learning_rate": 8.065509843635577e-05, "loss": 2.1685, "step": 32565 }, { "epoch": 0.88, "learning_rate": 8.062085612138437e-05, "loss": 2.7627, "step": 32566 }, { "epoch": 0.88, "learning_rate": 8.058662077146473e-05, "loss": 2.4416, "step": 32567 }, { "epoch": 0.88, "learning_rate": 8.05523923868563e-05, "loss": 2.6655, "step": 32568 }, { "epoch": 0.88, "learning_rate": 8.0518170967819e-05, "loss": 2.067, "step": 32569 }, { "epoch": 0.88, "learning_rate": 8.048395651461138e-05, "loss": 2.5071, "step": 32570 }, { "epoch": 0.88, "learning_rate": 8.044974902749313e-05, "loss": 2.62, "step": 32571 }, { "epoch": 0.88, "learning_rate": 8.041554850672306e-05, "loss": 2.3025, "step": 32572 }, { "epoch": 0.88, "learning_rate": 8.038135495256027e-05, "loss": 2.1168, "step": 32573 }, { "epoch": 0.88, "learning_rate": 8.034716836526401e-05, "loss": 2.3842, "step": 32574 }, { "epoch": 0.88, "learning_rate": 8.031298874509319e-05, "loss": 2.7314, "step": 32575 }, { "epoch": 0.88, "learning_rate": 8.02788160923067e-05, "loss": 2.4367, "step": 32576 }, { "epoch": 0.88, "learning_rate": 8.024465040716366e-05, "loss": 2.54, "step": 32577 }, { "epoch": 0.88, "learning_rate": 8.021049168992256e-05, "loss": 2.7289, "step": 32578 }, { "epoch": 0.88, "learning_rate": 8.01763399408425e-05, "loss": 1.8729, "step": 32579 }, { "epoch": 0.88, "learning_rate": 8.014219516018184e-05, "loss": 2.5221, "step": 32580 }, { "epoch": 0.88, "learning_rate": 8.010805734819925e-05, "loss": 2.714, "step": 32581 }, { "epoch": 0.88, "learning_rate": 8.007392650515399e-05, "loss": 2.5507, "step": 32582 }, { "epoch": 0.88, "learning_rate": 8.003980263130395e-05, "loss": 2.5459, "step": 32583 }, { "epoch": 0.88, "learning_rate": 8.000568572690792e-05, "loss": 2.7773, "step": 32584 }, { "epoch": 0.88, "learning_rate": 7.997157579222447e-05, "loss": 2.4869, "step": 32585 }, { "epoch": 0.88, "learning_rate": 7.993747282751174e-05, "loss": 1.949, "step": 32586 }, { "epoch": 0.88, "learning_rate": 7.990337683302817e-05, "loss": 2.5564, "step": 32587 }, { "epoch": 0.88, "learning_rate": 7.986928780903224e-05, "loss": 2.1727, "step": 32588 }, { "epoch": 0.88, "learning_rate": 7.983520575578196e-05, "loss": 2.5358, "step": 32589 }, { "epoch": 0.88, "learning_rate": 7.980113067353589e-05, "loss": 2.5248, "step": 32590 }, { "epoch": 0.88, "learning_rate": 7.976706256255173e-05, "loss": 2.0164, "step": 32591 }, { "epoch": 0.88, "learning_rate": 7.973300142308782e-05, "loss": 2.4957, "step": 32592 }, { "epoch": 0.88, "learning_rate": 7.969894725540227e-05, "loss": 1.8546, "step": 32593 }, { "epoch": 0.88, "learning_rate": 7.966490005975268e-05, "loss": 2.5951, "step": 32594 }, { "epoch": 0.88, "learning_rate": 7.963085983639762e-05, "loss": 2.5198, "step": 32595 }, { "epoch": 0.88, "learning_rate": 7.959682658559442e-05, "loss": 2.7543, "step": 32596 }, { "epoch": 0.88, "learning_rate": 7.95628003076011e-05, "loss": 2.6445, "step": 32597 }, { "epoch": 0.88, "learning_rate": 7.952878100267569e-05, "loss": 2.3708, "step": 32598 }, { "epoch": 0.88, "learning_rate": 7.949476867107541e-05, "loss": 2.3798, "step": 32599 }, { "epoch": 0.88, "learning_rate": 7.946076331305818e-05, "loss": 1.8958, "step": 32600 }, { "epoch": 0.88, "learning_rate": 7.942676492888168e-05, "loss": 2.6535, "step": 32601 }, { "epoch": 0.88, "learning_rate": 7.939277351880347e-05, "loss": 2.7476, "step": 32602 }, { "epoch": 0.88, "learning_rate": 7.935878908308092e-05, "loss": 2.296, "step": 32603 }, { "epoch": 0.88, "learning_rate": 7.932481162197181e-05, "loss": 2.8112, "step": 32604 }, { "epoch": 0.88, "learning_rate": 7.929084113573315e-05, "loss": 2.559, "step": 32605 }, { "epoch": 0.88, "learning_rate": 7.925687762462263e-05, "loss": 2.0489, "step": 32606 }, { "epoch": 0.88, "learning_rate": 7.922292108889706e-05, "loss": 2.1829, "step": 32607 }, { "epoch": 0.88, "learning_rate": 7.918897152881421e-05, "loss": 2.7766, "step": 32608 }, { "epoch": 0.88, "learning_rate": 7.915502894463122e-05, "loss": 2.4633, "step": 32609 }, { "epoch": 0.88, "learning_rate": 7.912109333660489e-05, "loss": 2.3122, "step": 32610 }, { "epoch": 0.88, "learning_rate": 7.908716470499267e-05, "loss": 2.5788, "step": 32611 }, { "epoch": 0.88, "learning_rate": 7.905324305005146e-05, "loss": 2.7436, "step": 32612 }, { "epoch": 0.88, "learning_rate": 7.901932837203818e-05, "loss": 2.4896, "step": 32613 }, { "epoch": 0.88, "learning_rate": 7.898542067120973e-05, "loss": 2.0328, "step": 32614 }, { "epoch": 0.88, "learning_rate": 7.895151994782313e-05, "loss": 2.8089, "step": 32615 }, { "epoch": 0.88, "learning_rate": 7.891762620213506e-05, "loss": 2.6654, "step": 32616 }, { "epoch": 0.88, "learning_rate": 7.888373943440263e-05, "loss": 2.5907, "step": 32617 }, { "epoch": 0.88, "learning_rate": 7.884985964488211e-05, "loss": 2.3641, "step": 32618 }, { "epoch": 0.88, "learning_rate": 7.881598683383029e-05, "loss": 2.1897, "step": 32619 }, { "epoch": 0.88, "learning_rate": 7.878212100150395e-05, "loss": 2.5812, "step": 32620 }, { "epoch": 0.88, "learning_rate": 7.874826214815956e-05, "loss": 2.6943, "step": 32621 }, { "epoch": 0.88, "learning_rate": 7.871441027405379e-05, "loss": 2.1971, "step": 32622 }, { "epoch": 0.88, "learning_rate": 7.868056537944279e-05, "loss": 2.8812, "step": 32623 }, { "epoch": 0.88, "learning_rate": 7.864672746458313e-05, "loss": 2.3638, "step": 32624 }, { "epoch": 0.88, "learning_rate": 7.861289652973124e-05, "loss": 2.8352, "step": 32625 }, { "epoch": 0.88, "learning_rate": 7.857907257514318e-05, "loss": 2.4398, "step": 32626 }, { "epoch": 0.88, "learning_rate": 7.854525560107529e-05, "loss": 2.7792, "step": 32627 }, { "epoch": 0.88, "learning_rate": 7.851144560778389e-05, "loss": 2.7698, "step": 32628 }, { "epoch": 0.88, "learning_rate": 7.847764259552504e-05, "loss": 2.3005, "step": 32629 }, { "epoch": 0.88, "learning_rate": 7.844384656455483e-05, "loss": 2.2832, "step": 32630 }, { "epoch": 0.88, "learning_rate": 7.841005751512931e-05, "loss": 2.7121, "step": 32631 }, { "epoch": 0.88, "learning_rate": 7.837627544750425e-05, "loss": 2.4485, "step": 32632 }, { "epoch": 0.88, "learning_rate": 7.834250036193592e-05, "loss": 2.3162, "step": 32633 }, { "epoch": 0.88, "learning_rate": 7.830873225867985e-05, "loss": 2.4787, "step": 32634 }, { "epoch": 0.88, "learning_rate": 7.82749711379922e-05, "loss": 2.2872, "step": 32635 }, { "epoch": 0.88, "learning_rate": 7.824121700012865e-05, "loss": 2.2925, "step": 32636 }, { "epoch": 0.88, "learning_rate": 7.820746984534476e-05, "loss": 2.9258, "step": 32637 }, { "epoch": 0.88, "learning_rate": 7.817372967389624e-05, "loss": 2.5477, "step": 32638 }, { "epoch": 0.88, "learning_rate": 7.813999648603887e-05, "loss": 2.5997, "step": 32639 }, { "epoch": 0.88, "learning_rate": 7.810627028202788e-05, "loss": 2.704, "step": 32640 }, { "epoch": 0.88, "learning_rate": 7.807255106211908e-05, "loss": 2.5787, "step": 32641 }, { "epoch": 0.88, "learning_rate": 7.803883882656771e-05, "loss": 2.4334, "step": 32642 }, { "epoch": 0.88, "learning_rate": 7.800513357562933e-05, "loss": 2.6297, "step": 32643 }, { "epoch": 0.88, "learning_rate": 7.797143530955941e-05, "loss": 2.5481, "step": 32644 }, { "epoch": 0.88, "learning_rate": 7.793774402861275e-05, "loss": 2.3246, "step": 32645 }, { "epoch": 0.88, "learning_rate": 7.790405973304504e-05, "loss": 2.3472, "step": 32646 }, { "epoch": 0.88, "learning_rate": 7.787038242311128e-05, "loss": 2.8711, "step": 32647 }, { "epoch": 0.88, "learning_rate": 7.783671209906662e-05, "loss": 2.8113, "step": 32648 }, { "epoch": 0.88, "learning_rate": 7.780304876116629e-05, "loss": 2.2205, "step": 32649 }, { "epoch": 0.88, "learning_rate": 7.776939240966507e-05, "loss": 2.5392, "step": 32650 }, { "epoch": 0.88, "learning_rate": 7.7735743044818e-05, "loss": 2.8595, "step": 32651 }, { "epoch": 0.88, "learning_rate": 7.770210066688033e-05, "loss": 2.8586, "step": 32652 }, { "epoch": 0.88, "learning_rate": 7.766846527610638e-05, "loss": 2.5234, "step": 32653 }, { "epoch": 0.88, "learning_rate": 7.763483687275108e-05, "loss": 2.6375, "step": 32654 }, { "epoch": 0.88, "learning_rate": 7.760121545706978e-05, "loss": 2.8027, "step": 32655 }, { "epoch": 0.88, "learning_rate": 7.756760102931648e-05, "loss": 2.5058, "step": 32656 }, { "epoch": 0.88, "learning_rate": 7.753399358974633e-05, "loss": 1.9615, "step": 32657 }, { "epoch": 0.88, "learning_rate": 7.750039313861357e-05, "loss": 2.4125, "step": 32658 }, { "epoch": 0.88, "learning_rate": 7.746679967617298e-05, "loss": 2.4154, "step": 32659 }, { "epoch": 0.88, "learning_rate": 7.743321320267882e-05, "loss": 2.5968, "step": 32660 }, { "epoch": 0.88, "learning_rate": 7.739963371838588e-05, "loss": 2.6112, "step": 32661 }, { "epoch": 0.88, "learning_rate": 7.736606122354817e-05, "loss": 2.2806, "step": 32662 }, { "epoch": 0.88, "learning_rate": 7.73324957184206e-05, "loss": 2.3678, "step": 32663 }, { "epoch": 0.88, "learning_rate": 7.729893720325676e-05, "loss": 2.1989, "step": 32664 }, { "epoch": 0.88, "learning_rate": 7.726538567831143e-05, "loss": 2.5467, "step": 32665 }, { "epoch": 0.88, "learning_rate": 7.723184114383841e-05, "loss": 2.7874, "step": 32666 }, { "epoch": 0.88, "learning_rate": 7.719830360009183e-05, "loss": 2.3381, "step": 32667 }, { "epoch": 0.88, "learning_rate": 7.716477304732617e-05, "loss": 2.2652, "step": 32668 }, { "epoch": 0.88, "learning_rate": 7.71312494857952e-05, "loss": 2.8066, "step": 32669 }, { "epoch": 0.88, "learning_rate": 7.709773291575273e-05, "loss": 2.71, "step": 32670 }, { "epoch": 0.88, "learning_rate": 7.706422333745311e-05, "loss": 2.4938, "step": 32671 }, { "epoch": 0.88, "learning_rate": 7.70307207511497e-05, "loss": 2.7443, "step": 32672 }, { "epoch": 0.88, "learning_rate": 7.699722515709651e-05, "loss": 2.6092, "step": 32673 }, { "epoch": 0.88, "learning_rate": 7.696373655554734e-05, "loss": 2.4077, "step": 32674 }, { "epoch": 0.88, "learning_rate": 7.693025494675598e-05, "loss": 2.3929, "step": 32675 }, { "epoch": 0.88, "learning_rate": 7.689678033097603e-05, "loss": 2.2379, "step": 32676 }, { "epoch": 0.88, "learning_rate": 7.686331270846092e-05, "loss": 2.4616, "step": 32677 }, { "epoch": 0.88, "learning_rate": 7.682985207946435e-05, "loss": 2.5602, "step": 32678 }, { "epoch": 0.88, "learning_rate": 7.679639844423991e-05, "loss": 2.3035, "step": 32679 }, { "epoch": 0.88, "learning_rate": 7.67629518030405e-05, "loss": 2.3228, "step": 32680 }, { "epoch": 0.88, "learning_rate": 7.672951215612012e-05, "loss": 2.3913, "step": 32681 }, { "epoch": 0.88, "learning_rate": 7.669607950373203e-05, "loss": 2.364, "step": 32682 }, { "epoch": 0.88, "learning_rate": 7.666265384612925e-05, "loss": 2.4608, "step": 32683 }, { "epoch": 0.88, "learning_rate": 7.662923518356535e-05, "loss": 2.5493, "step": 32684 }, { "epoch": 0.88, "learning_rate": 7.659582351629302e-05, "loss": 2.7009, "step": 32685 }, { "epoch": 0.88, "learning_rate": 7.656241884456572e-05, "loss": 2.5916, "step": 32686 }, { "epoch": 0.88, "learning_rate": 7.652902116863635e-05, "loss": 2.8819, "step": 32687 }, { "epoch": 0.88, "learning_rate": 7.649563048875808e-05, "loss": 2.9368, "step": 32688 }, { "epoch": 0.88, "learning_rate": 7.646224680518377e-05, "loss": 2.8386, "step": 32689 }, { "epoch": 0.88, "learning_rate": 7.642887011816646e-05, "loss": 2.3083, "step": 32690 }, { "epoch": 0.88, "learning_rate": 7.639550042795884e-05, "loss": 2.9805, "step": 32691 }, { "epoch": 0.88, "learning_rate": 7.636213773481394e-05, "loss": 2.5923, "step": 32692 }, { "epoch": 0.88, "learning_rate": 7.632878203898409e-05, "loss": 2.6033, "step": 32693 }, { "epoch": 0.88, "learning_rate": 7.629543334072231e-05, "loss": 2.2358, "step": 32694 }, { "epoch": 0.88, "learning_rate": 7.626209164028142e-05, "loss": 2.2606, "step": 32695 }, { "epoch": 0.88, "learning_rate": 7.622875693791353e-05, "loss": 2.459, "step": 32696 }, { "epoch": 0.88, "learning_rate": 7.619542923387147e-05, "loss": 2.707, "step": 32697 }, { "epoch": 0.88, "learning_rate": 7.616210852840788e-05, "loss": 2.6409, "step": 32698 }, { "epoch": 0.88, "learning_rate": 7.612879482177471e-05, "loss": 2.3503, "step": 32699 }, { "epoch": 0.88, "learning_rate": 7.609548811422473e-05, "loss": 2.4585, "step": 32700 }, { "epoch": 0.88, "learning_rate": 7.606218840601009e-05, "loss": 2.259, "step": 32701 }, { "epoch": 0.88, "learning_rate": 7.602889569738314e-05, "loss": 2.3616, "step": 32702 }, { "epoch": 0.88, "learning_rate": 7.599560998859622e-05, "loss": 2.3736, "step": 32703 }, { "epoch": 0.88, "learning_rate": 7.596233127990126e-05, "loss": 2.1878, "step": 32704 }, { "epoch": 0.88, "learning_rate": 7.592905957155049e-05, "loss": 2.5232, "step": 32705 }, { "epoch": 0.88, "learning_rate": 7.589579486379594e-05, "loss": 2.3791, "step": 32706 }, { "epoch": 0.88, "learning_rate": 7.586253715688962e-05, "loss": 2.2765, "step": 32707 }, { "epoch": 0.88, "learning_rate": 7.582928645108367e-05, "loss": 2.6637, "step": 32708 }, { "epoch": 0.88, "learning_rate": 7.579604274662955e-05, "loss": 2.4228, "step": 32709 }, { "epoch": 0.88, "learning_rate": 7.57628060437795e-05, "loss": 2.5702, "step": 32710 }, { "epoch": 0.88, "learning_rate": 7.572957634278532e-05, "loss": 2.1798, "step": 32711 }, { "epoch": 0.88, "learning_rate": 7.569635364389848e-05, "loss": 1.992, "step": 32712 }, { "epoch": 0.88, "learning_rate": 7.566313794737067e-05, "loss": 2.6946, "step": 32713 }, { "epoch": 0.88, "learning_rate": 7.56299292534539e-05, "loss": 2.0925, "step": 32714 }, { "epoch": 0.88, "learning_rate": 7.559672756239943e-05, "loss": 2.6276, "step": 32715 }, { "epoch": 0.88, "learning_rate": 7.556353287445894e-05, "loss": 2.5153, "step": 32716 }, { "epoch": 0.88, "learning_rate": 7.553034518988388e-05, "loss": 2.664, "step": 32717 }, { "epoch": 0.88, "learning_rate": 7.549716450892563e-05, "loss": 2.6709, "step": 32718 }, { "epoch": 0.88, "learning_rate": 7.546399083183542e-05, "loss": 2.4433, "step": 32719 }, { "epoch": 0.88, "learning_rate": 7.543082415886483e-05, "loss": 2.6695, "step": 32720 }, { "epoch": 0.88, "learning_rate": 7.539766449026497e-05, "loss": 1.942, "step": 32721 }, { "epoch": 0.88, "learning_rate": 7.536451182628735e-05, "loss": 2.1195, "step": 32722 }, { "epoch": 0.88, "learning_rate": 7.533136616718261e-05, "loss": 2.5415, "step": 32723 }, { "epoch": 0.88, "learning_rate": 7.529822751320226e-05, "loss": 2.6252, "step": 32724 }, { "epoch": 0.88, "learning_rate": 7.526509586459729e-05, "loss": 2.4274, "step": 32725 }, { "epoch": 0.88, "learning_rate": 7.523197122161829e-05, "loss": 2.4417, "step": 32726 }, { "epoch": 0.88, "learning_rate": 7.519885358451684e-05, "loss": 2.5155, "step": 32727 }, { "epoch": 0.88, "learning_rate": 7.516574295354339e-05, "loss": 2.3748, "step": 32728 }, { "epoch": 0.88, "learning_rate": 7.513263932894898e-05, "loss": 2.6421, "step": 32729 }, { "epoch": 0.88, "learning_rate": 7.509954271098452e-05, "loss": 2.6517, "step": 32730 }, { "epoch": 0.88, "learning_rate": 7.506645309990035e-05, "loss": 2.4468, "step": 32731 }, { "epoch": 0.88, "learning_rate": 7.503337049594738e-05, "loss": 2.2048, "step": 32732 }, { "epoch": 0.88, "learning_rate": 7.50002948993762e-05, "loss": 2.6667, "step": 32733 }, { "epoch": 0.88, "learning_rate": 7.496722631043739e-05, "loss": 2.338, "step": 32734 }, { "epoch": 0.88, "learning_rate": 7.493416472938174e-05, "loss": 2.6197, "step": 32735 }, { "epoch": 0.88, "learning_rate": 7.490111015645928e-05, "loss": 2.0987, "step": 32736 }, { "epoch": 0.88, "learning_rate": 7.486806259192058e-05, "loss": 2.3958, "step": 32737 }, { "epoch": 0.88, "learning_rate": 7.483502203601622e-05, "loss": 2.1878, "step": 32738 }, { "epoch": 0.88, "learning_rate": 7.4801988488996e-05, "loss": 2.6764, "step": 32739 }, { "epoch": 0.88, "learning_rate": 7.476896195111071e-05, "loss": 2.6812, "step": 32740 }, { "epoch": 0.88, "learning_rate": 7.47359424226105e-05, "loss": 2.5081, "step": 32741 }, { "epoch": 0.88, "learning_rate": 7.470292990374517e-05, "loss": 2.3657, "step": 32742 }, { "epoch": 0.88, "learning_rate": 7.466992439476528e-05, "loss": 2.6311, "step": 32743 }, { "epoch": 0.88, "learning_rate": 7.46369258959203e-05, "loss": 2.4813, "step": 32744 }, { "epoch": 0.88, "learning_rate": 7.46039344074606e-05, "loss": 2.4438, "step": 32745 }, { "epoch": 0.88, "learning_rate": 7.457094992963609e-05, "loss": 2.8849, "step": 32746 }, { "epoch": 0.88, "learning_rate": 7.453797246269656e-05, "loss": 2.1498, "step": 32747 }, { "epoch": 0.88, "learning_rate": 7.450500200689192e-05, "loss": 2.6224, "step": 32748 }, { "epoch": 0.88, "learning_rate": 7.447203856247198e-05, "loss": 2.3094, "step": 32749 }, { "epoch": 0.88, "learning_rate": 7.443908212968631e-05, "loss": 2.3233, "step": 32750 }, { "epoch": 0.88, "learning_rate": 7.440613270878471e-05, "loss": 2.6628, "step": 32751 }, { "epoch": 0.88, "learning_rate": 7.437319030001677e-05, "loss": 2.0631, "step": 32752 }, { "epoch": 0.88, "learning_rate": 7.434025490363205e-05, "loss": 2.5658, "step": 32753 }, { "epoch": 0.88, "learning_rate": 7.430732651988026e-05, "loss": 2.7269, "step": 32754 }, { "epoch": 0.88, "learning_rate": 7.427440514901041e-05, "loss": 2.4421, "step": 32755 }, { "epoch": 0.88, "learning_rate": 7.424149079127218e-05, "loss": 2.4795, "step": 32756 }, { "epoch": 0.88, "learning_rate": 7.420858344691516e-05, "loss": 2.3474, "step": 32757 }, { "epoch": 0.88, "learning_rate": 7.417568311618817e-05, "loss": 2.0466, "step": 32758 }, { "epoch": 0.88, "learning_rate": 7.414278979934064e-05, "loss": 2.2768, "step": 32759 }, { "epoch": 0.88, "learning_rate": 7.410990349662195e-05, "loss": 2.5683, "step": 32760 }, { "epoch": 0.88, "learning_rate": 7.4077024208281e-05, "loss": 2.7499, "step": 32761 }, { "epoch": 0.88, "learning_rate": 7.404415193456704e-05, "loss": 2.7844, "step": 32762 }, { "epoch": 0.88, "learning_rate": 7.401128667572898e-05, "loss": 2.598, "step": 32763 }, { "epoch": 0.88, "learning_rate": 7.397842843201586e-05, "loss": 2.6939, "step": 32764 }, { "epoch": 0.88, "learning_rate": 7.394557720367667e-05, "loss": 2.3007, "step": 32765 }, { "epoch": 0.88, "learning_rate": 7.391273299096013e-05, "loss": 2.7131, "step": 32766 }, { "epoch": 0.88, "learning_rate": 7.387989579411514e-05, "loss": 2.449, "step": 32767 }, { "epoch": 0.88, "learning_rate": 7.384706561339072e-05, "loss": 2.2836, "step": 32768 }, { "epoch": 0.88, "learning_rate": 7.381424244903524e-05, "loss": 2.3788, "step": 32769 }, { "epoch": 0.88, "learning_rate": 7.378142630129748e-05, "loss": 2.7205, "step": 32770 }, { "epoch": 0.88, "learning_rate": 7.374861717042602e-05, "loss": 2.6118, "step": 32771 }, { "epoch": 0.88, "learning_rate": 7.371581505666935e-05, "loss": 2.644, "step": 32772 }, { "epoch": 0.88, "learning_rate": 7.368301996027605e-05, "loss": 2.7115, "step": 32773 }, { "epoch": 0.88, "learning_rate": 7.365023188149467e-05, "loss": 2.6644, "step": 32774 }, { "epoch": 0.88, "learning_rate": 7.361745082057347e-05, "loss": 2.666, "step": 32775 }, { "epoch": 0.88, "learning_rate": 7.358467677776093e-05, "loss": 2.3548, "step": 32776 }, { "epoch": 0.88, "learning_rate": 7.355190975330517e-05, "loss": 2.1878, "step": 32777 }, { "epoch": 0.88, "learning_rate": 7.351914974745455e-05, "loss": 2.534, "step": 32778 }, { "epoch": 0.88, "learning_rate": 7.34863967604571e-05, "loss": 2.134, "step": 32779 }, { "epoch": 0.88, "learning_rate": 7.345365079256116e-05, "loss": 2.5498, "step": 32780 }, { "epoch": 0.88, "learning_rate": 7.342091184401478e-05, "loss": 2.7848, "step": 32781 }, { "epoch": 0.88, "learning_rate": 7.338817991506586e-05, "loss": 2.2687, "step": 32782 }, { "epoch": 0.88, "learning_rate": 7.33554550059623e-05, "loss": 2.4679, "step": 32783 }, { "epoch": 0.88, "learning_rate": 7.332273711695237e-05, "loss": 2.518, "step": 32784 }, { "epoch": 0.88, "learning_rate": 7.329002624828363e-05, "loss": 2.372, "step": 32785 }, { "epoch": 0.88, "learning_rate": 7.325732240020367e-05, "loss": 2.1716, "step": 32786 }, { "epoch": 0.88, "learning_rate": 7.322462557296095e-05, "loss": 2.2349, "step": 32787 }, { "epoch": 0.88, "learning_rate": 7.319193576680261e-05, "loss": 2.2213, "step": 32788 }, { "epoch": 0.88, "learning_rate": 7.315925298197667e-05, "loss": 2.3025, "step": 32789 }, { "epoch": 0.88, "learning_rate": 7.312657721873028e-05, "loss": 2.4269, "step": 32790 }, { "epoch": 0.88, "learning_rate": 7.309390847731123e-05, "loss": 2.6451, "step": 32791 }, { "epoch": 0.88, "learning_rate": 7.30612467579671e-05, "loss": 2.5292, "step": 32792 }, { "epoch": 0.88, "learning_rate": 7.302859206094514e-05, "loss": 2.4927, "step": 32793 }, { "epoch": 0.88, "learning_rate": 7.299594438649293e-05, "loss": 2.2703, "step": 32794 }, { "epoch": 0.88, "learning_rate": 7.296330373485782e-05, "loss": 2.3087, "step": 32795 }, { "epoch": 0.88, "learning_rate": 7.293067010628685e-05, "loss": 2.4302, "step": 32796 }, { "epoch": 0.88, "learning_rate": 7.289804350102747e-05, "loss": 2.1745, "step": 32797 }, { "epoch": 0.88, "learning_rate": 7.286542391932671e-05, "loss": 2.2025, "step": 32798 }, { "epoch": 0.88, "learning_rate": 7.283281136143149e-05, "loss": 2.0879, "step": 32799 }, { "epoch": 0.88, "learning_rate": 7.28002058275895e-05, "loss": 2.442, "step": 32800 }, { "epoch": 0.88, "learning_rate": 7.276760731804721e-05, "loss": 2.407, "step": 32801 }, { "epoch": 0.88, "learning_rate": 7.273501583305175e-05, "loss": 2.3475, "step": 32802 }, { "epoch": 0.88, "learning_rate": 7.270243137285026e-05, "loss": 2.8674, "step": 32803 }, { "epoch": 0.88, "learning_rate": 7.26698539376891e-05, "loss": 2.6709, "step": 32804 }, { "epoch": 0.88, "learning_rate": 7.26372835278154e-05, "loss": 2.8464, "step": 32805 }, { "epoch": 0.88, "learning_rate": 7.260472014347575e-05, "loss": 2.8717, "step": 32806 }, { "epoch": 0.88, "learning_rate": 7.257216378491705e-05, "loss": 2.4874, "step": 32807 }, { "epoch": 0.88, "learning_rate": 7.253961445238599e-05, "loss": 2.6106, "step": 32808 }, { "epoch": 0.88, "learning_rate": 7.250707214612873e-05, "loss": 2.6043, "step": 32809 }, { "epoch": 0.88, "learning_rate": 7.247453686639216e-05, "loss": 2.3178, "step": 32810 }, { "epoch": 0.88, "learning_rate": 7.244200861342276e-05, "loss": 2.2746, "step": 32811 }, { "epoch": 0.88, "learning_rate": 7.240948738746667e-05, "loss": 2.5285, "step": 32812 }, { "epoch": 0.88, "learning_rate": 7.237697318877067e-05, "loss": 2.6432, "step": 32813 }, { "epoch": 0.88, "learning_rate": 7.234446601758071e-05, "loss": 2.0432, "step": 32814 }, { "epoch": 0.88, "learning_rate": 7.231196587414335e-05, "loss": 2.3965, "step": 32815 }, { "epoch": 0.88, "learning_rate": 7.227947275870472e-05, "loss": 2.3517, "step": 32816 }, { "epoch": 0.88, "learning_rate": 7.224698667151086e-05, "loss": 2.7162, "step": 32817 }, { "epoch": 0.88, "learning_rate": 7.22145076128079e-05, "loss": 2.3489, "step": 32818 }, { "epoch": 0.88, "learning_rate": 7.218203558284198e-05, "loss": 2.3485, "step": 32819 }, { "epoch": 0.88, "learning_rate": 7.214957058185911e-05, "loss": 1.6963, "step": 32820 }, { "epoch": 0.88, "learning_rate": 7.211711261010523e-05, "loss": 3.0022, "step": 32821 }, { "epoch": 0.88, "learning_rate": 7.208466166782635e-05, "loss": 2.3439, "step": 32822 }, { "epoch": 0.88, "learning_rate": 7.205221775526794e-05, "loss": 2.6169, "step": 32823 }, { "epoch": 0.88, "learning_rate": 7.201978087267624e-05, "loss": 2.9516, "step": 32824 }, { "epoch": 0.88, "learning_rate": 7.198735102029652e-05, "loss": 2.2528, "step": 32825 }, { "epoch": 0.88, "learning_rate": 7.195492819837479e-05, "loss": 2.6512, "step": 32826 }, { "epoch": 0.88, "learning_rate": 7.192251240715675e-05, "loss": 2.4377, "step": 32827 }, { "epoch": 0.88, "learning_rate": 7.189010364688775e-05, "loss": 2.5974, "step": 32828 }, { "epoch": 0.88, "learning_rate": 7.185770191781338e-05, "loss": 2.5202, "step": 32829 }, { "epoch": 0.88, "learning_rate": 7.182530722017921e-05, "loss": 2.2143, "step": 32830 }, { "epoch": 0.88, "learning_rate": 7.179291955423051e-05, "loss": 2.619, "step": 32831 }, { "epoch": 0.88, "learning_rate": 7.176053892021262e-05, "loss": 2.4815, "step": 32832 }, { "epoch": 0.88, "learning_rate": 7.172816531837101e-05, "loss": 2.3541, "step": 32833 }, { "epoch": 0.88, "learning_rate": 7.169579874895082e-05, "loss": 2.4407, "step": 32834 }, { "epoch": 0.88, "learning_rate": 7.166343921219742e-05, "loss": 2.6655, "step": 32835 }, { "epoch": 0.88, "learning_rate": 7.163108670835572e-05, "loss": 2.2492, "step": 32836 }, { "epoch": 0.88, "learning_rate": 7.159874123767096e-05, "loss": 2.4684, "step": 32837 }, { "epoch": 0.88, "learning_rate": 7.156640280038807e-05, "loss": 2.8097, "step": 32838 }, { "epoch": 0.88, "learning_rate": 7.153407139675217e-05, "loss": 2.5117, "step": 32839 }, { "epoch": 0.88, "learning_rate": 7.150174702700829e-05, "loss": 3.0366, "step": 32840 }, { "epoch": 0.88, "learning_rate": 7.146942969140102e-05, "loss": 2.4482, "step": 32841 }, { "epoch": 0.88, "learning_rate": 7.143711939017539e-05, "loss": 2.4494, "step": 32842 }, { "epoch": 0.88, "learning_rate": 7.14048161235763e-05, "loss": 2.3308, "step": 32843 }, { "epoch": 0.88, "learning_rate": 7.1372519891848e-05, "loss": 2.1882, "step": 32844 }, { "epoch": 0.88, "learning_rate": 7.134023069523565e-05, "loss": 2.7026, "step": 32845 }, { "epoch": 0.88, "learning_rate": 7.130794853398359e-05, "loss": 2.428, "step": 32846 }, { "epoch": 0.88, "learning_rate": 7.127567340833651e-05, "loss": 2.8578, "step": 32847 }, { "epoch": 0.88, "learning_rate": 7.124340531853901e-05, "loss": 2.543, "step": 32848 }, { "epoch": 0.88, "learning_rate": 7.121114426483522e-05, "loss": 2.5818, "step": 32849 }, { "epoch": 0.88, "learning_rate": 7.117889024746982e-05, "loss": 2.4463, "step": 32850 }, { "epoch": 0.88, "learning_rate": 7.114664326668707e-05, "loss": 3.0275, "step": 32851 }, { "epoch": 0.88, "learning_rate": 7.111440332273133e-05, "loss": 2.1599, "step": 32852 }, { "epoch": 0.88, "learning_rate": 7.108217041584675e-05, "loss": 2.8664, "step": 32853 }, { "epoch": 0.88, "learning_rate": 7.104994454627778e-05, "loss": 2.8425, "step": 32854 }, { "epoch": 0.88, "learning_rate": 7.101772571426813e-05, "loss": 2.4027, "step": 32855 }, { "epoch": 0.88, "learning_rate": 7.098551392006236e-05, "loss": 2.3035, "step": 32856 }, { "epoch": 0.88, "learning_rate": 7.095330916390397e-05, "loss": 2.255, "step": 32857 }, { "epoch": 0.88, "learning_rate": 7.09211114460373e-05, "loss": 2.0144, "step": 32858 }, { "epoch": 0.88, "learning_rate": 7.088892076670617e-05, "loss": 2.1252, "step": 32859 }, { "epoch": 0.88, "learning_rate": 7.085673712615437e-05, "loss": 2.908, "step": 32860 }, { "epoch": 0.88, "learning_rate": 7.082456052462594e-05, "loss": 1.9862, "step": 32861 }, { "epoch": 0.88, "learning_rate": 7.079239096236468e-05, "loss": 2.7264, "step": 32862 }, { "epoch": 0.88, "learning_rate": 7.076022843961383e-05, "loss": 2.5758, "step": 32863 }, { "epoch": 0.88, "learning_rate": 7.072807295661754e-05, "loss": 2.5468, "step": 32864 }, { "epoch": 0.88, "learning_rate": 7.069592451361906e-05, "loss": 2.6836, "step": 32865 }, { "epoch": 0.88, "learning_rate": 7.066378311086219e-05, "loss": 2.1604, "step": 32866 }, { "epoch": 0.88, "learning_rate": 7.063164874859051e-05, "loss": 2.2336, "step": 32867 }, { "epoch": 0.88, "learning_rate": 7.059952142704718e-05, "loss": 2.9114, "step": 32868 }, { "epoch": 0.88, "learning_rate": 7.056740114647565e-05, "loss": 2.4821, "step": 32869 }, { "epoch": 0.88, "learning_rate": 7.05352879071196e-05, "loss": 2.7419, "step": 32870 }, { "epoch": 0.88, "learning_rate": 7.050318170922155e-05, "loss": 1.8215, "step": 32871 }, { "epoch": 0.88, "learning_rate": 7.047108255302547e-05, "loss": 2.3843, "step": 32872 }, { "epoch": 0.88, "learning_rate": 7.043899043877444e-05, "loss": 2.4134, "step": 32873 }, { "epoch": 0.88, "learning_rate": 7.040690536671124e-05, "loss": 2.7632, "step": 32874 }, { "epoch": 0.88, "learning_rate": 7.037482733707934e-05, "loss": 2.258, "step": 32875 }, { "epoch": 0.88, "learning_rate": 7.034275635012133e-05, "loss": 2.1824, "step": 32876 }, { "epoch": 0.88, "learning_rate": 7.031069240608045e-05, "loss": 2.6656, "step": 32877 }, { "epoch": 0.88, "learning_rate": 7.027863550519952e-05, "loss": 2.8904, "step": 32878 }, { "epoch": 0.88, "learning_rate": 7.024658564772146e-05, "loss": 2.824, "step": 32879 }, { "epoch": 0.88, "learning_rate": 7.021454283388895e-05, "loss": 2.5556, "step": 32880 }, { "epoch": 0.88, "learning_rate": 7.018250706394514e-05, "loss": 2.1937, "step": 32881 }, { "epoch": 0.88, "learning_rate": 7.015047833813215e-05, "loss": 2.0863, "step": 32882 }, { "epoch": 0.88, "learning_rate": 7.011845665669303e-05, "loss": 2.6476, "step": 32883 }, { "epoch": 0.88, "learning_rate": 7.008644201987003e-05, "loss": 2.5624, "step": 32884 }, { "epoch": 0.88, "learning_rate": 7.005443442790594e-05, "loss": 2.7414, "step": 32885 }, { "epoch": 0.88, "learning_rate": 7.002243388104345e-05, "loss": 2.4859, "step": 32886 }, { "epoch": 0.88, "learning_rate": 6.999044037952451e-05, "loss": 2.2725, "step": 32887 }, { "epoch": 0.88, "learning_rate": 6.995845392359168e-05, "loss": 2.2981, "step": 32888 }, { "epoch": 0.88, "learning_rate": 6.992647451348755e-05, "loss": 2.6703, "step": 32889 }, { "epoch": 0.88, "learning_rate": 6.989450214945404e-05, "loss": 2.0753, "step": 32890 }, { "epoch": 0.88, "learning_rate": 6.986253683173349e-05, "loss": 2.6683, "step": 32891 }, { "epoch": 0.88, "learning_rate": 6.983057856056807e-05, "loss": 2.242, "step": 32892 }, { "epoch": 0.88, "learning_rate": 6.979862733619979e-05, "loss": 2.7452, "step": 32893 }, { "epoch": 0.88, "learning_rate": 6.976668315887102e-05, "loss": 2.0588, "step": 32894 }, { "epoch": 0.88, "learning_rate": 6.973474602882345e-05, "loss": 2.8145, "step": 32895 }, { "epoch": 0.88, "learning_rate": 6.970281594629902e-05, "loss": 2.627, "step": 32896 }, { "epoch": 0.88, "learning_rate": 6.967089291153983e-05, "loss": 2.399, "step": 32897 }, { "epoch": 0.88, "learning_rate": 6.96389769247876e-05, "loss": 2.3219, "step": 32898 }, { "epoch": 0.88, "learning_rate": 6.960706798628414e-05, "loss": 2.4414, "step": 32899 }, { "epoch": 0.88, "learning_rate": 6.957516609627135e-05, "loss": 2.3957, "step": 32900 }, { "epoch": 0.88, "learning_rate": 6.95432712549906e-05, "loss": 2.7206, "step": 32901 }, { "epoch": 0.88, "learning_rate": 6.951138346268381e-05, "loss": 2.4433, "step": 32902 }, { "epoch": 0.88, "learning_rate": 6.947950271959236e-05, "loss": 1.9434, "step": 32903 }, { "epoch": 0.88, "learning_rate": 6.944762902595769e-05, "loss": 2.5161, "step": 32904 }, { "epoch": 0.88, "learning_rate": 6.941576238202153e-05, "loss": 2.6554, "step": 32905 }, { "epoch": 0.88, "learning_rate": 6.93839027880252e-05, "loss": 2.1138, "step": 32906 }, { "epoch": 0.88, "learning_rate": 6.935205024420998e-05, "loss": 2.4106, "step": 32907 }, { "epoch": 0.88, "learning_rate": 6.932020475081736e-05, "loss": 2.2684, "step": 32908 }, { "epoch": 0.88, "learning_rate": 6.928836630808844e-05, "loss": 2.2747, "step": 32909 }, { "epoch": 0.88, "learning_rate": 6.925653491626438e-05, "loss": 2.7569, "step": 32910 }, { "epoch": 0.88, "learning_rate": 6.922471057558644e-05, "loss": 2.305, "step": 32911 }, { "epoch": 0.88, "learning_rate": 6.919289328629564e-05, "loss": 2.5566, "step": 32912 }, { "epoch": 0.88, "learning_rate": 6.916108304863322e-05, "loss": 2.7443, "step": 32913 }, { "epoch": 0.88, "learning_rate": 6.91292798628399e-05, "loss": 2.4071, "step": 32914 }, { "epoch": 0.88, "learning_rate": 6.90974837291567e-05, "loss": 2.1473, "step": 32915 }, { "epoch": 0.88, "learning_rate": 6.906569464782475e-05, "loss": 2.2946, "step": 32916 }, { "epoch": 0.88, "learning_rate": 6.903391261908443e-05, "loss": 2.4068, "step": 32917 }, { "epoch": 0.88, "learning_rate": 6.900213764317686e-05, "loss": 2.112, "step": 32918 }, { "epoch": 0.88, "learning_rate": 6.897036972034254e-05, "loss": 2.4982, "step": 32919 }, { "epoch": 0.88, "learning_rate": 6.893860885082225e-05, "loss": 2.5388, "step": 32920 }, { "epoch": 0.88, "learning_rate": 6.890685503485684e-05, "loss": 2.3998, "step": 32921 }, { "epoch": 0.88, "learning_rate": 6.88751082726864e-05, "loss": 2.3106, "step": 32922 }, { "epoch": 0.88, "learning_rate": 6.884336856455165e-05, "loss": 2.6077, "step": 32923 }, { "epoch": 0.88, "learning_rate": 6.881163591069316e-05, "loss": 2.192, "step": 32924 }, { "epoch": 0.88, "learning_rate": 6.877991031135123e-05, "loss": 2.3525, "step": 32925 }, { "epoch": 0.88, "learning_rate": 6.874819176676627e-05, "loss": 2.333, "step": 32926 }, { "epoch": 0.88, "learning_rate": 6.871648027717836e-05, "loss": 2.5992, "step": 32927 }, { "epoch": 0.88, "learning_rate": 6.868477584282795e-05, "loss": 2.4716, "step": 32928 }, { "epoch": 0.88, "learning_rate": 6.865307846395541e-05, "loss": 2.5038, "step": 32929 }, { "epoch": 0.88, "learning_rate": 6.862138814080043e-05, "loss": 2.4694, "step": 32930 }, { "epoch": 0.88, "learning_rate": 6.858970487360305e-05, "loss": 2.5509, "step": 32931 }, { "epoch": 0.89, "learning_rate": 6.855802866260396e-05, "loss": 2.5315, "step": 32932 }, { "epoch": 0.89, "learning_rate": 6.852635950804253e-05, "loss": 2.6873, "step": 32933 }, { "epoch": 0.89, "learning_rate": 6.84946974101589e-05, "loss": 2.4994, "step": 32934 }, { "epoch": 0.89, "learning_rate": 6.846304236919299e-05, "loss": 2.52, "step": 32935 }, { "epoch": 0.89, "learning_rate": 6.843139438538437e-05, "loss": 2.3529, "step": 32936 }, { "epoch": 0.89, "learning_rate": 6.839975345897298e-05, "loss": 2.9473, "step": 32937 }, { "epoch": 0.89, "learning_rate": 6.836811959019851e-05, "loss": 2.5643, "step": 32938 }, { "epoch": 0.89, "learning_rate": 6.833649277930065e-05, "loss": 2.8194, "step": 32939 }, { "epoch": 0.89, "learning_rate": 6.830487302651911e-05, "loss": 2.41, "step": 32940 }, { "epoch": 0.89, "learning_rate": 6.827326033209303e-05, "loss": 2.574, "step": 32941 }, { "epoch": 0.89, "learning_rate": 6.824165469626232e-05, "loss": 2.6129, "step": 32942 }, { "epoch": 0.89, "learning_rate": 6.821005611926623e-05, "loss": 2.2565, "step": 32943 }, { "epoch": 0.89, "learning_rate": 6.817846460134391e-05, "loss": 2.3656, "step": 32944 }, { "epoch": 0.89, "learning_rate": 6.814688014273529e-05, "loss": 2.4624, "step": 32945 }, { "epoch": 0.89, "learning_rate": 6.811530274367916e-05, "loss": 2.2126, "step": 32946 }, { "epoch": 0.89, "learning_rate": 6.80837324044149e-05, "loss": 2.2877, "step": 32947 }, { "epoch": 0.89, "learning_rate": 6.805216912518175e-05, "loss": 1.9906, "step": 32948 }, { "epoch": 0.89, "learning_rate": 6.802061290621863e-05, "loss": 2.5193, "step": 32949 }, { "epoch": 0.89, "learning_rate": 6.79890637477647e-05, "loss": 2.4574, "step": 32950 }, { "epoch": 0.89, "learning_rate": 6.795752165005909e-05, "loss": 2.4998, "step": 32951 }, { "epoch": 0.89, "learning_rate": 6.79259866133406e-05, "loss": 2.6298, "step": 32952 }, { "epoch": 0.89, "learning_rate": 6.789445863784837e-05, "loss": 2.2218, "step": 32953 }, { "epoch": 0.89, "learning_rate": 6.786293772382091e-05, "loss": 2.3531, "step": 32954 }, { "epoch": 0.89, "learning_rate": 6.78314238714971e-05, "loss": 2.7277, "step": 32955 }, { "epoch": 0.89, "learning_rate": 6.7799917081116e-05, "loss": 2.2055, "step": 32956 }, { "epoch": 0.89, "learning_rate": 6.776841735291584e-05, "loss": 2.4827, "step": 32957 }, { "epoch": 0.89, "learning_rate": 6.773692468713543e-05, "loss": 2.2853, "step": 32958 }, { "epoch": 0.89, "learning_rate": 6.770543908401373e-05, "loss": 2.689, "step": 32959 }, { "epoch": 0.89, "learning_rate": 6.767396054378871e-05, "loss": 2.1207, "step": 32960 }, { "epoch": 0.89, "learning_rate": 6.764248906669934e-05, "loss": 2.833, "step": 32961 }, { "epoch": 0.89, "learning_rate": 6.761102465298353e-05, "loss": 1.8746, "step": 32962 }, { "epoch": 0.89, "learning_rate": 6.757956730287995e-05, "loss": 2.2894, "step": 32963 }, { "epoch": 0.89, "learning_rate": 6.754811701662677e-05, "loss": 2.265, "step": 32964 }, { "epoch": 0.89, "learning_rate": 6.751667379446247e-05, "loss": 2.506, "step": 32965 }, { "epoch": 0.89, "learning_rate": 6.748523763662507e-05, "loss": 2.476, "step": 32966 }, { "epoch": 0.89, "learning_rate": 6.745380854335303e-05, "loss": 2.4096, "step": 32967 }, { "epoch": 0.89, "learning_rate": 6.742238651488397e-05, "loss": 2.2408, "step": 32968 }, { "epoch": 0.89, "learning_rate": 6.739097155145635e-05, "loss": 1.8492, "step": 32969 }, { "epoch": 0.89, "learning_rate": 6.735956365330775e-05, "loss": 2.5325, "step": 32970 }, { "epoch": 0.89, "learning_rate": 6.732816282067645e-05, "loss": 2.4492, "step": 32971 }, { "epoch": 0.89, "learning_rate": 6.729676905380034e-05, "loss": 2.6609, "step": 32972 }, { "epoch": 0.89, "learning_rate": 6.726538235291712e-05, "loss": 2.8945, "step": 32973 }, { "epoch": 0.89, "learning_rate": 6.723400271826452e-05, "loss": 2.3851, "step": 32974 }, { "epoch": 0.89, "learning_rate": 6.720263015008055e-05, "loss": 2.7254, "step": 32975 }, { "epoch": 0.89, "learning_rate": 6.717126464860246e-05, "loss": 2.5177, "step": 32976 }, { "epoch": 0.89, "learning_rate": 6.713990621406818e-05, "loss": 2.7278, "step": 32977 }, { "epoch": 0.89, "learning_rate": 6.710855484671519e-05, "loss": 2.2689, "step": 32978 }, { "epoch": 0.89, "learning_rate": 6.707721054678096e-05, "loss": 2.5531, "step": 32979 }, { "epoch": 0.89, "learning_rate": 6.704587331450318e-05, "loss": 2.7335, "step": 32980 }, { "epoch": 0.89, "learning_rate": 6.70145431501189e-05, "loss": 2.626, "step": 32981 }, { "epoch": 0.89, "learning_rate": 6.698322005386558e-05, "loss": 2.6896, "step": 32982 }, { "epoch": 0.89, "learning_rate": 6.695190402598072e-05, "loss": 2.5125, "step": 32983 }, { "epoch": 0.89, "learning_rate": 6.692059506670133e-05, "loss": 2.4629, "step": 32984 }, { "epoch": 0.89, "learning_rate": 6.688929317626468e-05, "loss": 3.0687, "step": 32985 }, { "epoch": 0.89, "learning_rate": 6.685799835490802e-05, "loss": 2.4052, "step": 32986 }, { "epoch": 0.89, "learning_rate": 6.682671060286827e-05, "loss": 3.0072, "step": 32987 }, { "epoch": 0.89, "learning_rate": 6.679542992038267e-05, "loss": 2.9468, "step": 32988 }, { "epoch": 0.89, "learning_rate": 6.676415630768796e-05, "loss": 2.5332, "step": 32989 }, { "epoch": 0.89, "learning_rate": 6.6732889765021e-05, "loss": 2.3824, "step": 32990 }, { "epoch": 0.89, "learning_rate": 6.670163029261889e-05, "loss": 2.2439, "step": 32991 }, { "epoch": 0.89, "learning_rate": 6.667037789071839e-05, "loss": 2.6021, "step": 32992 }, { "epoch": 0.89, "learning_rate": 6.663913255955622e-05, "loss": 2.3307, "step": 32993 }, { "epoch": 0.89, "learning_rate": 6.660789429936931e-05, "loss": 2.3359, "step": 32994 }, { "epoch": 0.89, "learning_rate": 6.65766631103939e-05, "loss": 2.3364, "step": 32995 }, { "epoch": 0.89, "learning_rate": 6.654543899286691e-05, "loss": 2.1416, "step": 32996 }, { "epoch": 0.89, "learning_rate": 6.651422194702472e-05, "loss": 2.9378, "step": 32997 }, { "epoch": 0.89, "learning_rate": 6.64830119731038e-05, "loss": 2.6921, "step": 32998 }, { "epoch": 0.89, "learning_rate": 6.645180907134096e-05, "loss": 2.2246, "step": 32999 }, { "epoch": 0.89, "learning_rate": 6.642061324197213e-05, "loss": 2.1543, "step": 33000 }, { "epoch": 0.89, "learning_rate": 6.638942448523389e-05, "loss": 2.324, "step": 33001 }, { "epoch": 0.89, "learning_rate": 6.635824280136249e-05, "loss": 2.2773, "step": 33002 }, { "epoch": 0.89, "learning_rate": 6.632706819059408e-05, "loss": 1.9208, "step": 33003 }, { "epoch": 0.89, "learning_rate": 6.629590065316482e-05, "loss": 2.7317, "step": 33004 }, { "epoch": 0.89, "learning_rate": 6.626474018931083e-05, "loss": 2.3945, "step": 33005 }, { "epoch": 0.89, "learning_rate": 6.623358679926828e-05, "loss": 2.5969, "step": 33006 }, { "epoch": 0.89, "learning_rate": 6.620244048327328e-05, "loss": 1.9378, "step": 33007 }, { "epoch": 0.89, "learning_rate": 6.617130124156156e-05, "loss": 2.6018, "step": 33008 }, { "epoch": 0.89, "learning_rate": 6.614016907436903e-05, "loss": 2.6, "step": 33009 }, { "epoch": 0.89, "learning_rate": 6.610904398193162e-05, "loss": 2.7905, "step": 33010 }, { "epoch": 0.89, "learning_rate": 6.607792596448514e-05, "loss": 2.5736, "step": 33011 }, { "epoch": 0.89, "learning_rate": 6.60468150222654e-05, "loss": 2.5787, "step": 33012 }, { "epoch": 0.89, "learning_rate": 6.601571115550808e-05, "loss": 2.7125, "step": 33013 }, { "epoch": 0.89, "learning_rate": 6.598461436444858e-05, "loss": 2.9199, "step": 33014 }, { "epoch": 0.89, "learning_rate": 6.595352464932291e-05, "loss": 2.3824, "step": 33015 }, { "epoch": 0.89, "learning_rate": 6.592244201036612e-05, "loss": 2.523, "step": 33016 }, { "epoch": 0.89, "learning_rate": 6.58913664478138e-05, "loss": 2.8586, "step": 33017 }, { "epoch": 0.89, "learning_rate": 6.586029796190174e-05, "loss": 2.7241, "step": 33018 }, { "epoch": 0.89, "learning_rate": 6.582923655286488e-05, "loss": 2.441, "step": 33019 }, { "epoch": 0.89, "learning_rate": 6.57981822209388e-05, "loss": 2.7202, "step": 33020 }, { "epoch": 0.89, "learning_rate": 6.576713496635878e-05, "loss": 2.2727, "step": 33021 }, { "epoch": 0.89, "learning_rate": 6.57360947893597e-05, "loss": 2.5948, "step": 33022 }, { "epoch": 0.89, "learning_rate": 6.570506169017709e-05, "loss": 2.8876, "step": 33023 }, { "epoch": 0.89, "learning_rate": 6.567403566904573e-05, "loss": 2.5187, "step": 33024 }, { "epoch": 0.89, "learning_rate": 6.564301672620099e-05, "loss": 2.3945, "step": 33025 }, { "epoch": 0.89, "learning_rate": 6.56120048618778e-05, "loss": 2.861, "step": 33026 }, { "epoch": 0.89, "learning_rate": 6.558100007631085e-05, "loss": 2.7347, "step": 33027 }, { "epoch": 0.89, "learning_rate": 6.555000236973507e-05, "loss": 2.3971, "step": 33028 }, { "epoch": 0.89, "learning_rate": 6.551901174238573e-05, "loss": 2.542, "step": 33029 }, { "epoch": 0.89, "learning_rate": 6.548802819449696e-05, "loss": 2.7441, "step": 33030 }, { "epoch": 0.89, "learning_rate": 6.5457051726304e-05, "loss": 2.7615, "step": 33031 }, { "epoch": 0.89, "learning_rate": 6.542608233804126e-05, "loss": 2.0669, "step": 33032 }, { "epoch": 0.89, "learning_rate": 6.539512002994342e-05, "loss": 1.9485, "step": 33033 }, { "epoch": 0.89, "learning_rate": 6.536416480224528e-05, "loss": 2.684, "step": 33034 }, { "epoch": 0.89, "learning_rate": 6.533321665518088e-05, "loss": 2.3126, "step": 33035 }, { "epoch": 0.89, "learning_rate": 6.530227558898493e-05, "loss": 1.945, "step": 33036 }, { "epoch": 0.89, "learning_rate": 6.527134160389192e-05, "loss": 2.414, "step": 33037 }, { "epoch": 0.89, "learning_rate": 6.524041470013608e-05, "loss": 2.5681, "step": 33038 }, { "epoch": 0.89, "learning_rate": 6.52094948779518e-05, "loss": 2.5656, "step": 33039 }, { "epoch": 0.89, "learning_rate": 6.517858213757322e-05, "loss": 2.6261, "step": 33040 }, { "epoch": 0.89, "learning_rate": 6.514767647923459e-05, "loss": 2.3852, "step": 33041 }, { "epoch": 0.89, "learning_rate": 6.511677790316994e-05, "loss": 3.002, "step": 33042 }, { "epoch": 0.89, "learning_rate": 6.508588640961344e-05, "loss": 2.0949, "step": 33043 }, { "epoch": 0.89, "learning_rate": 6.505500199879922e-05, "loss": 1.9387, "step": 33044 }, { "epoch": 0.89, "learning_rate": 6.50241246709612e-05, "loss": 2.5084, "step": 33045 }, { "epoch": 0.89, "learning_rate": 6.499325442633308e-05, "loss": 2.2466, "step": 33046 }, { "epoch": 0.89, "learning_rate": 6.496239126514903e-05, "loss": 2.6622, "step": 33047 }, { "epoch": 0.89, "learning_rate": 6.493153518764282e-05, "loss": 2.6717, "step": 33048 }, { "epoch": 0.89, "learning_rate": 6.490068619404788e-05, "loss": 2.2553, "step": 33049 }, { "epoch": 0.89, "learning_rate": 6.486984428459831e-05, "loss": 2.6166, "step": 33050 }, { "epoch": 0.89, "learning_rate": 6.483900945952747e-05, "loss": 2.5751, "step": 33051 }, { "epoch": 0.89, "learning_rate": 6.480818171906922e-05, "loss": 2.3851, "step": 33052 }, { "epoch": 0.89, "learning_rate": 6.477736106345711e-05, "loss": 2.6862, "step": 33053 }, { "epoch": 0.89, "learning_rate": 6.474654749292442e-05, "loss": 2.7016, "step": 33054 }, { "epoch": 0.89, "learning_rate": 6.471574100770461e-05, "loss": 2.2864, "step": 33055 }, { "epoch": 0.89, "learning_rate": 6.468494160803107e-05, "loss": 2.4456, "step": 33056 }, { "epoch": 0.89, "learning_rate": 6.465414929413727e-05, "loss": 2.8243, "step": 33057 }, { "epoch": 0.89, "learning_rate": 6.462336406625657e-05, "loss": 2.3746, "step": 33058 }, { "epoch": 0.89, "learning_rate": 6.45925859246218e-05, "loss": 2.3178, "step": 33059 }, { "epoch": 0.89, "learning_rate": 6.456181486946644e-05, "loss": 2.3483, "step": 33060 }, { "epoch": 0.89, "learning_rate": 6.453105090102373e-05, "loss": 2.0875, "step": 33061 }, { "epoch": 0.89, "learning_rate": 6.450029401952628e-05, "loss": 2.7194, "step": 33062 }, { "epoch": 0.89, "learning_rate": 6.446954422520723e-05, "loss": 2.2116, "step": 33063 }, { "epoch": 0.89, "learning_rate": 6.443880151829995e-05, "loss": 2.3644, "step": 33064 }, { "epoch": 0.89, "learning_rate": 6.440806589903692e-05, "loss": 2.5413, "step": 33065 }, { "epoch": 0.89, "learning_rate": 6.437733736765128e-05, "loss": 2.5612, "step": 33066 }, { "epoch": 0.89, "learning_rate": 6.434661592437552e-05, "loss": 2.5435, "step": 33067 }, { "epoch": 0.89, "learning_rate": 6.431590156944244e-05, "loss": 1.8902, "step": 33068 }, { "epoch": 0.89, "learning_rate": 6.428519430308488e-05, "loss": 2.6359, "step": 33069 }, { "epoch": 0.89, "learning_rate": 6.42544941255353e-05, "loss": 2.0406, "step": 33070 }, { "epoch": 0.89, "learning_rate": 6.422380103702652e-05, "loss": 2.3152, "step": 33071 }, { "epoch": 0.89, "learning_rate": 6.419311503779102e-05, "loss": 2.2939, "step": 33072 }, { "epoch": 0.89, "learning_rate": 6.416243612806094e-05, "loss": 2.7529, "step": 33073 }, { "epoch": 0.89, "learning_rate": 6.413176430806921e-05, "loss": 2.4365, "step": 33074 }, { "epoch": 0.89, "learning_rate": 6.410109957804766e-05, "loss": 2.1195, "step": 33075 }, { "epoch": 0.89, "learning_rate": 6.407044193822876e-05, "loss": 2.718, "step": 33076 }, { "epoch": 0.89, "learning_rate": 6.403979138884508e-05, "loss": 2.4812, "step": 33077 }, { "epoch": 0.89, "learning_rate": 6.400914793012857e-05, "loss": 2.3821, "step": 33078 }, { "epoch": 0.89, "learning_rate": 6.397851156231138e-05, "loss": 2.5065, "step": 33079 }, { "epoch": 0.89, "learning_rate": 6.394788228562576e-05, "loss": 2.3858, "step": 33080 }, { "epoch": 0.89, "learning_rate": 6.391726010030352e-05, "loss": 2.3358, "step": 33081 }, { "epoch": 0.89, "learning_rate": 6.38866450065767e-05, "loss": 2.5982, "step": 33082 }, { "epoch": 0.89, "learning_rate": 6.385603700467735e-05, "loss": 2.2924, "step": 33083 }, { "epoch": 0.89, "learning_rate": 6.382543609483726e-05, "loss": 2.4057, "step": 33084 }, { "epoch": 0.89, "learning_rate": 6.379484227728849e-05, "loss": 2.5449, "step": 33085 }, { "epoch": 0.89, "learning_rate": 6.37642555522625e-05, "loss": 2.4766, "step": 33086 }, { "epoch": 0.89, "learning_rate": 6.373367591999102e-05, "loss": 2.0441, "step": 33087 }, { "epoch": 0.89, "learning_rate": 6.370310338070606e-05, "loss": 2.3903, "step": 33088 }, { "epoch": 0.89, "learning_rate": 6.367253793463867e-05, "loss": 2.7263, "step": 33089 }, { "epoch": 0.89, "learning_rate": 6.36419795820209e-05, "loss": 2.2371, "step": 33090 }, { "epoch": 0.89, "learning_rate": 6.361142832308419e-05, "loss": 2.6401, "step": 33091 }, { "epoch": 0.89, "learning_rate": 6.358088415805974e-05, "loss": 2.7217, "step": 33092 }, { "epoch": 0.89, "learning_rate": 6.355034708717932e-05, "loss": 2.4115, "step": 33093 }, { "epoch": 0.89, "learning_rate": 6.351981711067379e-05, "loss": 2.6307, "step": 33094 }, { "epoch": 0.89, "learning_rate": 6.348929422877481e-05, "loss": 2.5217, "step": 33095 }, { "epoch": 0.89, "learning_rate": 6.345877844171343e-05, "loss": 2.3784, "step": 33096 }, { "epoch": 0.89, "learning_rate": 6.342826974972094e-05, "loss": 2.3406, "step": 33097 }, { "epoch": 0.89, "learning_rate": 6.339776815302844e-05, "loss": 2.3781, "step": 33098 }, { "epoch": 0.89, "learning_rate": 6.336727365186712e-05, "loss": 2.7424, "step": 33099 }, { "epoch": 0.89, "learning_rate": 6.333678624646777e-05, "loss": 2.6348, "step": 33100 }, { "epoch": 0.89, "learning_rate": 6.330630593706155e-05, "loss": 2.4581, "step": 33101 }, { "epoch": 0.89, "learning_rate": 6.327583272387905e-05, "loss": 2.4195, "step": 33102 }, { "epoch": 0.89, "learning_rate": 6.324536660715152e-05, "loss": 2.5047, "step": 33103 }, { "epoch": 0.89, "learning_rate": 6.321490758710968e-05, "loss": 2.6917, "step": 33104 }, { "epoch": 0.89, "learning_rate": 6.318445566398423e-05, "loss": 2.3212, "step": 33105 }, { "epoch": 0.89, "learning_rate": 6.315401083800576e-05, "loss": 2.4266, "step": 33106 }, { "epoch": 0.89, "learning_rate": 6.312357310940509e-05, "loss": 2.5811, "step": 33107 }, { "epoch": 0.89, "learning_rate": 6.30931424784127e-05, "loss": 2.2219, "step": 33108 }, { "epoch": 0.89, "learning_rate": 6.306271894525905e-05, "loss": 2.4447, "step": 33109 }, { "epoch": 0.89, "learning_rate": 6.303230251017488e-05, "loss": 2.7404, "step": 33110 }, { "epoch": 0.89, "learning_rate": 6.300189317339034e-05, "loss": 2.5694, "step": 33111 }, { "epoch": 0.89, "learning_rate": 6.297149093513622e-05, "loss": 2.0868, "step": 33112 }, { "epoch": 0.89, "learning_rate": 6.294109579564222e-05, "loss": 2.5661, "step": 33113 }, { "epoch": 0.89, "learning_rate": 6.291070775513907e-05, "loss": 2.3308, "step": 33114 }, { "epoch": 0.89, "learning_rate": 6.288032681385691e-05, "loss": 2.4651, "step": 33115 }, { "epoch": 0.89, "learning_rate": 6.284995297202578e-05, "loss": 1.9585, "step": 33116 }, { "epoch": 0.89, "learning_rate": 6.281958622987604e-05, "loss": 2.773, "step": 33117 }, { "epoch": 0.89, "learning_rate": 6.278922658763742e-05, "loss": 2.7452, "step": 33118 }, { "epoch": 0.89, "learning_rate": 6.275887404554004e-05, "loss": 2.8087, "step": 33119 }, { "epoch": 0.89, "learning_rate": 6.272852860381395e-05, "loss": 2.5317, "step": 33120 }, { "epoch": 0.89, "learning_rate": 6.269819026268885e-05, "loss": 2.4772, "step": 33121 }, { "epoch": 0.89, "learning_rate": 6.26678590223947e-05, "loss": 2.6391, "step": 33122 }, { "epoch": 0.89, "learning_rate": 6.263753488316126e-05, "loss": 2.3969, "step": 33123 }, { "epoch": 0.89, "learning_rate": 6.260721784521839e-05, "loss": 2.7227, "step": 33124 }, { "epoch": 0.89, "learning_rate": 6.257690790879555e-05, "loss": 2.6448, "step": 33125 }, { "epoch": 0.89, "learning_rate": 6.254660507412258e-05, "loss": 2.6167, "step": 33126 }, { "epoch": 0.89, "learning_rate": 6.251630934142882e-05, "loss": 2.0236, "step": 33127 }, { "epoch": 0.89, "learning_rate": 6.248602071094389e-05, "loss": 2.5598, "step": 33128 }, { "epoch": 0.89, "learning_rate": 6.245573918289715e-05, "loss": 2.6111, "step": 33129 }, { "epoch": 0.89, "learning_rate": 6.242546475751832e-05, "loss": 2.487, "step": 33130 }, { "epoch": 0.89, "learning_rate": 6.239519743503652e-05, "loss": 2.8196, "step": 33131 }, { "epoch": 0.89, "learning_rate": 6.236493721568104e-05, "loss": 2.6734, "step": 33132 }, { "epoch": 0.89, "learning_rate": 6.233468409968112e-05, "loss": 2.3721, "step": 33133 }, { "epoch": 0.89, "learning_rate": 6.230443808726616e-05, "loss": 2.1983, "step": 33134 }, { "epoch": 0.89, "learning_rate": 6.227419917866494e-05, "loss": 1.9687, "step": 33135 }, { "epoch": 0.89, "learning_rate": 6.224396737410676e-05, "loss": 2.2818, "step": 33136 }, { "epoch": 0.89, "learning_rate": 6.221374267382063e-05, "loss": 2.8818, "step": 33137 }, { "epoch": 0.89, "learning_rate": 6.218352507803549e-05, "loss": 2.3845, "step": 33138 }, { "epoch": 0.89, "learning_rate": 6.215331458698047e-05, "loss": 3.1105, "step": 33139 }, { "epoch": 0.89, "learning_rate": 6.21231112008841e-05, "loss": 2.4954, "step": 33140 }, { "epoch": 0.89, "learning_rate": 6.209291491997538e-05, "loss": 2.6103, "step": 33141 }, { "epoch": 0.89, "learning_rate": 6.206272574448312e-05, "loss": 2.9261, "step": 33142 }, { "epoch": 0.89, "learning_rate": 6.203254367463585e-05, "loss": 2.4477, "step": 33143 }, { "epoch": 0.89, "learning_rate": 6.200236871066255e-05, "loss": 2.785, "step": 33144 }, { "epoch": 0.89, "learning_rate": 6.197220085279143e-05, "loss": 2.4788, "step": 33145 }, { "epoch": 0.89, "learning_rate": 6.194204010125126e-05, "loss": 2.147, "step": 33146 }, { "epoch": 0.89, "learning_rate": 6.191188645627066e-05, "loss": 2.7033, "step": 33147 }, { "epoch": 0.89, "learning_rate": 6.188173991807767e-05, "loss": 2.3044, "step": 33148 }, { "epoch": 0.89, "learning_rate": 6.185160048690075e-05, "loss": 2.5124, "step": 33149 }, { "epoch": 0.89, "learning_rate": 6.182146816296874e-05, "loss": 2.1342, "step": 33150 }, { "epoch": 0.89, "learning_rate": 6.179134294650934e-05, "loss": 2.2121, "step": 33151 }, { "epoch": 0.89, "learning_rate": 6.176122483775115e-05, "loss": 2.1063, "step": 33152 }, { "epoch": 0.89, "learning_rate": 6.173111383692209e-05, "loss": 2.8895, "step": 33153 }, { "epoch": 0.89, "learning_rate": 6.170100994425032e-05, "loss": 2.559, "step": 33154 }, { "epoch": 0.89, "learning_rate": 6.167091315996387e-05, "loss": 2.5619, "step": 33155 }, { "epoch": 0.89, "learning_rate": 6.16408234842909e-05, "loss": 2.0569, "step": 33156 }, { "epoch": 0.89, "learning_rate": 6.161074091745933e-05, "loss": 2.2205, "step": 33157 }, { "epoch": 0.89, "learning_rate": 6.158066545969709e-05, "loss": 2.7184, "step": 33158 }, { "epoch": 0.89, "learning_rate": 6.15505971112319e-05, "loss": 2.5861, "step": 33159 }, { "epoch": 0.89, "learning_rate": 6.152053587229156e-05, "loss": 2.5208, "step": 33160 }, { "epoch": 0.89, "learning_rate": 6.149048174310401e-05, "loss": 2.3641, "step": 33161 }, { "epoch": 0.89, "learning_rate": 6.146043472389639e-05, "loss": 2.1856, "step": 33162 }, { "epoch": 0.89, "learning_rate": 6.14303948148971e-05, "loss": 2.581, "step": 33163 }, { "epoch": 0.89, "learning_rate": 6.140036201633325e-05, "loss": 2.2085, "step": 33164 }, { "epoch": 0.89, "learning_rate": 6.137033632843237e-05, "loss": 2.2641, "step": 33165 }, { "epoch": 0.89, "learning_rate": 6.134031775142213e-05, "loss": 2.4148, "step": 33166 }, { "epoch": 0.89, "learning_rate": 6.131030628552981e-05, "loss": 2.3953, "step": 33167 }, { "epoch": 0.89, "learning_rate": 6.128030193098267e-05, "loss": 2.8243, "step": 33168 }, { "epoch": 0.89, "learning_rate": 6.125030468800818e-05, "loss": 2.2692, "step": 33169 }, { "epoch": 0.89, "learning_rate": 6.122031455683353e-05, "loss": 2.3747, "step": 33170 }, { "epoch": 0.89, "learning_rate": 6.119033153768605e-05, "loss": 2.865, "step": 33171 }, { "epoch": 0.89, "learning_rate": 6.11603556307927e-05, "loss": 2.262, "step": 33172 }, { "epoch": 0.89, "learning_rate": 6.113038683638062e-05, "loss": 2.3409, "step": 33173 }, { "epoch": 0.89, "learning_rate": 6.110042515467695e-05, "loss": 2.3336, "step": 33174 }, { "epoch": 0.89, "learning_rate": 6.107047058590843e-05, "loss": 2.5291, "step": 33175 }, { "epoch": 0.89, "learning_rate": 6.104052313030229e-05, "loss": 2.213, "step": 33176 }, { "epoch": 0.89, "learning_rate": 6.1010582788085355e-05, "loss": 2.3363, "step": 33177 }, { "epoch": 0.89, "learning_rate": 6.098064955948423e-05, "loss": 2.4028, "step": 33178 }, { "epoch": 0.89, "learning_rate": 6.0950723444725964e-05, "loss": 2.1138, "step": 33179 }, { "epoch": 0.89, "learning_rate": 6.0920804444037025e-05, "loss": 2.8542, "step": 33180 }, { "epoch": 0.89, "learning_rate": 6.089089255764424e-05, "loss": 2.28, "step": 33181 }, { "epoch": 0.89, "learning_rate": 6.086098778577398e-05, "loss": 2.2386, "step": 33182 }, { "epoch": 0.89, "learning_rate": 6.083109012865318e-05, "loss": 2.6947, "step": 33183 }, { "epoch": 0.89, "learning_rate": 6.080119958650798e-05, "loss": 2.3925, "step": 33184 }, { "epoch": 0.89, "learning_rate": 6.0771316159565214e-05, "loss": 2.5137, "step": 33185 }, { "epoch": 0.89, "learning_rate": 6.0741439848050804e-05, "loss": 2.5027, "step": 33186 }, { "epoch": 0.89, "learning_rate": 6.071157065219157e-05, "loss": 2.3493, "step": 33187 }, { "epoch": 0.89, "learning_rate": 6.0681708572213115e-05, "loss": 2.5683, "step": 33188 }, { "epoch": 0.89, "learning_rate": 6.0651853608342355e-05, "loss": 2.3958, "step": 33189 }, { "epoch": 0.89, "learning_rate": 6.062200576080534e-05, "loss": 2.1085, "step": 33190 }, { "epoch": 0.89, "learning_rate": 6.0592165029828004e-05, "loss": 2.6339, "step": 33191 }, { "epoch": 0.89, "learning_rate": 6.056233141563638e-05, "loss": 2.7654, "step": 33192 }, { "epoch": 0.89, "learning_rate": 6.0532504918456745e-05, "loss": 2.2725, "step": 33193 }, { "epoch": 0.89, "learning_rate": 6.050268553851468e-05, "loss": 2.2707, "step": 33194 }, { "epoch": 0.89, "learning_rate": 6.047287327603634e-05, "loss": 2.3057, "step": 33195 }, { "epoch": 0.89, "learning_rate": 6.0443068131247555e-05, "loss": 2.775, "step": 33196 }, { "epoch": 0.89, "learning_rate": 6.041327010437414e-05, "loss": 2.3604, "step": 33197 }, { "epoch": 0.89, "learning_rate": 6.038347919564191e-05, "loss": 2.4762, "step": 33198 }, { "epoch": 0.89, "learning_rate": 6.0353695405276355e-05, "loss": 2.3468, "step": 33199 }, { "epoch": 0.89, "learning_rate": 6.032391873350318e-05, "loss": 2.1942, "step": 33200 }, { "epoch": 0.89, "learning_rate": 6.029414918054798e-05, "loss": 2.1835, "step": 33201 }, { "epoch": 0.89, "learning_rate": 6.026438674663626e-05, "loss": 2.5397, "step": 33202 }, { "epoch": 0.89, "learning_rate": 6.023463143199359e-05, "loss": 2.2228, "step": 33203 }, { "epoch": 0.89, "learning_rate": 6.020488323684559e-05, "loss": 3.0225, "step": 33204 }, { "epoch": 0.89, "learning_rate": 6.0175142161417064e-05, "loss": 2.2175, "step": 33205 }, { "epoch": 0.89, "learning_rate": 6.014540820593384e-05, "loss": 2.394, "step": 33206 }, { "epoch": 0.89, "learning_rate": 6.0115681370620844e-05, "loss": 2.3968, "step": 33207 }, { "epoch": 0.89, "learning_rate": 6.0085961655703235e-05, "loss": 2.6957, "step": 33208 }, { "epoch": 0.89, "learning_rate": 6.005624906140672e-05, "loss": 2.2009, "step": 33209 }, { "epoch": 0.89, "learning_rate": 6.002654358795579e-05, "loss": 2.3051, "step": 33210 }, { "epoch": 0.89, "learning_rate": 5.999684523557569e-05, "loss": 2.498, "step": 33211 }, { "epoch": 0.89, "learning_rate": 5.99671540044916e-05, "loss": 2.6514, "step": 33212 }, { "epoch": 0.89, "learning_rate": 5.993746989492821e-05, "loss": 2.512, "step": 33213 }, { "epoch": 0.89, "learning_rate": 5.990779290711046e-05, "loss": 2.3395, "step": 33214 }, { "epoch": 0.89, "learning_rate": 5.9878123041263164e-05, "loss": 2.6785, "step": 33215 }, { "epoch": 0.89, "learning_rate": 5.984846029761104e-05, "loss": 2.669, "step": 33216 }, { "epoch": 0.89, "learning_rate": 5.9818804676379235e-05, "loss": 2.5987, "step": 33217 }, { "epoch": 0.89, "learning_rate": 5.9789156177791795e-05, "loss": 2.4327, "step": 33218 }, { "epoch": 0.89, "learning_rate": 5.9759514802073646e-05, "loss": 2.5778, "step": 33219 }, { "epoch": 0.89, "learning_rate": 5.97298805494495e-05, "loss": 2.2919, "step": 33220 }, { "epoch": 0.89, "learning_rate": 5.970025342014329e-05, "loss": 2.2688, "step": 33221 }, { "epoch": 0.89, "learning_rate": 5.9670633414380174e-05, "loss": 2.2771, "step": 33222 }, { "epoch": 0.89, "learning_rate": 5.9641020532384184e-05, "loss": 2.3952, "step": 33223 }, { "epoch": 0.89, "learning_rate": 5.961141477437959e-05, "loss": 2.5423, "step": 33224 }, { "epoch": 0.89, "learning_rate": 5.958181614059099e-05, "loss": 3.028, "step": 33225 }, { "epoch": 0.89, "learning_rate": 5.955222463124221e-05, "loss": 2.4832, "step": 33226 }, { "epoch": 0.89, "learning_rate": 5.952264024655773e-05, "loss": 2.6834, "step": 33227 }, { "epoch": 0.89, "learning_rate": 5.949306298676149e-05, "loss": 2.3947, "step": 33228 }, { "epoch": 0.89, "learning_rate": 5.946349285207775e-05, "loss": 2.6959, "step": 33229 }, { "epoch": 0.89, "learning_rate": 5.9433929842730324e-05, "loss": 2.7975, "step": 33230 }, { "epoch": 0.89, "learning_rate": 5.940437395894349e-05, "loss": 2.2638, "step": 33231 }, { "epoch": 0.89, "learning_rate": 5.937482520094084e-05, "loss": 2.1684, "step": 33232 }, { "epoch": 0.89, "learning_rate": 5.934528356894653e-05, "loss": 2.4301, "step": 33233 }, { "epoch": 0.89, "learning_rate": 5.931574906318382e-05, "loss": 2.5892, "step": 33234 }, { "epoch": 0.89, "learning_rate": 5.9286221683876986e-05, "loss": 2.823, "step": 33235 }, { "epoch": 0.89, "learning_rate": 5.925670143124973e-05, "loss": 2.3645, "step": 33236 }, { "epoch": 0.89, "learning_rate": 5.9227188305525314e-05, "loss": 2.5679, "step": 33237 }, { "epoch": 0.89, "learning_rate": 5.919768230692746e-05, "loss": 2.4412, "step": 33238 }, { "epoch": 0.89, "learning_rate": 5.9168183435679976e-05, "loss": 2.1496, "step": 33239 }, { "epoch": 0.89, "learning_rate": 5.913869169200603e-05, "loss": 2.4411, "step": 33240 }, { "epoch": 0.89, "learning_rate": 5.9109207076129104e-05, "loss": 2.1904, "step": 33241 }, { "epoch": 0.89, "learning_rate": 5.907972958827268e-05, "loss": 2.525, "step": 33242 }, { "epoch": 0.89, "learning_rate": 5.905025922865992e-05, "loss": 2.1638, "step": 33243 }, { "epoch": 0.89, "learning_rate": 5.902079599751431e-05, "loss": 2.0879, "step": 33244 }, { "epoch": 0.89, "learning_rate": 5.899133989505878e-05, "loss": 2.573, "step": 33245 }, { "epoch": 0.89, "learning_rate": 5.8961890921516716e-05, "loss": 2.6584, "step": 33246 }, { "epoch": 0.89, "learning_rate": 5.893244907711104e-05, "loss": 2.4353, "step": 33247 }, { "epoch": 0.89, "learning_rate": 5.89030143620648e-05, "loss": 2.5981, "step": 33248 }, { "epoch": 0.89, "learning_rate": 5.887358677660137e-05, "loss": 2.4745, "step": 33249 }, { "epoch": 0.89, "learning_rate": 5.884416632094314e-05, "loss": 2.8426, "step": 33250 }, { "epoch": 0.89, "learning_rate": 5.8814752995313356e-05, "loss": 2.2805, "step": 33251 }, { "epoch": 0.89, "learning_rate": 5.8785346799934744e-05, "loss": 2.4054, "step": 33252 }, { "epoch": 0.89, "learning_rate": 5.875594773503001e-05, "loss": 2.6372, "step": 33253 }, { "epoch": 0.89, "learning_rate": 5.872655580082198e-05, "loss": 2.2966, "step": 33254 }, { "epoch": 0.89, "learning_rate": 5.8697170997533133e-05, "loss": 2.565, "step": 33255 }, { "epoch": 0.89, "learning_rate": 5.86677933253863e-05, "loss": 2.6843, "step": 33256 }, { "epoch": 0.89, "learning_rate": 5.8638422784604184e-05, "loss": 2.3709, "step": 33257 }, { "epoch": 0.89, "learning_rate": 5.860905937540883e-05, "loss": 2.4884, "step": 33258 }, { "epoch": 0.89, "learning_rate": 5.857970309802308e-05, "loss": 2.354, "step": 33259 }, { "epoch": 0.89, "learning_rate": 5.8550353952669054e-05, "loss": 2.7218, "step": 33260 }, { "epoch": 0.89, "learning_rate": 5.852101193956927e-05, "loss": 2.4189, "step": 33261 }, { "epoch": 0.89, "learning_rate": 5.849167705894598e-05, "loss": 2.2459, "step": 33262 }, { "epoch": 0.89, "learning_rate": 5.8462349311021565e-05, "loss": 2.2988, "step": 33263 }, { "epoch": 0.89, "learning_rate": 5.843302869601785e-05, "loss": 2.3673, "step": 33264 }, { "epoch": 0.89, "learning_rate": 5.840371521415744e-05, "loss": 2.4941, "step": 33265 }, { "epoch": 0.89, "learning_rate": 5.837440886566192e-05, "loss": 2.3611, "step": 33266 }, { "epoch": 0.89, "learning_rate": 5.834510965075357e-05, "loss": 2.5372, "step": 33267 }, { "epoch": 0.89, "learning_rate": 5.831581756965432e-05, "loss": 2.7606, "step": 33268 }, { "epoch": 0.89, "learning_rate": 5.828653262258599e-05, "loss": 2.4001, "step": 33269 }, { "epoch": 0.89, "learning_rate": 5.825725480977062e-05, "loss": 2.8685, "step": 33270 }, { "epoch": 0.89, "learning_rate": 5.8227984131430045e-05, "loss": 2.5332, "step": 33271 }, { "epoch": 0.89, "learning_rate": 5.8198720587785744e-05, "loss": 2.908, "step": 33272 }, { "epoch": 0.89, "learning_rate": 5.816946417905955e-05, "loss": 2.7466, "step": 33273 }, { "epoch": 0.89, "learning_rate": 5.814021490547317e-05, "loss": 2.3963, "step": 33274 }, { "epoch": 0.89, "learning_rate": 5.811097276724797e-05, "loss": 2.5098, "step": 33275 }, { "epoch": 0.89, "learning_rate": 5.80817377646059e-05, "loss": 2.5495, "step": 33276 }, { "epoch": 0.89, "learning_rate": 5.805250989776811e-05, "loss": 2.8201, "step": 33277 }, { "epoch": 0.89, "learning_rate": 5.802328916695598e-05, "loss": 3.0536, "step": 33278 }, { "epoch": 0.89, "learning_rate": 5.799407557239123e-05, "loss": 2.4036, "step": 33279 }, { "epoch": 0.89, "learning_rate": 5.796486911429477e-05, "loss": 2.5341, "step": 33280 }, { "epoch": 0.89, "learning_rate": 5.793566979288789e-05, "loss": 2.613, "step": 33281 }, { "epoch": 0.89, "learning_rate": 5.790647760839229e-05, "loss": 2.4714, "step": 33282 }, { "epoch": 0.89, "learning_rate": 5.787729256102858e-05, "loss": 2.5499, "step": 33283 }, { "epoch": 0.89, "learning_rate": 5.7848114651018245e-05, "loss": 2.3649, "step": 33284 }, { "epoch": 0.89, "learning_rate": 5.781894387858189e-05, "loss": 2.3617, "step": 33285 }, { "epoch": 0.89, "learning_rate": 5.778978024394088e-05, "loss": 2.2424, "step": 33286 }, { "epoch": 0.89, "learning_rate": 5.7760623747316055e-05, "loss": 2.1373, "step": 33287 }, { "epoch": 0.89, "learning_rate": 5.773147438892823e-05, "loss": 2.0779, "step": 33288 }, { "epoch": 0.89, "learning_rate": 5.770233216899834e-05, "loss": 2.4191, "step": 33289 }, { "epoch": 0.89, "learning_rate": 5.767319708774732e-05, "loss": 2.5215, "step": 33290 }, { "epoch": 0.89, "learning_rate": 5.7644069145395436e-05, "loss": 2.3281, "step": 33291 }, { "epoch": 0.89, "learning_rate": 5.7614948342163744e-05, "loss": 2.3837, "step": 33292 }, { "epoch": 0.89, "learning_rate": 5.758583467827261e-05, "loss": 2.599, "step": 33293 }, { "epoch": 0.89, "learning_rate": 5.755672815394264e-05, "loss": 2.4787, "step": 33294 }, { "epoch": 0.89, "learning_rate": 5.752762876939455e-05, "loss": 2.3536, "step": 33295 }, { "epoch": 0.89, "learning_rate": 5.74985365248486e-05, "loss": 2.175, "step": 33296 }, { "epoch": 0.89, "learning_rate": 5.7469451420525175e-05, "loss": 2.3118, "step": 33297 }, { "epoch": 0.89, "learning_rate": 5.744037345664488e-05, "loss": 2.4109, "step": 33298 }, { "epoch": 0.89, "learning_rate": 5.741130263342764e-05, "loss": 2.5101, "step": 33299 }, { "epoch": 0.89, "learning_rate": 5.738223895109384e-05, "loss": 2.3342, "step": 33300 }, { "epoch": 0.89, "learning_rate": 5.735318240986365e-05, "loss": 2.2182, "step": 33301 }, { "epoch": 0.89, "learning_rate": 5.732413300995731e-05, "loss": 2.292, "step": 33302 }, { "epoch": 0.89, "learning_rate": 5.729509075159489e-05, "loss": 2.1844, "step": 33303 }, { "epoch": 0.9, "learning_rate": 5.726605563499609e-05, "loss": 2.4364, "step": 33304 }, { "epoch": 0.9, "learning_rate": 5.723702766038119e-05, "loss": 2.5402, "step": 33305 }, { "epoch": 0.9, "learning_rate": 5.720800682797023e-05, "loss": 2.687, "step": 33306 }, { "epoch": 0.9, "learning_rate": 5.717899313798247e-05, "loss": 2.703, "step": 33307 }, { "epoch": 0.9, "learning_rate": 5.7149986590638305e-05, "loss": 2.6728, "step": 33308 }, { "epoch": 0.9, "learning_rate": 5.7120987186157325e-05, "loss": 2.3925, "step": 33309 }, { "epoch": 0.9, "learning_rate": 5.709199492475914e-05, "loss": 2.2402, "step": 33310 }, { "epoch": 0.9, "learning_rate": 5.7063009806663456e-05, "loss": 2.7389, "step": 33311 }, { "epoch": 0.9, "learning_rate": 5.703403183208977e-05, "loss": 2.5856, "step": 33312 }, { "epoch": 0.9, "learning_rate": 5.700506100125768e-05, "loss": 2.6586, "step": 33313 }, { "epoch": 0.9, "learning_rate": 5.6976097314386575e-05, "loss": 2.5498, "step": 33314 }, { "epoch": 0.9, "learning_rate": 5.6947140771696046e-05, "loss": 2.5769, "step": 33315 }, { "epoch": 0.9, "learning_rate": 5.691819137340537e-05, "loss": 1.8898, "step": 33316 }, { "epoch": 0.9, "learning_rate": 5.6889249119734034e-05, "loss": 2.3315, "step": 33317 }, { "epoch": 0.9, "learning_rate": 5.686031401090086e-05, "loss": 2.071, "step": 33318 }, { "epoch": 0.9, "learning_rate": 5.683138604712557e-05, "loss": 2.4181, "step": 33319 }, { "epoch": 0.9, "learning_rate": 5.680246522862676e-05, "loss": 2.9585, "step": 33320 }, { "epoch": 0.9, "learning_rate": 5.677355155562403e-05, "loss": 2.4564, "step": 33321 }, { "epoch": 0.9, "learning_rate": 5.674464502833632e-05, "loss": 2.0117, "step": 33322 }, { "epoch": 0.9, "learning_rate": 5.6715745646982454e-05, "loss": 2.391, "step": 33323 }, { "epoch": 0.9, "learning_rate": 5.668685341178148e-05, "loss": 2.5167, "step": 33324 }, { "epoch": 0.9, "learning_rate": 5.6657968322952336e-05, "loss": 2.5169, "step": 33325 }, { "epoch": 0.9, "learning_rate": 5.6629090380713624e-05, "loss": 2.4147, "step": 33326 }, { "epoch": 0.9, "learning_rate": 5.6600219585284275e-05, "loss": 2.1152, "step": 33327 }, { "epoch": 0.9, "learning_rate": 5.6571355936883006e-05, "loss": 2.5309, "step": 33328 }, { "epoch": 0.9, "learning_rate": 5.6542499435728534e-05, "loss": 2.5526, "step": 33329 }, { "epoch": 0.9, "learning_rate": 5.651365008203946e-05, "loss": 2.21, "step": 33330 }, { "epoch": 0.9, "learning_rate": 5.648480787603416e-05, "loss": 2.5188, "step": 33331 }, { "epoch": 0.9, "learning_rate": 5.6455972817931355e-05, "loss": 2.7576, "step": 33332 }, { "epoch": 0.9, "learning_rate": 5.6427144907949315e-05, "loss": 2.2524, "step": 33333 }, { "epoch": 0.9, "learning_rate": 5.6398324146306636e-05, "loss": 2.0602, "step": 33334 }, { "epoch": 0.9, "learning_rate": 5.636951053322159e-05, "loss": 2.7803, "step": 33335 }, { "epoch": 0.9, "learning_rate": 5.634070406891234e-05, "loss": 2.7658, "step": 33336 }, { "epoch": 0.9, "learning_rate": 5.631190475359715e-05, "loss": 2.7699, "step": 33337 }, { "epoch": 0.9, "learning_rate": 5.628311258749452e-05, "loss": 2.6951, "step": 33338 }, { "epoch": 0.9, "learning_rate": 5.625432757082205e-05, "loss": 2.2781, "step": 33339 }, { "epoch": 0.9, "learning_rate": 5.622554970379812e-05, "loss": 2.6984, "step": 33340 }, { "epoch": 0.9, "learning_rate": 5.6196778986640664e-05, "loss": 2.0904, "step": 33341 }, { "epoch": 0.9, "learning_rate": 5.616801541956773e-05, "loss": 2.2885, "step": 33342 }, { "epoch": 0.9, "learning_rate": 5.613925900279704e-05, "loss": 2.3836, "step": 33343 }, { "epoch": 0.9, "learning_rate": 5.611050973654685e-05, "loss": 2.7095, "step": 33344 }, { "epoch": 0.9, "learning_rate": 5.608176762103445e-05, "loss": 2.6408, "step": 33345 }, { "epoch": 0.9, "learning_rate": 5.605303265647788e-05, "loss": 2.8828, "step": 33346 }, { "epoch": 0.9, "learning_rate": 5.602430484309484e-05, "loss": 2.3481, "step": 33347 }, { "epoch": 0.9, "learning_rate": 5.5995584181102847e-05, "loss": 2.8377, "step": 33348 }, { "epoch": 0.9, "learning_rate": 5.5966870670719596e-05, "loss": 2.5188, "step": 33349 }, { "epoch": 0.9, "learning_rate": 5.5938164312162474e-05, "loss": 2.2729, "step": 33350 }, { "epoch": 0.9, "learning_rate": 5.590946510564909e-05, "loss": 2.6137, "step": 33351 }, { "epoch": 0.9, "learning_rate": 5.588077305139683e-05, "loss": 2.5382, "step": 33352 }, { "epoch": 0.9, "learning_rate": 5.585208814962295e-05, "loss": 2.6335, "step": 33353 }, { "epoch": 0.9, "learning_rate": 5.582341040054495e-05, "loss": 2.1465, "step": 33354 }, { "epoch": 0.9, "learning_rate": 5.579473980437988e-05, "loss": 2.5618, "step": 33355 }, { "epoch": 0.9, "learning_rate": 5.576607636134512e-05, "loss": 2.0713, "step": 33356 }, { "epoch": 0.9, "learning_rate": 5.573742007165783e-05, "loss": 2.2797, "step": 33357 }, { "epoch": 0.9, "learning_rate": 5.5708770935534835e-05, "loss": 2.3392, "step": 33358 }, { "epoch": 0.9, "learning_rate": 5.5680128953193524e-05, "loss": 2.7743, "step": 33359 }, { "epoch": 0.9, "learning_rate": 5.56514941248506e-05, "loss": 2.4979, "step": 33360 }, { "epoch": 0.9, "learning_rate": 5.562286645072323e-05, "loss": 2.4616, "step": 33361 }, { "epoch": 0.9, "learning_rate": 5.5594245931028245e-05, "loss": 2.4746, "step": 33362 }, { "epoch": 0.9, "learning_rate": 5.556563256598224e-05, "loss": 2.2412, "step": 33363 }, { "epoch": 0.9, "learning_rate": 5.5537026355802266e-05, "loss": 2.2902, "step": 33364 }, { "epoch": 0.9, "learning_rate": 5.5508427300704935e-05, "loss": 2.4001, "step": 33365 }, { "epoch": 0.9, "learning_rate": 5.547983540090684e-05, "loss": 2.3825, "step": 33366 }, { "epoch": 0.9, "learning_rate": 5.5451250656624486e-05, "loss": 2.9996, "step": 33367 }, { "epoch": 0.9, "learning_rate": 5.542267306807491e-05, "loss": 2.5805, "step": 33368 }, { "epoch": 0.9, "learning_rate": 5.5394102635474174e-05, "loss": 2.2551, "step": 33369 }, { "epoch": 0.9, "learning_rate": 5.536553935903887e-05, "loss": 2.3455, "step": 33370 }, { "epoch": 0.9, "learning_rate": 5.533698323898529e-05, "loss": 2.4682, "step": 33371 }, { "epoch": 0.9, "learning_rate": 5.530843427552978e-05, "loss": 2.6735, "step": 33372 }, { "epoch": 0.9, "learning_rate": 5.527989246888876e-05, "loss": 2.0821, "step": 33373 }, { "epoch": 0.9, "learning_rate": 5.525135781927826e-05, "loss": 2.1001, "step": 33374 }, { "epoch": 0.9, "learning_rate": 5.522283032691466e-05, "loss": 2.1983, "step": 33375 }, { "epoch": 0.9, "learning_rate": 5.5194309992014026e-05, "loss": 2.62, "step": 33376 }, { "epoch": 0.9, "learning_rate": 5.516579681479239e-05, "loss": 2.4479, "step": 33377 }, { "epoch": 0.9, "learning_rate": 5.513729079546581e-05, "loss": 2.5812, "step": 33378 }, { "epoch": 0.9, "learning_rate": 5.510879193424989e-05, "loss": 2.7379, "step": 33379 }, { "epoch": 0.9, "learning_rate": 5.5080300231361014e-05, "loss": 2.8326, "step": 33380 }, { "epoch": 0.9, "learning_rate": 5.505181568701501e-05, "loss": 2.6723, "step": 33381 }, { "epoch": 0.9, "learning_rate": 5.502333830142725e-05, "loss": 2.1734, "step": 33382 }, { "epoch": 0.9, "learning_rate": 5.499486807481391e-05, "loss": 2.3545, "step": 33383 }, { "epoch": 0.9, "learning_rate": 5.4966405007390474e-05, "loss": 2.7435, "step": 33384 }, { "epoch": 0.9, "learning_rate": 5.493794909937255e-05, "loss": 2.9182, "step": 33385 }, { "epoch": 0.9, "learning_rate": 5.490950035097575e-05, "loss": 2.7432, "step": 33386 }, { "epoch": 0.9, "learning_rate": 5.488105876241556e-05, "loss": 2.6244, "step": 33387 }, { "epoch": 0.9, "learning_rate": 5.485262433390759e-05, "loss": 2.73, "step": 33388 }, { "epoch": 0.9, "learning_rate": 5.482419706566721e-05, "loss": 2.3763, "step": 33389 }, { "epoch": 0.9, "learning_rate": 5.479577695790972e-05, "loss": 2.576, "step": 33390 }, { "epoch": 0.9, "learning_rate": 5.476736401085025e-05, "loss": 2.8287, "step": 33391 }, { "epoch": 0.9, "learning_rate": 5.473895822470443e-05, "loss": 2.577, "step": 33392 }, { "epoch": 0.9, "learning_rate": 5.4710559599687074e-05, "loss": 2.5873, "step": 33393 }, { "epoch": 0.9, "learning_rate": 5.468216813601368e-05, "loss": 2.6981, "step": 33394 }, { "epoch": 0.9, "learning_rate": 5.465378383389918e-05, "loss": 2.6128, "step": 33395 }, { "epoch": 0.9, "learning_rate": 5.462540669355853e-05, "loss": 2.4424, "step": 33396 }, { "epoch": 0.9, "learning_rate": 5.459703671520699e-05, "loss": 2.5736, "step": 33397 }, { "epoch": 0.9, "learning_rate": 5.4568673899059064e-05, "loss": 2.8947, "step": 33398 }, { "epoch": 0.9, "learning_rate": 5.454031824532979e-05, "loss": 2.1759, "step": 33399 }, { "epoch": 0.9, "learning_rate": 5.4511969754234116e-05, "loss": 2.324, "step": 33400 }, { "epoch": 0.9, "learning_rate": 5.448362842598664e-05, "loss": 2.6642, "step": 33401 }, { "epoch": 0.9, "learning_rate": 5.4455294260802316e-05, "loss": 2.9299, "step": 33402 }, { "epoch": 0.9, "learning_rate": 5.442696725889562e-05, "loss": 3.1177, "step": 33403 }, { "epoch": 0.9, "learning_rate": 5.439864742048106e-05, "loss": 2.6006, "step": 33404 }, { "epoch": 0.9, "learning_rate": 5.4370334745773245e-05, "loss": 2.6659, "step": 33405 }, { "epoch": 0.9, "learning_rate": 5.434202923498677e-05, "loss": 2.7729, "step": 33406 }, { "epoch": 0.9, "learning_rate": 5.431373088833602e-05, "loss": 2.4522, "step": 33407 }, { "epoch": 0.9, "learning_rate": 5.42854397060355e-05, "loss": 2.1121, "step": 33408 }, { "epoch": 0.9, "learning_rate": 5.4257155688299254e-05, "loss": 2.1637, "step": 33409 }, { "epoch": 0.9, "learning_rate": 5.422887883534178e-05, "loss": 2.571, "step": 33410 }, { "epoch": 0.9, "learning_rate": 5.4200609147377345e-05, "loss": 2.7478, "step": 33411 }, { "epoch": 0.9, "learning_rate": 5.4172346624619784e-05, "loss": 2.4927, "step": 33412 }, { "epoch": 0.9, "learning_rate": 5.414409126728348e-05, "loss": 2.5468, "step": 33413 }, { "epoch": 0.9, "learning_rate": 5.411584307558248e-05, "loss": 2.0641, "step": 33414 }, { "epoch": 0.9, "learning_rate": 5.408760204973073e-05, "loss": 2.1841, "step": 33415 }, { "epoch": 0.9, "learning_rate": 5.405936818994228e-05, "loss": 2.2826, "step": 33416 }, { "epoch": 0.9, "learning_rate": 5.403114149643085e-05, "loss": 2.6589, "step": 33417 }, { "epoch": 0.9, "learning_rate": 5.4002921969410365e-05, "loss": 2.467, "step": 33418 }, { "epoch": 0.9, "learning_rate": 5.397470960909456e-05, "loss": 2.385, "step": 33419 }, { "epoch": 0.9, "learning_rate": 5.394650441569726e-05, "loss": 2.5099, "step": 33420 }, { "epoch": 0.9, "learning_rate": 5.391830638943207e-05, "loss": 2.4249, "step": 33421 }, { "epoch": 0.9, "learning_rate": 5.389011553051282e-05, "loss": 2.5398, "step": 33422 }, { "epoch": 0.9, "learning_rate": 5.386193183915278e-05, "loss": 2.4727, "step": 33423 }, { "epoch": 0.9, "learning_rate": 5.383375531556578e-05, "loss": 2.0951, "step": 33424 }, { "epoch": 0.9, "learning_rate": 5.380558595996487e-05, "loss": 2.6145, "step": 33425 }, { "epoch": 0.9, "learning_rate": 5.377742377256356e-05, "loss": 2.1828, "step": 33426 }, { "epoch": 0.9, "learning_rate": 5.3749268753575557e-05, "loss": 2.2121, "step": 33427 }, { "epoch": 0.9, "learning_rate": 5.3721120903213794e-05, "loss": 2.3139, "step": 33428 }, { "epoch": 0.9, "learning_rate": 5.3692980221691664e-05, "loss": 2.1106, "step": 33429 }, { "epoch": 0.9, "learning_rate": 5.366484670922245e-05, "loss": 2.6016, "step": 33430 }, { "epoch": 0.9, "learning_rate": 5.363672036601907e-05, "loss": 2.4345, "step": 33431 }, { "epoch": 0.9, "learning_rate": 5.360860119229472e-05, "loss": 2.7268, "step": 33432 }, { "epoch": 0.9, "learning_rate": 5.3580489188262305e-05, "loss": 2.1414, "step": 33433 }, { "epoch": 0.9, "learning_rate": 5.355238435413501e-05, "loss": 2.1026, "step": 33434 }, { "epoch": 0.9, "learning_rate": 5.3524286690125766e-05, "loss": 2.8073, "step": 33435 }, { "epoch": 0.9, "learning_rate": 5.349619619644708e-05, "loss": 2.3672, "step": 33436 }, { "epoch": 0.9, "learning_rate": 5.34681128733121e-05, "loss": 2.4626, "step": 33437 }, { "epoch": 0.9, "learning_rate": 5.344003672093356e-05, "loss": 2.5002, "step": 33438 }, { "epoch": 0.9, "learning_rate": 5.341196773952372e-05, "loss": 2.5689, "step": 33439 }, { "epoch": 0.9, "learning_rate": 5.338390592929598e-05, "loss": 2.8641, "step": 33440 }, { "epoch": 0.9, "learning_rate": 5.3355851290462385e-05, "loss": 2.3946, "step": 33441 }, { "epoch": 0.9, "learning_rate": 5.3327803823235546e-05, "loss": 2.609, "step": 33442 }, { "epoch": 0.9, "learning_rate": 5.3299763527828174e-05, "loss": 2.2702, "step": 33443 }, { "epoch": 0.9, "learning_rate": 5.3271730404452434e-05, "loss": 2.4845, "step": 33444 }, { "epoch": 0.9, "learning_rate": 5.324370445332083e-05, "loss": 2.0465, "step": 33445 }, { "epoch": 0.9, "learning_rate": 5.3215685674645634e-05, "loss": 2.878, "step": 33446 }, { "epoch": 0.9, "learning_rate": 5.3187674068639004e-05, "loss": 2.6567, "step": 33447 }, { "epoch": 0.9, "learning_rate": 5.3159669635513554e-05, "loss": 2.2325, "step": 33448 }, { "epoch": 0.9, "learning_rate": 5.3131672375481e-05, "loss": 2.9405, "step": 33449 }, { "epoch": 0.9, "learning_rate": 5.310368228875362e-05, "loss": 2.4586, "step": 33450 }, { "epoch": 0.9, "learning_rate": 5.307569937554357e-05, "loss": 2.3796, "step": 33451 }, { "epoch": 0.9, "learning_rate": 5.304772363606247e-05, "loss": 2.3276, "step": 33452 }, { "epoch": 0.9, "learning_rate": 5.30197550705227e-05, "loss": 2.6663, "step": 33453 }, { "epoch": 0.9, "learning_rate": 5.299179367913609e-05, "loss": 2.3726, "step": 33454 }, { "epoch": 0.9, "learning_rate": 5.296383946211414e-05, "loss": 2.1301, "step": 33455 }, { "epoch": 0.9, "learning_rate": 5.29358924196689e-05, "loss": 2.3969, "step": 33456 }, { "epoch": 0.9, "learning_rate": 5.290795255201208e-05, "loss": 2.7023, "step": 33457 }, { "epoch": 0.9, "learning_rate": 5.28800198593552e-05, "loss": 2.251, "step": 33458 }, { "epoch": 0.9, "learning_rate": 5.285209434190985e-05, "loss": 2.4449, "step": 33459 }, { "epoch": 0.9, "learning_rate": 5.282417599988787e-05, "loss": 2.4692, "step": 33460 }, { "epoch": 0.9, "learning_rate": 5.279626483350053e-05, "loss": 2.3213, "step": 33461 }, { "epoch": 0.9, "learning_rate": 5.276836084295944e-05, "loss": 2.327, "step": 33462 }, { "epoch": 0.9, "learning_rate": 5.2740464028475766e-05, "loss": 2.4484, "step": 33463 }, { "epoch": 0.9, "learning_rate": 5.2712574390261e-05, "loss": 2.6032, "step": 33464 }, { "epoch": 0.9, "learning_rate": 5.268469192852643e-05, "loss": 2.3026, "step": 33465 }, { "epoch": 0.9, "learning_rate": 5.265681664348321e-05, "loss": 2.4724, "step": 33466 }, { "epoch": 0.9, "learning_rate": 5.262894853534283e-05, "loss": 2.1074, "step": 33467 }, { "epoch": 0.9, "learning_rate": 5.2601087604315925e-05, "loss": 2.5276, "step": 33468 }, { "epoch": 0.9, "learning_rate": 5.2573233850613854e-05, "loss": 2.5579, "step": 33469 }, { "epoch": 0.9, "learning_rate": 5.2545387274447685e-05, "loss": 2.7921, "step": 33470 }, { "epoch": 0.9, "learning_rate": 5.251754787602814e-05, "loss": 2.3389, "step": 33471 }, { "epoch": 0.9, "learning_rate": 5.248971565556626e-05, "loss": 2.6199, "step": 33472 }, { "epoch": 0.9, "learning_rate": 5.2461890613272887e-05, "loss": 2.2833, "step": 33473 }, { "epoch": 0.9, "learning_rate": 5.243407274935885e-05, "loss": 2.3937, "step": 33474 }, { "epoch": 0.9, "learning_rate": 5.240626206403498e-05, "loss": 2.3027, "step": 33475 }, { "epoch": 0.9, "learning_rate": 5.237845855751178e-05, "loss": 2.5262, "step": 33476 }, { "epoch": 0.9, "learning_rate": 5.2350662229999846e-05, "loss": 2.6812, "step": 33477 }, { "epoch": 0.9, "learning_rate": 5.232287308170991e-05, "loss": 2.1448, "step": 33478 }, { "epoch": 0.9, "learning_rate": 5.229509111285258e-05, "loss": 2.207, "step": 33479 }, { "epoch": 0.9, "learning_rate": 5.226731632363801e-05, "loss": 2.2853, "step": 33480 }, { "epoch": 0.9, "learning_rate": 5.223954871427716e-05, "loss": 2.8511, "step": 33481 }, { "epoch": 0.9, "learning_rate": 5.221178828497974e-05, "loss": 2.097, "step": 33482 }, { "epoch": 0.9, "learning_rate": 5.218403503595659e-05, "loss": 2.6493, "step": 33483 }, { "epoch": 0.9, "learning_rate": 5.215628896741753e-05, "loss": 2.6148, "step": 33484 }, { "epoch": 0.9, "learning_rate": 5.2128550079573064e-05, "loss": 2.4979, "step": 33485 }, { "epoch": 0.9, "learning_rate": 5.210081837263314e-05, "loss": 2.9925, "step": 33486 }, { "epoch": 0.9, "learning_rate": 5.207309384680803e-05, "loss": 2.5893, "step": 33487 }, { "epoch": 0.9, "learning_rate": 5.204537650230756e-05, "loss": 2.379, "step": 33488 }, { "epoch": 0.9, "learning_rate": 5.201766633934213e-05, "loss": 2.2438, "step": 33489 }, { "epoch": 0.9, "learning_rate": 5.198996335812112e-05, "loss": 2.7438, "step": 33490 }, { "epoch": 0.9, "learning_rate": 5.196226755885469e-05, "loss": 2.3619, "step": 33491 }, { "epoch": 0.9, "learning_rate": 5.193457894175269e-05, "loss": 2.1989, "step": 33492 }, { "epoch": 0.9, "learning_rate": 5.190689750702482e-05, "loss": 2.6088, "step": 33493 }, { "epoch": 0.9, "learning_rate": 5.187922325488081e-05, "loss": 2.2399, "step": 33494 }, { "epoch": 0.9, "learning_rate": 5.185155618553028e-05, "loss": 2.3462, "step": 33495 }, { "epoch": 0.9, "learning_rate": 5.1823896299182824e-05, "loss": 2.6896, "step": 33496 }, { "epoch": 0.9, "learning_rate": 5.179624359604807e-05, "loss": 2.1606, "step": 33497 }, { "epoch": 0.9, "learning_rate": 5.176859807633538e-05, "loss": 2.6043, "step": 33498 }, { "epoch": 0.9, "learning_rate": 5.174095974025417e-05, "loss": 2.5621, "step": 33499 }, { "epoch": 0.9, "learning_rate": 5.171332858801414e-05, "loss": 2.2528, "step": 33500 }, { "epoch": 0.9, "learning_rate": 5.168570461982425e-05, "loss": 2.6975, "step": 33501 }, { "epoch": 0.9, "learning_rate": 5.1658087835894095e-05, "loss": 2.3711, "step": 33502 }, { "epoch": 0.9, "learning_rate": 5.163047823643252e-05, "loss": 2.497, "step": 33503 }, { "epoch": 0.9, "learning_rate": 5.1602875821648907e-05, "loss": 2.4725, "step": 33504 }, { "epoch": 0.9, "learning_rate": 5.1575280591752314e-05, "loss": 2.3579, "step": 33505 }, { "epoch": 0.9, "learning_rate": 5.154769254695191e-05, "loss": 2.5116, "step": 33506 }, { "epoch": 0.9, "learning_rate": 5.152011168745663e-05, "loss": 2.3865, "step": 33507 }, { "epoch": 0.9, "learning_rate": 5.1492538013475535e-05, "loss": 2.0294, "step": 33508 }, { "epoch": 0.9, "learning_rate": 5.146497152521723e-05, "loss": 2.8299, "step": 33509 }, { "epoch": 0.9, "learning_rate": 5.143741222289078e-05, "loss": 2.4779, "step": 33510 }, { "epoch": 0.9, "learning_rate": 5.1409860106704895e-05, "loss": 2.8917, "step": 33511 }, { "epoch": 0.9, "learning_rate": 5.138231517686809e-05, "loss": 2.218, "step": 33512 }, { "epoch": 0.9, "learning_rate": 5.135477743358963e-05, "loss": 2.3385, "step": 33513 }, { "epoch": 0.9, "learning_rate": 5.132724687707757e-05, "loss": 2.4908, "step": 33514 }, { "epoch": 0.9, "learning_rate": 5.1299723507540755e-05, "loss": 2.244, "step": 33515 }, { "epoch": 0.9, "learning_rate": 5.127220732518767e-05, "loss": 2.572, "step": 33516 }, { "epoch": 0.9, "learning_rate": 5.1244698330226605e-05, "loss": 2.7654, "step": 33517 }, { "epoch": 0.9, "learning_rate": 5.121719652286616e-05, "loss": 2.5436, "step": 33518 }, { "epoch": 0.9, "learning_rate": 5.118970190331451e-05, "loss": 2.6316, "step": 33519 }, { "epoch": 0.9, "learning_rate": 5.1162214471780155e-05, "loss": 2.7127, "step": 33520 }, { "epoch": 0.9, "learning_rate": 5.113473422847126e-05, "loss": 2.1215, "step": 33521 }, { "epoch": 0.9, "learning_rate": 5.1107261173595877e-05, "loss": 2.0739, "step": 33522 }, { "epoch": 0.9, "learning_rate": 5.107979530736229e-05, "loss": 2.5055, "step": 33523 }, { "epoch": 0.9, "learning_rate": 5.105233662997854e-05, "loss": 2.1924, "step": 33524 }, { "epoch": 0.9, "learning_rate": 5.102488514165249e-05, "loss": 2.1052, "step": 33525 }, { "epoch": 0.9, "learning_rate": 5.099744084259239e-05, "loss": 2.5809, "step": 33526 }, { "epoch": 0.9, "learning_rate": 5.097000373300598e-05, "loss": 2.6698, "step": 33527 }, { "epoch": 0.9, "learning_rate": 5.094257381310119e-05, "loss": 2.1158, "step": 33528 }, { "epoch": 0.9, "learning_rate": 5.0915151083085756e-05, "loss": 2.3743, "step": 33529 }, { "epoch": 0.9, "learning_rate": 5.08877355431675e-05, "loss": 2.0835, "step": 33530 }, { "epoch": 0.9, "learning_rate": 5.086032719355393e-05, "loss": 2.6989, "step": 33531 }, { "epoch": 0.9, "learning_rate": 5.0832926034452886e-05, "loss": 2.3533, "step": 33532 }, { "epoch": 0.9, "learning_rate": 5.0805532066071966e-05, "loss": 2.5764, "step": 33533 }, { "epoch": 0.9, "learning_rate": 5.077814528861857e-05, "loss": 2.3157, "step": 33534 }, { "epoch": 0.9, "learning_rate": 5.0750765702300305e-05, "loss": 2.2108, "step": 33535 }, { "epoch": 0.9, "learning_rate": 5.072339330732445e-05, "loss": 2.4996, "step": 33536 }, { "epoch": 0.9, "learning_rate": 5.0696028103898505e-05, "loss": 2.737, "step": 33537 }, { "epoch": 0.9, "learning_rate": 5.0668670092229755e-05, "loss": 2.1833, "step": 33538 }, { "epoch": 0.9, "learning_rate": 5.0641319272525354e-05, "loss": 2.5491, "step": 33539 }, { "epoch": 0.9, "learning_rate": 5.0613975644992704e-05, "loss": 2.922, "step": 33540 }, { "epoch": 0.9, "learning_rate": 5.0586639209838746e-05, "loss": 2.6799, "step": 33541 }, { "epoch": 0.9, "learning_rate": 5.055930996727065e-05, "loss": 2.3997, "step": 33542 }, { "epoch": 0.9, "learning_rate": 5.0531987917495695e-05, "loss": 2.9105, "step": 33543 }, { "epoch": 0.9, "learning_rate": 5.050467306072048e-05, "loss": 2.6383, "step": 33544 }, { "epoch": 0.9, "learning_rate": 5.047736539715209e-05, "loss": 2.2892, "step": 33545 }, { "epoch": 0.9, "learning_rate": 5.045006492699733e-05, "loss": 2.4619, "step": 33546 }, { "epoch": 0.9, "learning_rate": 5.042277165046327e-05, "loss": 2.4433, "step": 33547 }, { "epoch": 0.9, "learning_rate": 5.039548556775653e-05, "loss": 2.5077, "step": 33548 }, { "epoch": 0.9, "learning_rate": 5.036820667908382e-05, "loss": 2.6606, "step": 33549 }, { "epoch": 0.9, "learning_rate": 5.034093498465164e-05, "loss": 2.5048, "step": 33550 }, { "epoch": 0.9, "learning_rate": 5.031367048466684e-05, "loss": 2.217, "step": 33551 }, { "epoch": 0.9, "learning_rate": 5.028641317933591e-05, "loss": 2.5193, "step": 33552 }, { "epoch": 0.9, "learning_rate": 5.0259163068865466e-05, "loss": 2.6335, "step": 33553 }, { "epoch": 0.9, "learning_rate": 5.0231920153461564e-05, "loss": 2.5711, "step": 33554 }, { "epoch": 0.9, "learning_rate": 5.020468443333093e-05, "loss": 2.28, "step": 33555 }, { "epoch": 0.9, "learning_rate": 5.017745590867984e-05, "loss": 2.2543, "step": 33556 }, { "epoch": 0.9, "learning_rate": 5.015023457971446e-05, "loss": 2.2977, "step": 33557 }, { "epoch": 0.9, "learning_rate": 5.0123020446640963e-05, "loss": 2.3042, "step": 33558 }, { "epoch": 0.9, "learning_rate": 5.0095813509665855e-05, "loss": 2.2406, "step": 33559 }, { "epoch": 0.9, "learning_rate": 5.006861376899496e-05, "loss": 2.5979, "step": 33560 }, { "epoch": 0.9, "learning_rate": 5.004142122483457e-05, "loss": 2.1819, "step": 33561 }, { "epoch": 0.9, "learning_rate": 5.00142358773904e-05, "loss": 2.4338, "step": 33562 }, { "epoch": 0.9, "learning_rate": 4.99870577268684e-05, "loss": 2.6316, "step": 33563 }, { "epoch": 0.9, "learning_rate": 4.995988677347474e-05, "loss": 2.7472, "step": 33564 }, { "epoch": 0.9, "learning_rate": 4.993272301741514e-05, "loss": 2.3065, "step": 33565 }, { "epoch": 0.9, "learning_rate": 4.9905566458895324e-05, "loss": 2.2229, "step": 33566 }, { "epoch": 0.9, "learning_rate": 4.987841709812113e-05, "loss": 2.4769, "step": 33567 }, { "epoch": 0.9, "learning_rate": 4.9851274935298175e-05, "loss": 2.375, "step": 33568 }, { "epoch": 0.9, "learning_rate": 4.9824139970632066e-05, "loss": 2.7769, "step": 33569 }, { "epoch": 0.9, "learning_rate": 4.979701220432853e-05, "loss": 2.2927, "step": 33570 }, { "epoch": 0.9, "learning_rate": 4.976989163659262e-05, "loss": 2.1595, "step": 33571 }, { "epoch": 0.9, "learning_rate": 4.974277826763041e-05, "loss": 2.3153, "step": 33572 }, { "epoch": 0.9, "learning_rate": 4.971567209764693e-05, "loss": 2.2451, "step": 33573 }, { "epoch": 0.9, "learning_rate": 4.9688573126847605e-05, "loss": 2.5561, "step": 33574 }, { "epoch": 0.9, "learning_rate": 4.966148135543791e-05, "loss": 2.5644, "step": 33575 }, { "epoch": 0.9, "learning_rate": 4.9634396783622695e-05, "loss": 2.7682, "step": 33576 }, { "epoch": 0.9, "learning_rate": 4.9607319411607455e-05, "loss": 2.526, "step": 33577 }, { "epoch": 0.9, "learning_rate": 4.958024923959725e-05, "loss": 2.2348, "step": 33578 }, { "epoch": 0.9, "learning_rate": 4.9553186267797144e-05, "loss": 2.186, "step": 33579 }, { "epoch": 0.9, "learning_rate": 4.9526130496412416e-05, "loss": 2.3906, "step": 33580 }, { "epoch": 0.9, "learning_rate": 4.949908192564756e-05, "loss": 2.8753, "step": 33581 }, { "epoch": 0.9, "learning_rate": 4.947204055570764e-05, "loss": 2.4087, "step": 33582 }, { "epoch": 0.9, "learning_rate": 4.944500638679783e-05, "loss": 2.2615, "step": 33583 }, { "epoch": 0.9, "learning_rate": 4.941797941912252e-05, "loss": 2.1302, "step": 33584 }, { "epoch": 0.9, "learning_rate": 4.939095965288665e-05, "loss": 2.3685, "step": 33585 }, { "epoch": 0.9, "learning_rate": 4.936394708829517e-05, "loss": 2.7205, "step": 33586 }, { "epoch": 0.9, "learning_rate": 4.933694172555225e-05, "loss": 2.5385, "step": 33587 }, { "epoch": 0.9, "learning_rate": 4.9309943564862845e-05, "loss": 2.1442, "step": 33588 }, { "epoch": 0.9, "learning_rate": 4.928295260643112e-05, "loss": 2.2833, "step": 33589 }, { "epoch": 0.9, "learning_rate": 4.925596885046191e-05, "loss": 2.3324, "step": 33590 }, { "epoch": 0.9, "learning_rate": 4.922899229715949e-05, "loss": 2.461, "step": 33591 }, { "epoch": 0.9, "learning_rate": 4.920202294672815e-05, "loss": 2.9376, "step": 33592 }, { "epoch": 0.9, "learning_rate": 4.9175060799372396e-05, "loss": 2.5448, "step": 33593 }, { "epoch": 0.9, "learning_rate": 4.91481058552965e-05, "loss": 2.4278, "step": 33594 }, { "epoch": 0.9, "learning_rate": 4.9121158114704414e-05, "loss": 2.4931, "step": 33595 }, { "epoch": 0.9, "learning_rate": 4.9094217577800525e-05, "loss": 2.6723, "step": 33596 }, { "epoch": 0.9, "learning_rate": 4.906728424478857e-05, "loss": 2.5464, "step": 33597 }, { "epoch": 0.9, "learning_rate": 4.904035811587304e-05, "loss": 2.547, "step": 33598 }, { "epoch": 0.9, "learning_rate": 4.901343919125789e-05, "loss": 3.1267, "step": 33599 }, { "epoch": 0.9, "learning_rate": 4.898652747114674e-05, "loss": 2.72, "step": 33600 }, { "epoch": 0.9, "learning_rate": 4.8959622955743634e-05, "loss": 2.3749, "step": 33601 }, { "epoch": 0.9, "learning_rate": 4.893272564525253e-05, "loss": 2.7795, "step": 33602 }, { "epoch": 0.9, "learning_rate": 4.890583553987693e-05, "loss": 2.5417, "step": 33603 }, { "epoch": 0.9, "learning_rate": 4.8878952639820675e-05, "loss": 2.3203, "step": 33604 }, { "epoch": 0.9, "learning_rate": 4.8852076945287374e-05, "loss": 2.3908, "step": 33605 }, { "epoch": 0.9, "learning_rate": 4.882520845648075e-05, "loss": 2.583, "step": 33606 }, { "epoch": 0.9, "learning_rate": 4.879834717360443e-05, "loss": 2.8758, "step": 33607 }, { "epoch": 0.9, "learning_rate": 4.877149309686169e-05, "loss": 2.1122, "step": 33608 }, { "epoch": 0.9, "learning_rate": 4.874464622645591e-05, "loss": 2.6262, "step": 33609 }, { "epoch": 0.9, "learning_rate": 4.8717806562590725e-05, "loss": 2.3423, "step": 33610 }, { "epoch": 0.9, "learning_rate": 4.869097410546941e-05, "loss": 2.0918, "step": 33611 }, { "epoch": 0.9, "learning_rate": 4.866414885529513e-05, "loss": 2.4185, "step": 33612 }, { "epoch": 0.9, "learning_rate": 4.863733081227128e-05, "loss": 1.8274, "step": 33613 }, { "epoch": 0.9, "learning_rate": 4.861051997660082e-05, "loss": 2.8896, "step": 33614 }, { "epoch": 0.9, "learning_rate": 4.8583716348487126e-05, "loss": 2.5027, "step": 33615 }, { "epoch": 0.9, "learning_rate": 4.855691992813294e-05, "loss": 2.3697, "step": 33616 }, { "epoch": 0.9, "learning_rate": 4.853013071574142e-05, "loss": 2.7133, "step": 33617 }, { "epoch": 0.9, "learning_rate": 4.8503348711515514e-05, "loss": 2.1186, "step": 33618 }, { "epoch": 0.9, "learning_rate": 4.847657391565818e-05, "loss": 2.8586, "step": 33619 }, { "epoch": 0.9, "learning_rate": 4.844980632837215e-05, "loss": 2.4026, "step": 33620 }, { "epoch": 0.9, "learning_rate": 4.842304594986047e-05, "loss": 2.7655, "step": 33621 }, { "epoch": 0.9, "learning_rate": 4.8396292780325424e-05, "loss": 3.0051, "step": 33622 }, { "epoch": 0.9, "learning_rate": 4.836954681997008e-05, "loss": 2.8243, "step": 33623 }, { "epoch": 0.9, "learning_rate": 4.8342808068996826e-05, "loss": 2.4034, "step": 33624 }, { "epoch": 0.9, "learning_rate": 4.8316076527608275e-05, "loss": 2.4913, "step": 33625 }, { "epoch": 0.9, "learning_rate": 4.8289352196007165e-05, "loss": 2.6399, "step": 33626 }, { "epoch": 0.9, "learning_rate": 4.826263507439565e-05, "loss": 2.2032, "step": 33627 }, { "epoch": 0.9, "learning_rate": 4.823592516297626e-05, "loss": 2.3179, "step": 33628 }, { "epoch": 0.9, "learning_rate": 4.8209222461951474e-05, "loss": 2.0912, "step": 33629 }, { "epoch": 0.9, "learning_rate": 4.8182526971523256e-05, "loss": 2.3446, "step": 33630 }, { "epoch": 0.9, "learning_rate": 4.815583869189411e-05, "loss": 2.2259, "step": 33631 }, { "epoch": 0.9, "learning_rate": 4.81291576232662e-05, "loss": 2.3948, "step": 33632 }, { "epoch": 0.9, "learning_rate": 4.8102483765841474e-05, "loss": 2.5898, "step": 33633 }, { "epoch": 0.9, "learning_rate": 4.807581711982234e-05, "loss": 2.1713, "step": 33634 }, { "epoch": 0.9, "learning_rate": 4.804915768541052e-05, "loss": 2.3503, "step": 33635 }, { "epoch": 0.9, "learning_rate": 4.8022505462808174e-05, "loss": 2.1384, "step": 33636 }, { "epoch": 0.9, "learning_rate": 4.799586045221704e-05, "loss": 2.7657, "step": 33637 }, { "epoch": 0.9, "learning_rate": 4.7969222653838964e-05, "loss": 2.0125, "step": 33638 }, { "epoch": 0.9, "learning_rate": 4.794259206787599e-05, "loss": 2.5972, "step": 33639 }, { "epoch": 0.9, "learning_rate": 4.7915968694529855e-05, "loss": 2.3909, "step": 33640 }, { "epoch": 0.9, "learning_rate": 4.788935253400195e-05, "loss": 2.2974, "step": 33641 }, { "epoch": 0.9, "learning_rate": 4.786274358649423e-05, "loss": 1.9457, "step": 33642 }, { "epoch": 0.9, "learning_rate": 4.783614185220797e-05, "loss": 2.164, "step": 33643 }, { "epoch": 0.9, "learning_rate": 4.780954733134479e-05, "loss": 2.2648, "step": 33644 }, { "epoch": 0.9, "learning_rate": 4.7782960024106534e-05, "loss": 2.1614, "step": 33645 }, { "epoch": 0.9, "learning_rate": 4.775637993069415e-05, "loss": 2.7917, "step": 33646 }, { "epoch": 0.9, "learning_rate": 4.772980705130914e-05, "loss": 2.4256, "step": 33647 }, { "epoch": 0.9, "learning_rate": 4.770324138615301e-05, "loss": 2.3394, "step": 33648 }, { "epoch": 0.9, "learning_rate": 4.767668293542682e-05, "loss": 2.6769, "step": 33649 }, { "epoch": 0.9, "learning_rate": 4.7650131699331744e-05, "loss": 2.6552, "step": 33650 }, { "epoch": 0.9, "learning_rate": 4.762358767806907e-05, "loss": 2.6147, "step": 33651 }, { "epoch": 0.9, "learning_rate": 4.759705087183974e-05, "loss": 2.4318, "step": 33652 }, { "epoch": 0.9, "learning_rate": 4.757052128084505e-05, "loss": 2.2773, "step": 33653 }, { "epoch": 0.9, "learning_rate": 4.754399890528571e-05, "loss": 2.5217, "step": 33654 }, { "epoch": 0.9, "learning_rate": 4.75174837453628e-05, "loss": 2.4214, "step": 33655 }, { "epoch": 0.9, "learning_rate": 4.749097580127715e-05, "loss": 2.2669, "step": 33656 }, { "epoch": 0.9, "learning_rate": 4.746447507322938e-05, "loss": 1.9541, "step": 33657 }, { "epoch": 0.9, "learning_rate": 4.743798156142076e-05, "loss": 2.549, "step": 33658 }, { "epoch": 0.9, "learning_rate": 4.741149526605149e-05, "loss": 2.2979, "step": 33659 }, { "epoch": 0.9, "learning_rate": 4.7385016187322385e-05, "loss": 2.619, "step": 33660 }, { "epoch": 0.9, "learning_rate": 4.735854432543429e-05, "loss": 2.802, "step": 33661 }, { "epoch": 0.9, "learning_rate": 4.733207968058739e-05, "loss": 2.4787, "step": 33662 }, { "epoch": 0.9, "learning_rate": 4.73056222529823e-05, "loss": 2.7321, "step": 33663 }, { "epoch": 0.9, "learning_rate": 4.7279172042819504e-05, "loss": 2.2679, "step": 33664 }, { "epoch": 0.9, "learning_rate": 4.725272905029943e-05, "loss": 2.5516, "step": 33665 }, { "epoch": 0.9, "learning_rate": 4.722629327562245e-05, "loss": 2.7975, "step": 33666 }, { "epoch": 0.9, "learning_rate": 4.719986471898863e-05, "loss": 2.7195, "step": 33667 }, { "epoch": 0.9, "learning_rate": 4.717344338059826e-05, "loss": 2.2374, "step": 33668 }, { "epoch": 0.9, "learning_rate": 4.714702926065162e-05, "loss": 2.1307, "step": 33669 }, { "epoch": 0.9, "learning_rate": 4.7120622359348555e-05, "loss": 2.3733, "step": 33670 }, { "epoch": 0.9, "learning_rate": 4.7094222676889345e-05, "loss": 2.63, "step": 33671 }, { "epoch": 0.9, "learning_rate": 4.706783021347405e-05, "loss": 2.5696, "step": 33672 }, { "epoch": 0.9, "learning_rate": 4.704144496930251e-05, "loss": 2.6827, "step": 33673 }, { "epoch": 0.9, "learning_rate": 4.701506694457458e-05, "loss": 2.0057, "step": 33674 }, { "epoch": 0.9, "learning_rate": 4.6988696139490086e-05, "loss": 2.2979, "step": 33675 }, { "epoch": 0.91, "learning_rate": 4.6962332554248864e-05, "loss": 2.5189, "step": 33676 }, { "epoch": 0.91, "learning_rate": 4.6935976189050544e-05, "loss": 2.2259, "step": 33677 }, { "epoch": 0.91, "learning_rate": 4.690962704409496e-05, "loss": 2.6273, "step": 33678 }, { "epoch": 0.91, "learning_rate": 4.688328511958162e-05, "loss": 2.4045, "step": 33679 }, { "epoch": 0.91, "learning_rate": 4.685695041571025e-05, "loss": 2.4453, "step": 33680 }, { "epoch": 0.91, "learning_rate": 4.683062293268003e-05, "loss": 2.2598, "step": 33681 }, { "epoch": 0.91, "learning_rate": 4.680430267069069e-05, "loss": 2.5486, "step": 33682 }, { "epoch": 0.91, "learning_rate": 4.677798962994151e-05, "loss": 2.1856, "step": 33683 }, { "epoch": 0.91, "learning_rate": 4.6751683810631776e-05, "loss": 2.4842, "step": 33684 }, { "epoch": 0.91, "learning_rate": 4.67253852129611e-05, "loss": 2.486, "step": 33685 }, { "epoch": 0.91, "learning_rate": 4.669909383712823e-05, "loss": 2.7364, "step": 33686 }, { "epoch": 0.91, "learning_rate": 4.667280968333265e-05, "loss": 2.3179, "step": 33687 }, { "epoch": 0.91, "learning_rate": 4.6646532751773666e-05, "loss": 2.9601, "step": 33688 }, { "epoch": 0.91, "learning_rate": 4.662026304264988e-05, "loss": 2.247, "step": 33689 }, { "epoch": 0.91, "learning_rate": 4.659400055616048e-05, "loss": 2.5217, "step": 33690 }, { "epoch": 0.91, "learning_rate": 4.656774529250451e-05, "loss": 2.7136, "step": 33691 }, { "epoch": 0.91, "learning_rate": 4.654149725188084e-05, "loss": 2.6215, "step": 33692 }, { "epoch": 0.91, "learning_rate": 4.651525643448851e-05, "loss": 2.1525, "step": 33693 }, { "epoch": 0.91, "learning_rate": 4.648902284052592e-05, "loss": 2.8373, "step": 33694 }, { "epoch": 0.91, "learning_rate": 4.646279647019214e-05, "loss": 2.743, "step": 33695 }, { "epoch": 0.91, "learning_rate": 4.643657732368567e-05, "loss": 2.5487, "step": 33696 }, { "epoch": 0.91, "learning_rate": 4.6410365401205134e-05, "loss": 2.8046, "step": 33697 }, { "epoch": 0.91, "learning_rate": 4.638416070294926e-05, "loss": 2.6442, "step": 33698 }, { "epoch": 0.91, "learning_rate": 4.635796322911667e-05, "loss": 2.1725, "step": 33699 }, { "epoch": 0.91, "learning_rate": 4.6331772979905426e-05, "loss": 2.6142, "step": 33700 }, { "epoch": 0.91, "learning_rate": 4.630558995551437e-05, "loss": 2.9006, "step": 33701 }, { "epoch": 0.91, "learning_rate": 4.627941415614145e-05, "loss": 2.2042, "step": 33702 }, { "epoch": 0.91, "learning_rate": 4.625324558198518e-05, "loss": 2.2279, "step": 33703 }, { "epoch": 0.91, "learning_rate": 4.622708423324395e-05, "loss": 2.1307, "step": 33704 }, { "epoch": 0.91, "learning_rate": 4.620093011011572e-05, "loss": 2.5288, "step": 33705 }, { "epoch": 0.91, "learning_rate": 4.617478321279878e-05, "loss": 2.3752, "step": 33706 }, { "epoch": 0.91, "learning_rate": 4.614864354149117e-05, "loss": 1.9487, "step": 33707 }, { "epoch": 0.91, "learning_rate": 4.612251109639087e-05, "loss": 2.1089, "step": 33708 }, { "epoch": 0.91, "learning_rate": 4.6096385877695825e-05, "loss": 2.7878, "step": 33709 }, { "epoch": 0.91, "learning_rate": 4.607026788560409e-05, "loss": 2.7493, "step": 33710 }, { "epoch": 0.91, "learning_rate": 4.6044157120313405e-05, "loss": 2.6035, "step": 33711 }, { "epoch": 0.91, "learning_rate": 4.601805358202171e-05, "loss": 2.637, "step": 33712 }, { "epoch": 0.91, "learning_rate": 4.5991957270926644e-05, "loss": 2.4667, "step": 33713 }, { "epoch": 0.91, "learning_rate": 4.5965868187225925e-05, "loss": 2.4147, "step": 33714 }, { "epoch": 0.91, "learning_rate": 4.5939786331117395e-05, "loss": 2.5958, "step": 33715 }, { "epoch": 0.91, "learning_rate": 4.591371170279812e-05, "loss": 2.5217, "step": 33716 }, { "epoch": 0.91, "learning_rate": 4.5887644302466166e-05, "loss": 2.4315, "step": 33717 }, { "epoch": 0.91, "learning_rate": 4.5861584130319046e-05, "loss": 2.3683, "step": 33718 }, { "epoch": 0.91, "learning_rate": 4.5835531186553704e-05, "loss": 2.8324, "step": 33719 }, { "epoch": 0.91, "learning_rate": 4.580948547136798e-05, "loss": 2.1675, "step": 33720 }, { "epoch": 0.91, "learning_rate": 4.578344698495895e-05, "loss": 2.6523, "step": 33721 }, { "epoch": 0.91, "learning_rate": 4.5757415727523786e-05, "loss": 2.4721, "step": 33722 }, { "epoch": 0.91, "learning_rate": 4.5731391699259995e-05, "loss": 2.4506, "step": 33723 }, { "epoch": 0.91, "learning_rate": 4.570537490036442e-05, "loss": 1.7584, "step": 33724 }, { "epoch": 0.91, "learning_rate": 4.567936533103445e-05, "loss": 2.3094, "step": 33725 }, { "epoch": 0.91, "learning_rate": 4.565336299146705e-05, "loss": 2.2518, "step": 33726 }, { "epoch": 0.91, "learning_rate": 4.562736788185906e-05, "loss": 2.0617, "step": 33727 }, { "epoch": 0.91, "learning_rate": 4.5601380002407544e-05, "loss": 2.5565, "step": 33728 }, { "epoch": 0.91, "learning_rate": 4.557539935330912e-05, "loss": 2.6742, "step": 33729 }, { "epoch": 0.91, "learning_rate": 4.5549425934760966e-05, "loss": 2.8991, "step": 33730 }, { "epoch": 0.91, "learning_rate": 4.552345974695993e-05, "loss": 2.7716, "step": 33731 }, { "epoch": 0.91, "learning_rate": 4.549750079010229e-05, "loss": 2.3773, "step": 33732 }, { "epoch": 0.91, "learning_rate": 4.5471549064385e-05, "loss": 2.46, "step": 33733 }, { "epoch": 0.91, "learning_rate": 4.5445604570004684e-05, "loss": 2.356, "step": 33734 }, { "epoch": 0.91, "learning_rate": 4.541966730715774e-05, "loss": 2.2471, "step": 33735 }, { "epoch": 0.91, "learning_rate": 4.539373727604068e-05, "loss": 2.3482, "step": 33736 }, { "epoch": 0.91, "learning_rate": 4.536781447685001e-05, "loss": 2.7312, "step": 33737 }, { "epoch": 0.91, "learning_rate": 4.534189890978213e-05, "loss": 2.4006, "step": 33738 }, { "epoch": 0.91, "learning_rate": 4.531599057503344e-05, "loss": 2.6086, "step": 33739 }, { "epoch": 0.91, "learning_rate": 4.52900894728e-05, "loss": 2.5361, "step": 33740 }, { "epoch": 0.91, "learning_rate": 4.5264195603278216e-05, "loss": 2.3288, "step": 33741 }, { "epoch": 0.91, "learning_rate": 4.5238308966664146e-05, "loss": 2.6747, "step": 33742 }, { "epoch": 0.91, "learning_rate": 4.521242956315397e-05, "loss": 2.1111, "step": 33743 }, { "epoch": 0.91, "learning_rate": 4.518655739294375e-05, "loss": 2.4606, "step": 33744 }, { "epoch": 0.91, "learning_rate": 4.516069245622945e-05, "loss": 2.2855, "step": 33745 }, { "epoch": 0.91, "learning_rate": 4.513483475320701e-05, "loss": 2.4359, "step": 33746 }, { "epoch": 0.91, "learning_rate": 4.510898428407251e-05, "loss": 2.4236, "step": 33747 }, { "epoch": 0.91, "learning_rate": 4.508314104902145e-05, "loss": 2.3013, "step": 33748 }, { "epoch": 0.91, "learning_rate": 4.505730504824979e-05, "loss": 2.9517, "step": 33749 }, { "epoch": 0.91, "learning_rate": 4.503147628195325e-05, "loss": 2.4952, "step": 33750 }, { "epoch": 0.91, "learning_rate": 4.5005654750327585e-05, "loss": 2.1912, "step": 33751 }, { "epoch": 0.91, "learning_rate": 4.497984045356829e-05, "loss": 2.319, "step": 33752 }, { "epoch": 0.91, "learning_rate": 4.49540333918711e-05, "loss": 2.7691, "step": 33753 }, { "epoch": 0.91, "learning_rate": 4.49282335654313e-05, "loss": 2.2839, "step": 33754 }, { "epoch": 0.91, "learning_rate": 4.4902440974444404e-05, "loss": 2.8725, "step": 33755 }, { "epoch": 0.91, "learning_rate": 4.487665561910592e-05, "loss": 2.4562, "step": 33756 }, { "epoch": 0.91, "learning_rate": 4.485087749961114e-05, "loss": 2.5761, "step": 33757 }, { "epoch": 0.91, "learning_rate": 4.4825106616155464e-05, "loss": 3.1131, "step": 33758 }, { "epoch": 0.91, "learning_rate": 4.479934296893384e-05, "loss": 2.1008, "step": 33759 }, { "epoch": 0.91, "learning_rate": 4.477358655814168e-05, "loss": 2.511, "step": 33760 }, { "epoch": 0.91, "learning_rate": 4.474783738397414e-05, "loss": 2.5887, "step": 33761 }, { "epoch": 0.91, "learning_rate": 4.472209544662609e-05, "loss": 1.8699, "step": 33762 }, { "epoch": 0.91, "learning_rate": 4.469636074629257e-05, "loss": 2.6509, "step": 33763 }, { "epoch": 0.91, "learning_rate": 4.467063328316878e-05, "loss": 2.2665, "step": 33764 }, { "epoch": 0.91, "learning_rate": 4.464491305744933e-05, "loss": 2.3801, "step": 33765 }, { "epoch": 0.91, "learning_rate": 4.461920006932951e-05, "loss": 2.2491, "step": 33766 }, { "epoch": 0.91, "learning_rate": 4.4593494319003615e-05, "loss": 2.1562, "step": 33767 }, { "epoch": 0.91, "learning_rate": 4.456779580666648e-05, "loss": 2.347, "step": 33768 }, { "epoch": 0.91, "learning_rate": 4.454210453251306e-05, "loss": 2.5404, "step": 33769 }, { "epoch": 0.91, "learning_rate": 4.451642049673776e-05, "loss": 2.4355, "step": 33770 }, { "epoch": 0.91, "learning_rate": 4.449074369953543e-05, "loss": 2.1586, "step": 33771 }, { "epoch": 0.91, "learning_rate": 4.446507414110024e-05, "loss": 2.2504, "step": 33772 }, { "epoch": 0.91, "learning_rate": 4.443941182162681e-05, "loss": 2.7312, "step": 33773 }, { "epoch": 0.91, "learning_rate": 4.4413756741309654e-05, "loss": 2.2921, "step": 33774 }, { "epoch": 0.91, "learning_rate": 4.438810890034295e-05, "loss": 2.3063, "step": 33775 }, { "epoch": 0.91, "learning_rate": 4.4362468298920875e-05, "loss": 2.5467, "step": 33776 }, { "epoch": 0.91, "learning_rate": 4.433683493723828e-05, "loss": 2.307, "step": 33777 }, { "epoch": 0.91, "learning_rate": 4.431120881548878e-05, "loss": 2.287, "step": 33778 }, { "epoch": 0.91, "learning_rate": 4.428558993386678e-05, "loss": 2.2521, "step": 33779 }, { "epoch": 0.91, "learning_rate": 4.425997829256623e-05, "loss": 2.3684, "step": 33780 }, { "epoch": 0.91, "learning_rate": 4.4234373891781085e-05, "loss": 2.5001, "step": 33781 }, { "epoch": 0.91, "learning_rate": 4.420877673170565e-05, "loss": 2.7209, "step": 33782 }, { "epoch": 0.91, "learning_rate": 4.418318681253353e-05, "loss": 2.4738, "step": 33783 }, { "epoch": 0.91, "learning_rate": 4.4157604134458684e-05, "loss": 2.7643, "step": 33784 }, { "epoch": 0.91, "learning_rate": 4.413202869767507e-05, "loss": 2.4515, "step": 33785 }, { "epoch": 0.91, "learning_rate": 4.410646050237621e-05, "loss": 2.4251, "step": 33786 }, { "epoch": 0.91, "learning_rate": 4.4080899548756045e-05, "loss": 2.5437, "step": 33787 }, { "epoch": 0.91, "learning_rate": 4.405534583700787e-05, "loss": 2.211, "step": 33788 }, { "epoch": 0.91, "learning_rate": 4.4029799367325426e-05, "loss": 2.5218, "step": 33789 }, { "epoch": 0.91, "learning_rate": 4.400426013990266e-05, "loss": 2.3666, "step": 33790 }, { "epoch": 0.91, "learning_rate": 4.3978728154932426e-05, "loss": 2.5032, "step": 33791 }, { "epoch": 0.91, "learning_rate": 4.395320341260856e-05, "loss": 2.9283, "step": 33792 }, { "epoch": 0.91, "learning_rate": 4.392768591312435e-05, "loss": 2.7263, "step": 33793 }, { "epoch": 0.91, "learning_rate": 4.390217565667287e-05, "loss": 2.1925, "step": 33794 }, { "epoch": 0.91, "learning_rate": 4.387667264344763e-05, "loss": 2.7337, "step": 33795 }, { "epoch": 0.91, "learning_rate": 4.3851176873641815e-05, "loss": 2.7176, "step": 33796 }, { "epoch": 0.91, "learning_rate": 4.382568834744849e-05, "loss": 2.6032, "step": 33797 }, { "epoch": 0.91, "learning_rate": 4.380020706506105e-05, "loss": 2.6932, "step": 33798 }, { "epoch": 0.91, "learning_rate": 4.377473302667201e-05, "loss": 2.4212, "step": 33799 }, { "epoch": 0.91, "learning_rate": 4.374926623247466e-05, "loss": 2.1894, "step": 33800 }, { "epoch": 0.91, "learning_rate": 4.372380668266207e-05, "loss": 2.2573, "step": 33801 }, { "epoch": 0.91, "learning_rate": 4.369835437742675e-05, "loss": 2.5669, "step": 33802 }, { "epoch": 0.91, "learning_rate": 4.367290931696177e-05, "loss": 2.5018, "step": 33803 }, { "epoch": 0.91, "learning_rate": 4.364747150146009e-05, "loss": 2.4738, "step": 33804 }, { "epoch": 0.91, "learning_rate": 4.362204093111388e-05, "loss": 2.7615, "step": 33805 }, { "epoch": 0.91, "learning_rate": 4.3596617606116437e-05, "loss": 2.6772, "step": 33806 }, { "epoch": 0.91, "learning_rate": 4.357120152665972e-05, "loss": 2.5096, "step": 33807 }, { "epoch": 0.91, "learning_rate": 4.354579269293668e-05, "loss": 2.3799, "step": 33808 }, { "epoch": 0.91, "learning_rate": 4.3520391105139726e-05, "loss": 2.6467, "step": 33809 }, { "epoch": 0.91, "learning_rate": 4.3494996763461246e-05, "loss": 2.495, "step": 33810 }, { "epoch": 0.91, "learning_rate": 4.346960966809366e-05, "loss": 2.4882, "step": 33811 }, { "epoch": 0.91, "learning_rate": 4.344422981922946e-05, "loss": 2.3855, "step": 33812 }, { "epoch": 0.91, "learning_rate": 4.3418857217060623e-05, "loss": 2.7858, "step": 33813 }, { "epoch": 0.91, "learning_rate": 4.3393491861779655e-05, "loss": 3.0115, "step": 33814 }, { "epoch": 0.91, "learning_rate": 4.336813375357829e-05, "loss": 1.7943, "step": 33815 }, { "epoch": 0.91, "learning_rate": 4.334278289264904e-05, "loss": 2.3446, "step": 33816 }, { "epoch": 0.91, "learning_rate": 4.331743927918397e-05, "loss": 2.4642, "step": 33817 }, { "epoch": 0.91, "learning_rate": 4.3292102913374706e-05, "loss": 2.4167, "step": 33818 }, { "epoch": 0.91, "learning_rate": 4.326677379541355e-05, "loss": 2.2083, "step": 33819 }, { "epoch": 0.91, "learning_rate": 4.324145192549234e-05, "loss": 2.5351, "step": 33820 }, { "epoch": 0.91, "learning_rate": 4.32161373038028e-05, "loss": 2.4091, "step": 33821 }, { "epoch": 0.91, "learning_rate": 4.3190829930536693e-05, "loss": 2.5647, "step": 33822 }, { "epoch": 0.91, "learning_rate": 4.316552980588573e-05, "loss": 2.269, "step": 33823 }, { "epoch": 0.91, "learning_rate": 4.3140236930041765e-05, "loss": 2.3015, "step": 33824 }, { "epoch": 0.91, "learning_rate": 4.311495130319631e-05, "loss": 2.8675, "step": 33825 }, { "epoch": 0.91, "learning_rate": 4.308967292554089e-05, "loss": 2.5654, "step": 33826 }, { "epoch": 0.91, "learning_rate": 4.306440179726689e-05, "loss": 2.8183, "step": 33827 }, { "epoch": 0.91, "learning_rate": 4.303913791856606e-05, "loss": 2.7126, "step": 33828 }, { "epoch": 0.91, "learning_rate": 4.3013881289629465e-05, "loss": 2.3354, "step": 33829 }, { "epoch": 0.91, "learning_rate": 4.298863191064872e-05, "loss": 2.477, "step": 33830 }, { "epoch": 0.91, "learning_rate": 4.296338978181513e-05, "loss": 2.6454, "step": 33831 }, { "epoch": 0.91, "learning_rate": 4.293815490331965e-05, "loss": 2.6008, "step": 33832 }, { "epoch": 0.91, "learning_rate": 4.2912927275353675e-05, "loss": 2.6037, "step": 33833 }, { "epoch": 0.91, "learning_rate": 4.288770689810817e-05, "loss": 2.6569, "step": 33834 }, { "epoch": 0.91, "learning_rate": 4.286249377177431e-05, "loss": 2.5876, "step": 33835 }, { "epoch": 0.91, "learning_rate": 4.283728789654306e-05, "loss": 2.506, "step": 33836 }, { "epoch": 0.91, "learning_rate": 4.2812089272605383e-05, "loss": 2.3926, "step": 33837 }, { "epoch": 0.91, "learning_rate": 4.278689790015222e-05, "loss": 2.6938, "step": 33838 }, { "epoch": 0.91, "learning_rate": 4.276171377937443e-05, "loss": 2.4426, "step": 33839 }, { "epoch": 0.91, "learning_rate": 4.273653691046275e-05, "loss": 2.0993, "step": 33840 }, { "epoch": 0.91, "learning_rate": 4.2711367293607805e-05, "loss": 2.6394, "step": 33841 }, { "epoch": 0.91, "learning_rate": 4.2686204929000436e-05, "loss": 2.2335, "step": 33842 }, { "epoch": 0.91, "learning_rate": 4.2661049816831274e-05, "loss": 2.7212, "step": 33843 }, { "epoch": 0.91, "learning_rate": 4.263590195729095e-05, "loss": 2.0498, "step": 33844 }, { "epoch": 0.91, "learning_rate": 4.261076135056974e-05, "loss": 2.292, "step": 33845 }, { "epoch": 0.91, "learning_rate": 4.258562799685817e-05, "loss": 2.161, "step": 33846 }, { "epoch": 0.91, "learning_rate": 4.256050189634697e-05, "loss": 2.284, "step": 33847 }, { "epoch": 0.91, "learning_rate": 4.2535383049226e-05, "loss": 2.1077, "step": 33848 }, { "epoch": 0.91, "learning_rate": 4.251027145568587e-05, "loss": 2.5868, "step": 33849 }, { "epoch": 0.91, "learning_rate": 4.2485167115916656e-05, "loss": 2.0327, "step": 33850 }, { "epoch": 0.91, "learning_rate": 4.2460070030108655e-05, "loss": 2.5295, "step": 33851 }, { "epoch": 0.91, "learning_rate": 4.243498019845216e-05, "loss": 2.4055, "step": 33852 }, { "epoch": 0.91, "learning_rate": 4.240989762113678e-05, "loss": 2.1403, "step": 33853 }, { "epoch": 0.91, "learning_rate": 4.2384822298352944e-05, "loss": 2.7429, "step": 33854 }, { "epoch": 0.91, "learning_rate": 4.235975423029048e-05, "loss": 2.7691, "step": 33855 }, { "epoch": 0.91, "learning_rate": 4.2334693417139244e-05, "loss": 2.8121, "step": 33856 }, { "epoch": 0.91, "learning_rate": 4.230963985908931e-05, "loss": 2.6366, "step": 33857 }, { "epoch": 0.91, "learning_rate": 4.22845935563303e-05, "loss": 2.5007, "step": 33858 }, { "epoch": 0.91, "learning_rate": 4.225955450905183e-05, "loss": 2.4427, "step": 33859 }, { "epoch": 0.91, "learning_rate": 4.223452271744399e-05, "loss": 2.6442, "step": 33860 }, { "epoch": 0.91, "learning_rate": 4.220949818169595e-05, "loss": 2.5312, "step": 33861 }, { "epoch": 0.91, "learning_rate": 4.2184480901997445e-05, "loss": 2.3347, "step": 33862 }, { "epoch": 0.91, "learning_rate": 4.215947087853833e-05, "loss": 2.6136, "step": 33863 }, { "epoch": 0.91, "learning_rate": 4.213446811150767e-05, "loss": 2.3889, "step": 33864 }, { "epoch": 0.91, "learning_rate": 4.21094726010951e-05, "loss": 2.3568, "step": 33865 }, { "epoch": 0.91, "learning_rate": 4.20844843474899e-05, "loss": 2.9531, "step": 33866 }, { "epoch": 0.91, "learning_rate": 4.205950335088138e-05, "loss": 2.7582, "step": 33867 }, { "epoch": 0.91, "learning_rate": 4.2034529611458703e-05, "loss": 2.8713, "step": 33868 }, { "epoch": 0.91, "learning_rate": 4.200956312941129e-05, "loss": 2.3475, "step": 33869 }, { "epoch": 0.91, "learning_rate": 4.198460390492809e-05, "loss": 2.4753, "step": 33870 }, { "epoch": 0.91, "learning_rate": 4.195965193819829e-05, "loss": 2.4749, "step": 33871 }, { "epoch": 0.91, "learning_rate": 4.193470722941084e-05, "loss": 2.2579, "step": 33872 }, { "epoch": 0.91, "learning_rate": 4.1909769778754826e-05, "loss": 2.4721, "step": 33873 }, { "epoch": 0.91, "learning_rate": 4.188483958641898e-05, "loss": 2.2246, "step": 33874 }, { "epoch": 0.91, "learning_rate": 4.1859916652592366e-05, "loss": 2.1646, "step": 33875 }, { "epoch": 0.91, "learning_rate": 4.1835000977463846e-05, "loss": 2.5184, "step": 33876 }, { "epoch": 0.91, "learning_rate": 4.1810092561221926e-05, "loss": 2.7646, "step": 33877 }, { "epoch": 0.91, "learning_rate": 4.1785191404055454e-05, "loss": 2.609, "step": 33878 }, { "epoch": 0.91, "learning_rate": 4.1760297506153176e-05, "loss": 2.0747, "step": 33879 }, { "epoch": 0.91, "learning_rate": 4.1735410867703385e-05, "loss": 2.3535, "step": 33880 }, { "epoch": 0.91, "learning_rate": 4.171053148889481e-05, "loss": 2.3521, "step": 33881 }, { "epoch": 0.91, "learning_rate": 4.168565936991597e-05, "loss": 2.3029, "step": 33882 }, { "epoch": 0.91, "learning_rate": 4.166079451095528e-05, "loss": 2.2215, "step": 33883 }, { "epoch": 0.91, "learning_rate": 4.163593691220113e-05, "loss": 2.309, "step": 33884 }, { "epoch": 0.91, "learning_rate": 4.1611086573841715e-05, "loss": 2.6631, "step": 33885 }, { "epoch": 0.91, "learning_rate": 4.158624349606532e-05, "loss": 2.4322, "step": 33886 }, { "epoch": 0.91, "learning_rate": 4.156140767906014e-05, "loss": 2.1721, "step": 33887 }, { "epoch": 0.91, "learning_rate": 4.153657912301445e-05, "loss": 1.9189, "step": 33888 }, { "epoch": 0.91, "learning_rate": 4.151175782811634e-05, "loss": 2.2729, "step": 33889 }, { "epoch": 0.91, "learning_rate": 4.1486943794553756e-05, "loss": 2.752, "step": 33890 }, { "epoch": 0.91, "learning_rate": 4.146213702251478e-05, "loss": 2.5452, "step": 33891 }, { "epoch": 0.91, "learning_rate": 4.1437337512187255e-05, "loss": 2.9375, "step": 33892 }, { "epoch": 0.91, "learning_rate": 4.141254526375904e-05, "loss": 2.9279, "step": 33893 }, { "epoch": 0.91, "learning_rate": 4.1387760277417975e-05, "loss": 2.2271, "step": 33894 }, { "epoch": 0.91, "learning_rate": 4.1362982553351914e-05, "loss": 2.3767, "step": 33895 }, { "epoch": 0.91, "learning_rate": 4.1338212091748376e-05, "loss": 2.4167, "step": 33896 }, { "epoch": 0.91, "learning_rate": 4.131344889279531e-05, "loss": 2.3546, "step": 33897 }, { "epoch": 0.91, "learning_rate": 4.1288692956680144e-05, "loss": 2.8136, "step": 33898 }, { "epoch": 0.91, "learning_rate": 4.126394428359037e-05, "loss": 2.4132, "step": 33899 }, { "epoch": 0.91, "learning_rate": 4.123920287371363e-05, "loss": 2.6557, "step": 33900 }, { "epoch": 0.91, "learning_rate": 4.121446872723711e-05, "loss": 2.6931, "step": 33901 }, { "epoch": 0.91, "learning_rate": 4.118974184434854e-05, "loss": 2.1639, "step": 33902 }, { "epoch": 0.91, "learning_rate": 4.1165022225235104e-05, "loss": 1.9614, "step": 33903 }, { "epoch": 0.91, "learning_rate": 4.114030987008388e-05, "loss": 2.2565, "step": 33904 }, { "epoch": 0.91, "learning_rate": 4.111560477908227e-05, "loss": 2.4055, "step": 33905 }, { "epoch": 0.91, "learning_rate": 4.1090906952417574e-05, "loss": 2.51, "step": 33906 }, { "epoch": 0.91, "learning_rate": 4.106621639027652e-05, "loss": 2.6638, "step": 33907 }, { "epoch": 0.91, "learning_rate": 4.1041533092846304e-05, "loss": 2.7852, "step": 33908 }, { "epoch": 0.91, "learning_rate": 4.1016857060314214e-05, "loss": 2.6624, "step": 33909 }, { "epoch": 0.91, "learning_rate": 4.0992188292866884e-05, "loss": 2.2896, "step": 33910 }, { "epoch": 0.91, "learning_rate": 4.096752679069138e-05, "loss": 2.7013, "step": 33911 }, { "epoch": 0.91, "learning_rate": 4.094287255397422e-05, "loss": 2.2683, "step": 33912 }, { "epoch": 0.91, "learning_rate": 4.091822558290248e-05, "loss": 2.6298, "step": 33913 }, { "epoch": 0.91, "learning_rate": 4.089358587766279e-05, "loss": 2.3247, "step": 33914 }, { "epoch": 0.91, "learning_rate": 4.086895343844188e-05, "loss": 2.3154, "step": 33915 }, { "epoch": 0.91, "learning_rate": 4.0844328265426164e-05, "loss": 2.2947, "step": 33916 }, { "epoch": 0.91, "learning_rate": 4.0819710358802606e-05, "loss": 2.3088, "step": 33917 }, { "epoch": 0.91, "learning_rate": 4.079509971875717e-05, "loss": 2.3426, "step": 33918 }, { "epoch": 0.91, "learning_rate": 4.07704963454768e-05, "loss": 3.0578, "step": 33919 }, { "epoch": 0.91, "learning_rate": 4.074590023914748e-05, "loss": 2.6686, "step": 33920 }, { "epoch": 0.91, "learning_rate": 4.0721311399955604e-05, "loss": 2.22, "step": 33921 }, { "epoch": 0.91, "learning_rate": 4.069672982808792e-05, "loss": 2.6925, "step": 33922 }, { "epoch": 0.91, "learning_rate": 4.067215552373005e-05, "loss": 2.6065, "step": 33923 }, { "epoch": 0.91, "learning_rate": 4.064758848706851e-05, "loss": 2.7262, "step": 33924 }, { "epoch": 0.91, "learning_rate": 4.062302871828938e-05, "loss": 2.4358, "step": 33925 }, { "epoch": 0.91, "learning_rate": 4.059847621757851e-05, "loss": 2.3866, "step": 33926 }, { "epoch": 0.91, "learning_rate": 4.0573930985122076e-05, "loss": 2.7649, "step": 33927 }, { "epoch": 0.91, "learning_rate": 4.054939302110605e-05, "loss": 2.7628, "step": 33928 }, { "epoch": 0.91, "learning_rate": 4.0524862325716286e-05, "loss": 2.3565, "step": 33929 }, { "epoch": 0.91, "learning_rate": 4.0500338899138734e-05, "loss": 2.624, "step": 33930 }, { "epoch": 0.91, "learning_rate": 4.047582274155903e-05, "loss": 2.2999, "step": 33931 }, { "epoch": 0.91, "learning_rate": 4.045131385316281e-05, "loss": 2.3161, "step": 33932 }, { "epoch": 0.91, "learning_rate": 4.042681223413613e-05, "loss": 2.1817, "step": 33933 }, { "epoch": 0.91, "learning_rate": 4.0402317884664084e-05, "loss": 2.1154, "step": 33934 }, { "epoch": 0.91, "learning_rate": 4.0377830804932733e-05, "loss": 2.7191, "step": 33935 }, { "epoch": 0.91, "learning_rate": 4.035335099512716e-05, "loss": 2.312, "step": 33936 }, { "epoch": 0.91, "learning_rate": 4.03288784554332e-05, "loss": 2.65, "step": 33937 }, { "epoch": 0.91, "learning_rate": 4.030441318603617e-05, "loss": 2.5048, "step": 33938 }, { "epoch": 0.91, "learning_rate": 4.027995518712113e-05, "loss": 2.2804, "step": 33939 }, { "epoch": 0.91, "learning_rate": 4.0255504458873606e-05, "loss": 2.5749, "step": 33940 }, { "epoch": 0.91, "learning_rate": 4.023106100147877e-05, "loss": 2.1615, "step": 33941 }, { "epoch": 0.91, "learning_rate": 4.020662481512183e-05, "loss": 2.5231, "step": 33942 }, { "epoch": 0.91, "learning_rate": 4.018219589998795e-05, "loss": 2.8299, "step": 33943 }, { "epoch": 0.91, "learning_rate": 4.0157774256262214e-05, "loss": 2.6838, "step": 33944 }, { "epoch": 0.91, "learning_rate": 4.013335988412958e-05, "loss": 2.2798, "step": 33945 }, { "epoch": 0.91, "learning_rate": 4.010895278377502e-05, "loss": 2.38, "step": 33946 }, { "epoch": 0.91, "learning_rate": 4.008455295538316e-05, "loss": 2.2616, "step": 33947 }, { "epoch": 0.91, "learning_rate": 4.006016039913929e-05, "loss": 2.8677, "step": 33948 }, { "epoch": 0.91, "learning_rate": 4.003577511522816e-05, "loss": 2.521, "step": 33949 }, { "epoch": 0.91, "learning_rate": 4.001139710383417e-05, "loss": 2.5277, "step": 33950 }, { "epoch": 0.91, "learning_rate": 3.998702636514229e-05, "loss": 2.1114, "step": 33951 }, { "epoch": 0.91, "learning_rate": 3.996266289933714e-05, "loss": 2.4534, "step": 33952 }, { "epoch": 0.91, "learning_rate": 3.9938306706603036e-05, "loss": 1.8633, "step": 33953 }, { "epoch": 0.91, "learning_rate": 3.991395778712481e-05, "loss": 2.7288, "step": 33954 }, { "epoch": 0.91, "learning_rate": 3.988961614108666e-05, "loss": 2.5346, "step": 33955 }, { "epoch": 0.91, "learning_rate": 3.986528176867321e-05, "loss": 2.5743, "step": 33956 }, { "epoch": 0.91, "learning_rate": 3.9840954670068873e-05, "loss": 2.5098, "step": 33957 }, { "epoch": 0.91, "learning_rate": 3.981663484545761e-05, "loss": 2.4804, "step": 33958 }, { "epoch": 0.91, "learning_rate": 3.979232229502383e-05, "loss": 2.0383, "step": 33959 }, { "epoch": 0.91, "learning_rate": 3.976801701895183e-05, "loss": 2.4255, "step": 33960 }, { "epoch": 0.91, "learning_rate": 3.9743719017425686e-05, "loss": 1.9211, "step": 33961 }, { "epoch": 0.91, "learning_rate": 3.971942829062947e-05, "loss": 2.988, "step": 33962 }, { "epoch": 0.91, "learning_rate": 3.969514483874714e-05, "loss": 2.2483, "step": 33963 }, { "epoch": 0.91, "learning_rate": 3.967086866196268e-05, "loss": 2.5702, "step": 33964 }, { "epoch": 0.91, "learning_rate": 3.964659976046015e-05, "loss": 2.6479, "step": 33965 }, { "epoch": 0.91, "learning_rate": 3.962233813442317e-05, "loss": 2.4568, "step": 33966 }, { "epoch": 0.91, "learning_rate": 3.959808378403562e-05, "loss": 2.3677, "step": 33967 }, { "epoch": 0.91, "learning_rate": 3.957383670948134e-05, "loss": 2.0341, "step": 33968 }, { "epoch": 0.91, "learning_rate": 3.9549596910943955e-05, "loss": 2.678, "step": 33969 }, { "epoch": 0.91, "learning_rate": 3.952536438860721e-05, "loss": 3.0279, "step": 33970 }, { "epoch": 0.91, "learning_rate": 3.950113914265441e-05, "loss": 2.239, "step": 33971 }, { "epoch": 0.91, "learning_rate": 3.947692117326929e-05, "loss": 2.4229, "step": 33972 }, { "epoch": 0.91, "learning_rate": 3.9452710480635364e-05, "loss": 2.4104, "step": 33973 }, { "epoch": 0.91, "learning_rate": 3.942850706493595e-05, "loss": 2.9464, "step": 33974 }, { "epoch": 0.91, "learning_rate": 3.940431092635444e-05, "loss": 2.3552, "step": 33975 }, { "epoch": 0.91, "learning_rate": 3.938012206507413e-05, "loss": 2.5923, "step": 33976 }, { "epoch": 0.91, "learning_rate": 3.935594048127833e-05, "loss": 2.0578, "step": 33977 }, { "epoch": 0.91, "learning_rate": 3.933176617515e-05, "loss": 2.1715, "step": 33978 }, { "epoch": 0.91, "learning_rate": 3.930759914687276e-05, "loss": 2.2358, "step": 33979 }, { "epoch": 0.91, "learning_rate": 3.928343939662915e-05, "loss": 2.8208, "step": 33980 }, { "epoch": 0.91, "learning_rate": 3.9259286924602456e-05, "loss": 2.2419, "step": 33981 }, { "epoch": 0.91, "learning_rate": 3.923514173097564e-05, "loss": 2.5764, "step": 33982 }, { "epoch": 0.91, "learning_rate": 3.9211003815931676e-05, "loss": 2.6721, "step": 33983 }, { "epoch": 0.91, "learning_rate": 3.918687317965341e-05, "loss": 2.7164, "step": 33984 }, { "epoch": 0.91, "learning_rate": 3.91627498223236e-05, "loss": 3.0567, "step": 33985 }, { "epoch": 0.91, "learning_rate": 3.9138633744124965e-05, "loss": 2.5098, "step": 33986 }, { "epoch": 0.91, "learning_rate": 3.9114524945240256e-05, "loss": 2.5557, "step": 33987 }, { "epoch": 0.91, "learning_rate": 3.909042342585212e-05, "loss": 2.5234, "step": 33988 }, { "epoch": 0.91, "learning_rate": 3.906632918614328e-05, "loss": 2.1686, "step": 33989 }, { "epoch": 0.91, "learning_rate": 3.904224222629593e-05, "loss": 1.6036, "step": 33990 }, { "epoch": 0.91, "learning_rate": 3.901816254649282e-05, "loss": 2.2548, "step": 33991 }, { "epoch": 0.91, "learning_rate": 3.899409014691635e-05, "loss": 2.0636, "step": 33992 }, { "epoch": 0.91, "learning_rate": 3.897002502774882e-05, "loss": 2.3292, "step": 33993 }, { "epoch": 0.91, "learning_rate": 3.894596718917243e-05, "loss": 2.6367, "step": 33994 }, { "epoch": 0.91, "learning_rate": 3.892191663136979e-05, "loss": 2.1224, "step": 33995 }, { "epoch": 0.91, "learning_rate": 3.889787335452277e-05, "loss": 1.7698, "step": 33996 }, { "epoch": 0.91, "learning_rate": 3.887383735881367e-05, "loss": 2.5833, "step": 33997 }, { "epoch": 0.91, "learning_rate": 3.8849808644424554e-05, "loss": 2.258, "step": 33998 }, { "epoch": 0.91, "learning_rate": 3.88257872115374e-05, "loss": 2.3878, "step": 33999 }, { "epoch": 0.91, "learning_rate": 3.880177306033417e-05, "loss": 2.3625, "step": 34000 }, { "epoch": 0.91, "learning_rate": 3.877776619099693e-05, "loss": 2.4244, "step": 34001 }, { "epoch": 0.91, "learning_rate": 3.875376660370744e-05, "loss": 2.3526, "step": 34002 }, { "epoch": 0.91, "learning_rate": 3.872977429864777e-05, "loss": 1.8567, "step": 34003 }, { "epoch": 0.91, "learning_rate": 3.8705789275999324e-05, "loss": 2.8716, "step": 34004 }, { "epoch": 0.91, "learning_rate": 3.868181153594408e-05, "loss": 2.3548, "step": 34005 }, { "epoch": 0.91, "learning_rate": 3.8657841078663326e-05, "loss": 2.4651, "step": 34006 }, { "epoch": 0.91, "learning_rate": 3.863387790433892e-05, "loss": 2.827, "step": 34007 }, { "epoch": 0.91, "learning_rate": 3.86099220131525e-05, "loss": 2.6231, "step": 34008 }, { "epoch": 0.91, "learning_rate": 3.8585973405285356e-05, "loss": 2.5849, "step": 34009 }, { "epoch": 0.91, "learning_rate": 3.856203208091902e-05, "loss": 2.8024, "step": 34010 }, { "epoch": 0.91, "learning_rate": 3.8538098040235004e-05, "loss": 2.1057, "step": 34011 }, { "epoch": 0.91, "learning_rate": 3.851417128341428e-05, "loss": 2.6553, "step": 34012 }, { "epoch": 0.91, "learning_rate": 3.849025181063826e-05, "loss": 2.5327, "step": 34013 }, { "epoch": 0.91, "learning_rate": 3.846633962208823e-05, "loss": 2.9376, "step": 34014 }, { "epoch": 0.91, "learning_rate": 3.844243471794539e-05, "loss": 2.0711, "step": 34015 }, { "epoch": 0.91, "learning_rate": 3.8418537098390716e-05, "loss": 2.485, "step": 34016 }, { "epoch": 0.91, "learning_rate": 3.839464676360527e-05, "loss": 2.5275, "step": 34017 }, { "epoch": 0.91, "learning_rate": 3.837076371377002e-05, "loss": 2.3586, "step": 34018 }, { "epoch": 0.91, "learning_rate": 3.834688794906616e-05, "loss": 2.7337, "step": 34019 }, { "epoch": 0.91, "learning_rate": 3.832301946967398e-05, "loss": 2.1695, "step": 34020 }, { "epoch": 0.91, "learning_rate": 3.8299158275774906e-05, "loss": 2.666, "step": 34021 }, { "epoch": 0.91, "learning_rate": 3.827530436754945e-05, "loss": 2.6739, "step": 34022 }, { "epoch": 0.91, "learning_rate": 3.8251457745178354e-05, "loss": 3.1475, "step": 34023 }, { "epoch": 0.91, "learning_rate": 3.822761840884237e-05, "loss": 2.3044, "step": 34024 }, { "epoch": 0.91, "learning_rate": 3.820378635872179e-05, "loss": 2.543, "step": 34025 }, { "epoch": 0.91, "learning_rate": 3.8179961594997484e-05, "loss": 2.6936, "step": 34026 }, { "epoch": 0.91, "learning_rate": 3.815614411784973e-05, "loss": 2.1826, "step": 34027 }, { "epoch": 0.91, "learning_rate": 3.8132333927459184e-05, "loss": 2.5687, "step": 34028 }, { "epoch": 0.91, "learning_rate": 3.810853102400602e-05, "loss": 2.2931, "step": 34029 }, { "epoch": 0.91, "learning_rate": 3.8084735407670765e-05, "loss": 2.1374, "step": 34030 }, { "epoch": 0.91, "learning_rate": 3.80609470786335e-05, "loss": 2.2636, "step": 34031 }, { "epoch": 0.91, "learning_rate": 3.8037166037074635e-05, "loss": 2.5051, "step": 34032 }, { "epoch": 0.91, "learning_rate": 3.801339228317402e-05, "loss": 2.3011, "step": 34033 }, { "epoch": 0.91, "learning_rate": 3.798962581711207e-05, "loss": 2.3635, "step": 34034 }, { "epoch": 0.91, "learning_rate": 3.7965866639068756e-05, "loss": 2.3689, "step": 34035 }, { "epoch": 0.91, "learning_rate": 3.794211474922404e-05, "loss": 2.8108, "step": 34036 }, { "epoch": 0.91, "learning_rate": 3.7918370147757787e-05, "loss": 2.3078, "step": 34037 }, { "epoch": 0.91, "learning_rate": 3.789463283485006e-05, "loss": 2.3114, "step": 34038 }, { "epoch": 0.91, "learning_rate": 3.7870902810680505e-05, "loss": 2.2426, "step": 34039 }, { "epoch": 0.91, "learning_rate": 3.784718007542898e-05, "loss": 2.7767, "step": 34040 }, { "epoch": 0.91, "learning_rate": 3.782346462927522e-05, "loss": 2.5629, "step": 34041 }, { "epoch": 0.91, "learning_rate": 3.779975647239875e-05, "loss": 2.4211, "step": 34042 }, { "epoch": 0.91, "learning_rate": 3.777605560497954e-05, "loss": 2.2907, "step": 34043 }, { "epoch": 0.91, "learning_rate": 3.775236202719678e-05, "loss": 2.8358, "step": 34044 }, { "epoch": 0.91, "learning_rate": 3.772867573923011e-05, "loss": 2.6739, "step": 34045 }, { "epoch": 0.91, "learning_rate": 3.770499674125882e-05, "loss": 2.623, "step": 34046 }, { "epoch": 0.91, "learning_rate": 3.7681325033462555e-05, "loss": 2.6635, "step": 34047 }, { "epoch": 0.91, "learning_rate": 3.765766061602061e-05, "loss": 2.3597, "step": 34048 }, { "epoch": 0.92, "learning_rate": 3.7634003489112054e-05, "loss": 2.398, "step": 34049 }, { "epoch": 0.92, "learning_rate": 3.7610353652916204e-05, "loss": 2.4104, "step": 34050 }, { "epoch": 0.92, "learning_rate": 3.758671110761247e-05, "loss": 2.7718, "step": 34051 }, { "epoch": 0.92, "learning_rate": 3.7563075853379594e-05, "loss": 2.6051, "step": 34052 }, { "epoch": 0.92, "learning_rate": 3.753944789039665e-05, "loss": 2.4602, "step": 34053 }, { "epoch": 0.92, "learning_rate": 3.751582721884295e-05, "loss": 2.2499, "step": 34054 }, { "epoch": 0.92, "learning_rate": 3.7492213838897225e-05, "loss": 2.9466, "step": 34055 }, { "epoch": 0.92, "learning_rate": 3.746860775073846e-05, "loss": 2.7661, "step": 34056 }, { "epoch": 0.92, "learning_rate": 3.744500895454539e-05, "loss": 2.7234, "step": 34057 }, { "epoch": 0.92, "learning_rate": 3.742141745049687e-05, "loss": 2.291, "step": 34058 }, { "epoch": 0.92, "learning_rate": 3.739783323877155e-05, "loss": 2.2982, "step": 34059 }, { "epoch": 0.92, "learning_rate": 3.737425631954816e-05, "loss": 2.4129, "step": 34060 }, { "epoch": 0.92, "learning_rate": 3.7350686693005233e-05, "loss": 2.4347, "step": 34061 }, { "epoch": 0.92, "learning_rate": 3.732712435932162e-05, "loss": 2.2344, "step": 34062 }, { "epoch": 0.92, "learning_rate": 3.73035693186754e-05, "loss": 2.734, "step": 34063 }, { "epoch": 0.92, "learning_rate": 3.728002157124533e-05, "loss": 2.6436, "step": 34064 }, { "epoch": 0.92, "learning_rate": 3.7256481117209695e-05, "loss": 2.5056, "step": 34065 }, { "epoch": 0.92, "learning_rate": 3.72329479567467e-05, "loss": 2.5843, "step": 34066 }, { "epoch": 0.92, "learning_rate": 3.720942209003497e-05, "loss": 2.6041, "step": 34067 }, { "epoch": 0.92, "learning_rate": 3.718590351725237e-05, "loss": 2.7336, "step": 34068 }, { "epoch": 0.92, "learning_rate": 3.716239223857731e-05, "loss": 2.3766, "step": 34069 }, { "epoch": 0.92, "learning_rate": 3.713888825418788e-05, "loss": 2.0405, "step": 34070 }, { "epoch": 0.92, "learning_rate": 3.711539156426191e-05, "loss": 2.6536, "step": 34071 }, { "epoch": 0.92, "learning_rate": 3.709190216897773e-05, "loss": 2.3296, "step": 34072 }, { "epoch": 0.92, "learning_rate": 3.7068420068513074e-05, "loss": 2.3664, "step": 34073 }, { "epoch": 0.92, "learning_rate": 3.704494526304592e-05, "loss": 2.5507, "step": 34074 }, { "epoch": 0.92, "learning_rate": 3.702147775275422e-05, "loss": 2.5386, "step": 34075 }, { "epoch": 0.92, "learning_rate": 3.6998017537815506e-05, "loss": 2.2458, "step": 34076 }, { "epoch": 0.92, "learning_rate": 3.697456461840765e-05, "loss": 2.3228, "step": 34077 }, { "epoch": 0.92, "learning_rate": 3.695111899470838e-05, "loss": 2.8421, "step": 34078 }, { "epoch": 0.92, "learning_rate": 3.6927680666895115e-05, "loss": 2.2539, "step": 34079 }, { "epoch": 0.92, "learning_rate": 3.69042496351456e-05, "loss": 2.3714, "step": 34080 }, { "epoch": 0.92, "learning_rate": 3.6880825899637484e-05, "loss": 2.7154, "step": 34081 }, { "epoch": 0.92, "learning_rate": 3.685740946054794e-05, "loss": 2.0841, "step": 34082 }, { "epoch": 0.92, "learning_rate": 3.683400031805451e-05, "loss": 1.7753, "step": 34083 }, { "epoch": 0.92, "learning_rate": 3.6810598472334476e-05, "loss": 2.2305, "step": 34084 }, { "epoch": 0.92, "learning_rate": 3.678720392356505e-05, "loss": 2.5773, "step": 34085 }, { "epoch": 0.92, "learning_rate": 3.6763816671923636e-05, "loss": 2.2137, "step": 34086 }, { "epoch": 0.92, "learning_rate": 3.67404367175872e-05, "loss": 2.5274, "step": 34087 }, { "epoch": 0.92, "learning_rate": 3.6717064060733166e-05, "loss": 2.5547, "step": 34088 }, { "epoch": 0.92, "learning_rate": 3.669369870153849e-05, "loss": 2.5202, "step": 34089 }, { "epoch": 0.92, "learning_rate": 3.6670340640180044e-05, "loss": 2.5435, "step": 34090 }, { "epoch": 0.92, "learning_rate": 3.664698987683479e-05, "loss": 2.2984, "step": 34091 }, { "epoch": 0.92, "learning_rate": 3.66236464116797e-05, "loss": 2.5076, "step": 34092 }, { "epoch": 0.92, "learning_rate": 3.660031024489174e-05, "loss": 1.9852, "step": 34093 }, { "epoch": 0.92, "learning_rate": 3.657698137664767e-05, "loss": 2.3892, "step": 34094 }, { "epoch": 0.92, "learning_rate": 3.6553659807124e-05, "loss": 2.4014, "step": 34095 }, { "epoch": 0.92, "learning_rate": 3.653034553649759e-05, "loss": 2.7852, "step": 34096 }, { "epoch": 0.92, "learning_rate": 3.650703856494508e-05, "loss": 2.512, "step": 34097 }, { "epoch": 0.92, "learning_rate": 3.6483738892642895e-05, "loss": 3.0268, "step": 34098 }, { "epoch": 0.92, "learning_rate": 3.646044651976765e-05, "loss": 2.3662, "step": 34099 }, { "epoch": 0.92, "learning_rate": 3.6437161446495784e-05, "loss": 2.4618, "step": 34100 }, { "epoch": 0.92, "learning_rate": 3.64138836730038e-05, "loss": 2.6954, "step": 34101 }, { "epoch": 0.92, "learning_rate": 3.639061319946801e-05, "loss": 2.2652, "step": 34102 }, { "epoch": 0.92, "learning_rate": 3.636735002606451e-05, "loss": 2.3812, "step": 34103 }, { "epoch": 0.92, "learning_rate": 3.63440941529698e-05, "loss": 2.711, "step": 34104 }, { "epoch": 0.92, "learning_rate": 3.632084558035986e-05, "loss": 2.4295, "step": 34105 }, { "epoch": 0.92, "learning_rate": 3.629760430841089e-05, "loss": 2.224, "step": 34106 }, { "epoch": 0.92, "learning_rate": 3.6274370337298966e-05, "loss": 2.7829, "step": 34107 }, { "epoch": 0.92, "learning_rate": 3.6251143667200284e-05, "loss": 2.2186, "step": 34108 }, { "epoch": 0.92, "learning_rate": 3.622792429829047e-05, "loss": 1.9658, "step": 34109 }, { "epoch": 0.92, "learning_rate": 3.620471223074573e-05, "loss": 2.8118, "step": 34110 }, { "epoch": 0.92, "learning_rate": 3.6181507464741694e-05, "loss": 2.136, "step": 34111 }, { "epoch": 0.92, "learning_rate": 3.615831000045422e-05, "loss": 2.5427, "step": 34112 }, { "epoch": 0.92, "learning_rate": 3.613511983805906e-05, "loss": 2.7366, "step": 34113 }, { "epoch": 0.92, "learning_rate": 3.611193697773196e-05, "loss": 2.6439, "step": 34114 }, { "epoch": 0.92, "learning_rate": 3.608876141964845e-05, "loss": 2.7137, "step": 34115 }, { "epoch": 0.92, "learning_rate": 3.606559316398428e-05, "loss": 2.4398, "step": 34116 }, { "epoch": 0.92, "learning_rate": 3.604243221091474e-05, "loss": 2.8957, "step": 34117 }, { "epoch": 0.92, "learning_rate": 3.601927856061538e-05, "loss": 2.898, "step": 34118 }, { "epoch": 0.92, "learning_rate": 3.599613221326159e-05, "loss": 2.7501, "step": 34119 }, { "epoch": 0.92, "learning_rate": 3.59729931690288e-05, "loss": 2.6587, "step": 34120 }, { "epoch": 0.92, "learning_rate": 3.5949861428092314e-05, "loss": 2.5609, "step": 34121 }, { "epoch": 0.92, "learning_rate": 3.592673699062732e-05, "loss": 2.3695, "step": 34122 }, { "epoch": 0.92, "learning_rate": 3.59036198568089e-05, "loss": 2.8621, "step": 34123 }, { "epoch": 0.92, "learning_rate": 3.588051002681247e-05, "loss": 2.6222, "step": 34124 }, { "epoch": 0.92, "learning_rate": 3.585740750081279e-05, "loss": 2.3858, "step": 34125 }, { "epoch": 0.92, "learning_rate": 3.583431227898493e-05, "loss": 2.5655, "step": 34126 }, { "epoch": 0.92, "learning_rate": 3.581122436150408e-05, "loss": 2.7035, "step": 34127 }, { "epoch": 0.92, "learning_rate": 3.5788143748545e-05, "loss": 2.2601, "step": 34128 }, { "epoch": 0.92, "learning_rate": 3.5765070440282656e-05, "loss": 2.3946, "step": 34129 }, { "epoch": 0.92, "learning_rate": 3.574200443689157e-05, "loss": 2.3854, "step": 34130 }, { "epoch": 0.92, "learning_rate": 3.571894573854673e-05, "loss": 2.2348, "step": 34131 }, { "epoch": 0.92, "learning_rate": 3.5695894345422755e-05, "loss": 2.5202, "step": 34132 }, { "epoch": 0.92, "learning_rate": 3.567285025769429e-05, "loss": 2.4759, "step": 34133 }, { "epoch": 0.92, "learning_rate": 3.5649813475535865e-05, "loss": 2.6747, "step": 34134 }, { "epoch": 0.92, "learning_rate": 3.5626783999122113e-05, "loss": 2.3907, "step": 34135 }, { "epoch": 0.92, "learning_rate": 3.5603761828627456e-05, "loss": 2.1981, "step": 34136 }, { "epoch": 0.92, "learning_rate": 3.558074696422631e-05, "loss": 2.3232, "step": 34137 }, { "epoch": 0.92, "learning_rate": 3.555773940609286e-05, "loss": 2.5041, "step": 34138 }, { "epoch": 0.92, "learning_rate": 3.553473915440153e-05, "loss": 2.4211, "step": 34139 }, { "epoch": 0.92, "learning_rate": 3.551174620932674e-05, "loss": 2.4217, "step": 34140 }, { "epoch": 0.92, "learning_rate": 3.548876057104244e-05, "loss": 2.4434, "step": 34141 }, { "epoch": 0.92, "learning_rate": 3.546578223972285e-05, "loss": 2.8796, "step": 34142 }, { "epoch": 0.92, "learning_rate": 3.544281121554216e-05, "loss": 2.7545, "step": 34143 }, { "epoch": 0.92, "learning_rate": 3.541984749867422e-05, "loss": 2.2829, "step": 34144 }, { "epoch": 0.92, "learning_rate": 3.5396891089293e-05, "loss": 2.5427, "step": 34145 }, { "epoch": 0.92, "learning_rate": 3.537394198757249e-05, "loss": 2.3607, "step": 34146 }, { "epoch": 0.92, "learning_rate": 3.535100019368653e-05, "loss": 2.5809, "step": 34147 }, { "epoch": 0.92, "learning_rate": 3.5328065707809e-05, "loss": 2.7118, "step": 34148 }, { "epoch": 0.92, "learning_rate": 3.530513853011352e-05, "loss": 2.7087, "step": 34149 }, { "epoch": 0.92, "learning_rate": 3.528221866077386e-05, "loss": 2.3599, "step": 34150 }, { "epoch": 0.92, "learning_rate": 3.525930609996375e-05, "loss": 2.6572, "step": 34151 }, { "epoch": 0.92, "learning_rate": 3.52364008478564e-05, "loss": 2.3168, "step": 34152 }, { "epoch": 0.92, "learning_rate": 3.521350290462577e-05, "loss": 2.453, "step": 34153 }, { "epoch": 0.92, "learning_rate": 3.519061227044518e-05, "loss": 2.554, "step": 34154 }, { "epoch": 0.92, "learning_rate": 3.516772894548792e-05, "loss": 2.6673, "step": 34155 }, { "epoch": 0.92, "learning_rate": 3.514485292992753e-05, "loss": 2.5058, "step": 34156 }, { "epoch": 0.92, "learning_rate": 3.51219842239372e-05, "loss": 2.4587, "step": 34157 }, { "epoch": 0.92, "learning_rate": 3.5099122827690236e-05, "loss": 2.4453, "step": 34158 }, { "epoch": 0.92, "learning_rate": 3.507626874135972e-05, "loss": 2.4169, "step": 34159 }, { "epoch": 0.92, "learning_rate": 3.505342196511896e-05, "loss": 2.8637, "step": 34160 }, { "epoch": 0.92, "learning_rate": 3.5030582499140816e-05, "loss": 2.5441, "step": 34161 }, { "epoch": 0.92, "learning_rate": 3.500775034359871e-05, "loss": 2.3289, "step": 34162 }, { "epoch": 0.92, "learning_rate": 3.498492549866528e-05, "loss": 2.359, "step": 34163 }, { "epoch": 0.92, "learning_rate": 3.496210796451349e-05, "loss": 2.761, "step": 34164 }, { "epoch": 0.92, "learning_rate": 3.49392977413161e-05, "loss": 2.3942, "step": 34165 }, { "epoch": 0.92, "learning_rate": 3.491649482924619e-05, "loss": 2.5522, "step": 34166 }, { "epoch": 0.92, "learning_rate": 3.48936992284764e-05, "loss": 2.5938, "step": 34167 }, { "epoch": 0.92, "learning_rate": 3.487091093917938e-05, "loss": 2.2956, "step": 34168 }, { "epoch": 0.92, "learning_rate": 3.4848129961527755e-05, "loss": 2.3027, "step": 34169 }, { "epoch": 0.92, "learning_rate": 3.4825356295694276e-05, "loss": 2.5806, "step": 34170 }, { "epoch": 0.92, "learning_rate": 3.480258994185126e-05, "loss": 2.8339, "step": 34171 }, { "epoch": 0.92, "learning_rate": 3.4779830900171116e-05, "loss": 2.6765, "step": 34172 }, { "epoch": 0.92, "learning_rate": 3.475707917082649e-05, "loss": 2.0132, "step": 34173 }, { "epoch": 0.92, "learning_rate": 3.473433475398968e-05, "loss": 2.2963, "step": 34174 }, { "epoch": 0.92, "learning_rate": 3.471159764983311e-05, "loss": 2.4827, "step": 34175 }, { "epoch": 0.92, "learning_rate": 3.468886785852876e-05, "loss": 2.5389, "step": 34176 }, { "epoch": 0.92, "learning_rate": 3.4666145380249034e-05, "loss": 2.3504, "step": 34177 }, { "epoch": 0.92, "learning_rate": 3.4643430215165915e-05, "loss": 2.4143, "step": 34178 }, { "epoch": 0.92, "learning_rate": 3.46207223634516e-05, "loss": 2.2941, "step": 34179 }, { "epoch": 0.92, "learning_rate": 3.459802182527816e-05, "loss": 2.3789, "step": 34180 }, { "epoch": 0.92, "learning_rate": 3.457532860081747e-05, "loss": 2.6499, "step": 34181 }, { "epoch": 0.92, "learning_rate": 3.45526426902415e-05, "loss": 2.4654, "step": 34182 }, { "epoch": 0.92, "learning_rate": 3.452996409372211e-05, "loss": 2.6382, "step": 34183 }, { "epoch": 0.92, "learning_rate": 3.4507292811431054e-05, "loss": 2.6727, "step": 34184 }, { "epoch": 0.92, "learning_rate": 3.44846288435402e-05, "loss": 2.3347, "step": 34185 }, { "epoch": 0.92, "learning_rate": 3.446197219022107e-05, "loss": 2.2492, "step": 34186 }, { "epoch": 0.92, "learning_rate": 3.4439322851645524e-05, "loss": 2.5948, "step": 34187 }, { "epoch": 0.92, "learning_rate": 3.4416680827985105e-05, "loss": 2.058, "step": 34188 }, { "epoch": 0.92, "learning_rate": 3.43940461194111e-05, "loss": 2.3558, "step": 34189 }, { "epoch": 0.92, "learning_rate": 3.437141872609528e-05, "loss": 2.312, "step": 34190 }, { "epoch": 0.92, "learning_rate": 3.4348798648208944e-05, "loss": 2.7175, "step": 34191 }, { "epoch": 0.92, "learning_rate": 3.43261858859234e-05, "loss": 2.8417, "step": 34192 }, { "epoch": 0.92, "learning_rate": 3.4303580439410064e-05, "loss": 2.4058, "step": 34193 }, { "epoch": 0.92, "learning_rate": 3.428098230884025e-05, "loss": 2.3281, "step": 34194 }, { "epoch": 0.92, "learning_rate": 3.425839149438492e-05, "loss": 2.1253, "step": 34195 }, { "epoch": 0.92, "learning_rate": 3.423580799621551e-05, "loss": 2.3269, "step": 34196 }, { "epoch": 0.92, "learning_rate": 3.421323181450287e-05, "loss": 2.1245, "step": 34197 }, { "epoch": 0.92, "learning_rate": 3.419066294941808e-05, "loss": 2.8245, "step": 34198 }, { "epoch": 0.92, "learning_rate": 3.4168101401132136e-05, "loss": 2.693, "step": 34199 }, { "epoch": 0.92, "learning_rate": 3.414554716981599e-05, "loss": 2.567, "step": 34200 }, { "epoch": 0.92, "learning_rate": 3.4123000255640525e-05, "loss": 2.4937, "step": 34201 }, { "epoch": 0.92, "learning_rate": 3.410046065877659e-05, "loss": 2.4418, "step": 34202 }, { "epoch": 0.92, "learning_rate": 3.407792837939483e-05, "loss": 2.4923, "step": 34203 }, { "epoch": 0.92, "learning_rate": 3.4055403417666e-05, "loss": 1.9661, "step": 34204 }, { "epoch": 0.92, "learning_rate": 3.403288577376074e-05, "loss": 2.715, "step": 34205 }, { "epoch": 0.92, "learning_rate": 3.4010375447849576e-05, "loss": 2.4722, "step": 34206 }, { "epoch": 0.92, "learning_rate": 3.398787244010326e-05, "loss": 2.5479, "step": 34207 }, { "epoch": 0.92, "learning_rate": 3.3965376750692e-05, "loss": 2.4338, "step": 34208 }, { "epoch": 0.92, "learning_rate": 3.394288837978632e-05, "loss": 2.2468, "step": 34209 }, { "epoch": 0.92, "learning_rate": 3.392040732755675e-05, "loss": 2.3912, "step": 34210 }, { "epoch": 0.92, "learning_rate": 3.3897933594173145e-05, "loss": 2.4485, "step": 34211 }, { "epoch": 0.92, "learning_rate": 3.387546717980627e-05, "loss": 2.5529, "step": 34212 }, { "epoch": 0.92, "learning_rate": 3.385300808462621e-05, "loss": 2.3931, "step": 34213 }, { "epoch": 0.92, "learning_rate": 3.383055630880294e-05, "loss": 2.3127, "step": 34214 }, { "epoch": 0.92, "learning_rate": 3.380811185250676e-05, "loss": 2.537, "step": 34215 }, { "epoch": 0.92, "learning_rate": 3.3785674715907436e-05, "loss": 2.5496, "step": 34216 }, { "epoch": 0.92, "learning_rate": 3.376324489917504e-05, "loss": 2.7822, "step": 34217 }, { "epoch": 0.92, "learning_rate": 3.3740822402479666e-05, "loss": 2.6835, "step": 34218 }, { "epoch": 0.92, "learning_rate": 3.3718407225991065e-05, "loss": 2.5648, "step": 34219 }, { "epoch": 0.92, "learning_rate": 3.3695999369878994e-05, "loss": 2.4303, "step": 34220 }, { "epoch": 0.92, "learning_rate": 3.367359883431342e-05, "loss": 2.1066, "step": 34221 }, { "epoch": 0.92, "learning_rate": 3.365120561946378e-05, "loss": 2.295, "step": 34222 }, { "epoch": 0.92, "learning_rate": 3.362881972549991e-05, "loss": 2.7351, "step": 34223 }, { "epoch": 0.92, "learning_rate": 3.360644115259115e-05, "loss": 2.6069, "step": 34224 }, { "epoch": 0.92, "learning_rate": 3.3584069900907344e-05, "loss": 2.5933, "step": 34225 }, { "epoch": 0.92, "learning_rate": 3.3561705970617915e-05, "loss": 2.5457, "step": 34226 }, { "epoch": 0.92, "learning_rate": 3.353934936189218e-05, "loss": 2.3999, "step": 34227 }, { "epoch": 0.92, "learning_rate": 3.351700007489944e-05, "loss": 2.7485, "step": 34228 }, { "epoch": 0.92, "learning_rate": 3.349465810980934e-05, "loss": 2.5504, "step": 34229 }, { "epoch": 0.92, "learning_rate": 3.347232346679074e-05, "loss": 2.4734, "step": 34230 }, { "epoch": 0.92, "learning_rate": 3.3449996146012965e-05, "loss": 2.2805, "step": 34231 }, { "epoch": 0.92, "learning_rate": 3.34276761476453e-05, "loss": 2.1178, "step": 34232 }, { "epoch": 0.92, "learning_rate": 3.340536347185674e-05, "loss": 2.4892, "step": 34233 }, { "epoch": 0.92, "learning_rate": 3.338305811881637e-05, "loss": 2.3344, "step": 34234 }, { "epoch": 0.92, "learning_rate": 3.336076008869316e-05, "loss": 2.217, "step": 34235 }, { "epoch": 0.92, "learning_rate": 3.3338469381655964e-05, "loss": 2.1977, "step": 34236 }, { "epoch": 0.92, "learning_rate": 3.331618599787367e-05, "loss": 2.3961, "step": 34237 }, { "epoch": 0.92, "learning_rate": 3.3293909937515136e-05, "loss": 2.0599, "step": 34238 }, { "epoch": 0.92, "learning_rate": 3.3271641200749106e-05, "loss": 2.4185, "step": 34239 }, { "epoch": 0.92, "learning_rate": 3.324937978774434e-05, "loss": 2.1016, "step": 34240 }, { "epoch": 0.92, "learning_rate": 3.322712569866948e-05, "loss": 2.0908, "step": 34241 }, { "epoch": 0.92, "learning_rate": 3.320487893369306e-05, "loss": 2.6877, "step": 34242 }, { "epoch": 0.92, "learning_rate": 3.31826394929835e-05, "loss": 2.4583, "step": 34243 }, { "epoch": 0.92, "learning_rate": 3.316040737670945e-05, "loss": 2.5678, "step": 34244 }, { "epoch": 0.92, "learning_rate": 3.313818258503931e-05, "loss": 2.4569, "step": 34245 }, { "epoch": 0.92, "learning_rate": 3.311596511814152e-05, "loss": 2.7218, "step": 34246 }, { "epoch": 0.92, "learning_rate": 3.3093754976184166e-05, "loss": 2.4752, "step": 34247 }, { "epoch": 0.92, "learning_rate": 3.307155215933588e-05, "loss": 2.3238, "step": 34248 }, { "epoch": 0.92, "learning_rate": 3.304935666776443e-05, "loss": 2.3228, "step": 34249 }, { "epoch": 0.92, "learning_rate": 3.3027168501638336e-05, "loss": 2.2141, "step": 34250 }, { "epoch": 0.92, "learning_rate": 3.300498766112536e-05, "loss": 2.1585, "step": 34251 }, { "epoch": 0.92, "learning_rate": 3.298281414639381e-05, "loss": 2.5647, "step": 34252 }, { "epoch": 0.92, "learning_rate": 3.296064795761167e-05, "loss": 2.3575, "step": 34253 }, { "epoch": 0.92, "learning_rate": 3.293848909494668e-05, "loss": 2.2322, "step": 34254 }, { "epoch": 0.92, "learning_rate": 3.291633755856682e-05, "loss": 2.65, "step": 34255 }, { "epoch": 0.92, "learning_rate": 3.289419334863997e-05, "loss": 2.4601, "step": 34256 }, { "epoch": 0.92, "learning_rate": 3.287205646533364e-05, "loss": 2.6751, "step": 34257 }, { "epoch": 0.92, "learning_rate": 3.2849926908815717e-05, "loss": 2.4168, "step": 34258 }, { "epoch": 0.92, "learning_rate": 3.282780467925395e-05, "loss": 2.6855, "step": 34259 }, { "epoch": 0.92, "learning_rate": 3.280568977681564e-05, "loss": 2.3859, "step": 34260 }, { "epoch": 0.92, "learning_rate": 3.278358220166877e-05, "loss": 2.3129, "step": 34261 }, { "epoch": 0.92, "learning_rate": 3.2761481953980434e-05, "loss": 2.127, "step": 34262 }, { "epoch": 0.92, "learning_rate": 3.273938903391816e-05, "loss": 2.2558, "step": 34263 }, { "epoch": 0.92, "learning_rate": 3.271730344164925e-05, "loss": 2.0568, "step": 34264 }, { "epoch": 0.92, "learning_rate": 3.269522517734125e-05, "loss": 2.5826, "step": 34265 }, { "epoch": 0.92, "learning_rate": 3.267315424116135e-05, "loss": 2.3316, "step": 34266 }, { "epoch": 0.92, "learning_rate": 3.2651090633276535e-05, "loss": 2.7386, "step": 34267 }, { "epoch": 0.92, "learning_rate": 3.262903435385422e-05, "loss": 2.4545, "step": 34268 }, { "epoch": 0.92, "learning_rate": 3.2606985403061394e-05, "loss": 2.2759, "step": 34269 }, { "epoch": 0.92, "learning_rate": 3.258494378106502e-05, "loss": 2.5952, "step": 34270 }, { "epoch": 0.92, "learning_rate": 3.256290948803209e-05, "loss": 2.6091, "step": 34271 }, { "epoch": 0.92, "learning_rate": 3.254088252412968e-05, "loss": 2.1724, "step": 34272 }, { "epoch": 0.92, "learning_rate": 3.251886288952466e-05, "loss": 2.391, "step": 34273 }, { "epoch": 0.92, "learning_rate": 3.249685058438368e-05, "loss": 2.0497, "step": 34274 }, { "epoch": 0.92, "learning_rate": 3.2474845608873594e-05, "loss": 2.5582, "step": 34275 }, { "epoch": 0.92, "learning_rate": 3.245284796316106e-05, "loss": 2.559, "step": 34276 }, { "epoch": 0.92, "learning_rate": 3.2430857647412825e-05, "loss": 2.7127, "step": 34277 }, { "epoch": 0.92, "learning_rate": 3.240887466179543e-05, "loss": 2.2429, "step": 34278 }, { "epoch": 0.92, "learning_rate": 3.23868990064754e-05, "loss": 2.7826, "step": 34279 }, { "epoch": 0.92, "learning_rate": 3.236493068161927e-05, "loss": 2.6164, "step": 34280 }, { "epoch": 0.92, "learning_rate": 3.2342969687393366e-05, "loss": 2.7339, "step": 34281 }, { "epoch": 0.92, "learning_rate": 3.232101602396409e-05, "loss": 2.2826, "step": 34282 }, { "epoch": 0.92, "learning_rate": 3.2299069691497985e-05, "loss": 2.5355, "step": 34283 }, { "epoch": 0.92, "learning_rate": 3.2277130690160804e-05, "loss": 2.362, "step": 34284 }, { "epoch": 0.92, "learning_rate": 3.225519902011931e-05, "loss": 2.4908, "step": 34285 }, { "epoch": 0.92, "learning_rate": 3.223327468153936e-05, "loss": 2.6209, "step": 34286 }, { "epoch": 0.92, "learning_rate": 3.221135767458705e-05, "loss": 2.5852, "step": 34287 }, { "epoch": 0.92, "learning_rate": 3.2189447999428576e-05, "loss": 2.7691, "step": 34288 }, { "epoch": 0.92, "learning_rate": 3.21675456562297e-05, "loss": 2.4086, "step": 34289 }, { "epoch": 0.92, "learning_rate": 3.214565064515651e-05, "loss": 2.3319, "step": 34290 }, { "epoch": 0.92, "learning_rate": 3.212376296637476e-05, "loss": 2.2036, "step": 34291 }, { "epoch": 0.92, "learning_rate": 3.210188262005043e-05, "loss": 2.6823, "step": 34292 }, { "epoch": 0.92, "learning_rate": 3.208000960634927e-05, "loss": 1.8716, "step": 34293 }, { "epoch": 0.92, "learning_rate": 3.2058143925436826e-05, "loss": 2.4115, "step": 34294 }, { "epoch": 0.92, "learning_rate": 3.203628557747873e-05, "loss": 2.4427, "step": 34295 }, { "epoch": 0.92, "learning_rate": 3.201443456264086e-05, "loss": 2.5847, "step": 34296 }, { "epoch": 0.92, "learning_rate": 3.199259088108841e-05, "loss": 2.1549, "step": 34297 }, { "epoch": 0.92, "learning_rate": 3.1970754532987035e-05, "loss": 2.3145, "step": 34298 }, { "epoch": 0.92, "learning_rate": 3.194892551850237e-05, "loss": 2.49, "step": 34299 }, { "epoch": 0.92, "learning_rate": 3.1927103837799397e-05, "loss": 3.1, "step": 34300 }, { "epoch": 0.92, "learning_rate": 3.190528949104377e-05, "loss": 2.5305, "step": 34301 }, { "epoch": 0.92, "learning_rate": 3.188348247840045e-05, "loss": 2.1769, "step": 34302 }, { "epoch": 0.92, "learning_rate": 3.1861682800034766e-05, "loss": 2.7827, "step": 34303 }, { "epoch": 0.92, "learning_rate": 3.18398904561118e-05, "loss": 3.0173, "step": 34304 }, { "epoch": 0.92, "learning_rate": 3.181810544679686e-05, "loss": 2.4624, "step": 34305 }, { "epoch": 0.92, "learning_rate": 3.179632777225483e-05, "loss": 2.4585, "step": 34306 }, { "epoch": 0.92, "learning_rate": 3.1774557432650783e-05, "loss": 2.6171, "step": 34307 }, { "epoch": 0.92, "learning_rate": 3.1752794428149604e-05, "loss": 2.305, "step": 34308 }, { "epoch": 0.92, "learning_rate": 3.173103875891603e-05, "loss": 2.6755, "step": 34309 }, { "epoch": 0.92, "learning_rate": 3.170929042511506e-05, "loss": 2.6526, "step": 34310 }, { "epoch": 0.92, "learning_rate": 3.168754942691132e-05, "loss": 2.6508, "step": 34311 }, { "epoch": 0.92, "learning_rate": 3.1665815764469805e-05, "loss": 3.001, "step": 34312 }, { "epoch": 0.92, "learning_rate": 3.164408943795471e-05, "loss": 2.0455, "step": 34313 }, { "epoch": 0.92, "learning_rate": 3.162237044753091e-05, "loss": 2.1195, "step": 34314 }, { "epoch": 0.92, "learning_rate": 3.1600658793363045e-05, "loss": 2.2403, "step": 34315 }, { "epoch": 0.92, "learning_rate": 3.157895447561532e-05, "loss": 2.7256, "step": 34316 }, { "epoch": 0.92, "learning_rate": 3.155725749445237e-05, "loss": 2.4429, "step": 34317 }, { "epoch": 0.92, "learning_rate": 3.1535567850038416e-05, "loss": 2.8138, "step": 34318 }, { "epoch": 0.92, "learning_rate": 3.1513885542537866e-05, "loss": 2.0346, "step": 34319 }, { "epoch": 0.92, "learning_rate": 3.1492210572115154e-05, "loss": 2.4544, "step": 34320 }, { "epoch": 0.92, "learning_rate": 3.147054293893414e-05, "loss": 2.6106, "step": 34321 }, { "epoch": 0.92, "learning_rate": 3.1448882643159036e-05, "loss": 2.2489, "step": 34322 }, { "epoch": 0.92, "learning_rate": 3.142722968495415e-05, "loss": 2.2881, "step": 34323 }, { "epoch": 0.92, "learning_rate": 3.140558406448335e-05, "loss": 2.2133, "step": 34324 }, { "epoch": 0.92, "learning_rate": 3.138394578191073e-05, "loss": 2.5335, "step": 34325 }, { "epoch": 0.92, "learning_rate": 3.1362314837400266e-05, "loss": 2.8297, "step": 34326 }, { "epoch": 0.92, "learning_rate": 3.13406912311156e-05, "loss": 2.5126, "step": 34327 }, { "epoch": 0.92, "learning_rate": 3.131907496322084e-05, "loss": 2.3069, "step": 34328 }, { "epoch": 0.92, "learning_rate": 3.12974660338794e-05, "loss": 2.3053, "step": 34329 }, { "epoch": 0.92, "learning_rate": 3.1275864443255145e-05, "loss": 2.2452, "step": 34330 }, { "epoch": 0.92, "learning_rate": 3.125427019151183e-05, "loss": 2.0665, "step": 34331 }, { "epoch": 0.92, "learning_rate": 3.12326832788129e-05, "loss": 2.5462, "step": 34332 }, { "epoch": 0.92, "learning_rate": 3.12111037053221e-05, "loss": 2.6116, "step": 34333 }, { "epoch": 0.92, "learning_rate": 3.1189531471202736e-05, "loss": 2.8468, "step": 34334 }, { "epoch": 0.92, "learning_rate": 3.1167966576618245e-05, "loss": 2.393, "step": 34335 }, { "epoch": 0.92, "learning_rate": 3.114640902173193e-05, "loss": 2.6392, "step": 34336 }, { "epoch": 0.92, "learning_rate": 3.1124858806707344e-05, "loss": 2.5511, "step": 34337 }, { "epoch": 0.92, "learning_rate": 3.110331593170756e-05, "loss": 2.5089, "step": 34338 }, { "epoch": 0.92, "learning_rate": 3.108178039689591e-05, "loss": 2.2785, "step": 34339 }, { "epoch": 0.92, "learning_rate": 3.106025220243536e-05, "loss": 2.7272, "step": 34340 }, { "epoch": 0.92, "learning_rate": 3.103873134848911e-05, "loss": 2.7227, "step": 34341 }, { "epoch": 0.92, "learning_rate": 3.101721783522027e-05, "loss": 2.3653, "step": 34342 }, { "epoch": 0.92, "learning_rate": 3.099571166279169e-05, "loss": 2.5273, "step": 34343 }, { "epoch": 0.92, "learning_rate": 3.097421283136637e-05, "loss": 2.2897, "step": 34344 }, { "epoch": 0.92, "learning_rate": 3.095272134110716e-05, "loss": 2.496, "step": 34345 }, { "epoch": 0.92, "learning_rate": 3.093123719217683e-05, "loss": 2.3054, "step": 34346 }, { "epoch": 0.92, "learning_rate": 3.090976038473836e-05, "loss": 2.7093, "step": 34347 }, { "epoch": 0.92, "learning_rate": 3.0888290918954176e-05, "loss": 2.2965, "step": 34348 }, { "epoch": 0.92, "learning_rate": 3.086682879498703e-05, "loss": 2.4462, "step": 34349 }, { "epoch": 0.92, "learning_rate": 3.084537401299947e-05, "loss": 2.3326, "step": 34350 }, { "epoch": 0.92, "learning_rate": 3.082392657315414e-05, "loss": 2.7982, "step": 34351 }, { "epoch": 0.92, "learning_rate": 3.0802486475613456e-05, "loss": 2.8469, "step": 34352 }, { "epoch": 0.92, "learning_rate": 3.0781053720540076e-05, "loss": 2.4293, "step": 34353 }, { "epoch": 0.92, "learning_rate": 3.075962830809587e-05, "loss": 2.6909, "step": 34354 }, { "epoch": 0.92, "learning_rate": 3.0738210238443695e-05, "loss": 2.5283, "step": 34355 }, { "epoch": 0.92, "learning_rate": 3.071679951174533e-05, "loss": 1.8682, "step": 34356 }, { "epoch": 0.92, "learning_rate": 3.069539612816308e-05, "loss": 2.6645, "step": 34357 }, { "epoch": 0.92, "learning_rate": 3.067400008785948e-05, "loss": 2.2097, "step": 34358 }, { "epoch": 0.92, "learning_rate": 3.0652611390996285e-05, "loss": 2.7456, "step": 34359 }, { "epoch": 0.92, "learning_rate": 3.0631230037735604e-05, "loss": 1.9594, "step": 34360 }, { "epoch": 0.92, "learning_rate": 3.0609856028239515e-05, "loss": 2.5819, "step": 34361 }, { "epoch": 0.92, "learning_rate": 3.058848936266967e-05, "loss": 3.0622, "step": 34362 }, { "epoch": 0.92, "learning_rate": 3.0567130041188166e-05, "loss": 2.7801, "step": 34363 }, { "epoch": 0.92, "learning_rate": 3.0545778063956755e-05, "loss": 2.4503, "step": 34364 }, { "epoch": 0.92, "learning_rate": 3.05244334311372e-05, "loss": 2.0599, "step": 34365 }, { "epoch": 0.92, "learning_rate": 3.0503096142891373e-05, "loss": 2.3695, "step": 34366 }, { "epoch": 0.92, "learning_rate": 3.048176619938059e-05, "loss": 2.1592, "step": 34367 }, { "epoch": 0.92, "learning_rate": 3.0460443600766607e-05, "loss": 2.6355, "step": 34368 }, { "epoch": 0.92, "learning_rate": 3.0439128347211075e-05, "loss": 2.2249, "step": 34369 }, { "epoch": 0.92, "learning_rate": 3.04178204388752e-05, "loss": 2.0888, "step": 34370 }, { "epoch": 0.92, "learning_rate": 3.0396519875920736e-05, "loss": 2.7724, "step": 34371 }, { "epoch": 0.92, "learning_rate": 3.037522665850878e-05, "loss": 2.5014, "step": 34372 }, { "epoch": 0.92, "learning_rate": 3.035394078680076e-05, "loss": 2.7146, "step": 34373 }, { "epoch": 0.92, "learning_rate": 3.03326622609581e-05, "loss": 2.7001, "step": 34374 }, { "epoch": 0.92, "learning_rate": 3.031139108114167e-05, "loss": 2.6657, "step": 34375 }, { "epoch": 0.92, "learning_rate": 3.029012724751279e-05, "loss": 2.5364, "step": 34376 }, { "epoch": 0.92, "learning_rate": 3.0268870760232547e-05, "loss": 2.6583, "step": 34377 }, { "epoch": 0.92, "learning_rate": 3.024762161946193e-05, "loss": 2.4551, "step": 34378 }, { "epoch": 0.92, "learning_rate": 3.022637982536214e-05, "loss": 2.3435, "step": 34379 }, { "epoch": 0.92, "learning_rate": 3.020514537809371e-05, "loss": 2.5485, "step": 34380 }, { "epoch": 0.92, "learning_rate": 3.0183918277817747e-05, "loss": 2.5885, "step": 34381 }, { "epoch": 0.92, "learning_rate": 3.0162698524695108e-05, "loss": 2.2215, "step": 34382 }, { "epoch": 0.92, "learning_rate": 3.014148611888634e-05, "loss": 2.4085, "step": 34383 }, { "epoch": 0.92, "learning_rate": 3.0120281060552422e-05, "loss": 2.1085, "step": 34384 }, { "epoch": 0.92, "learning_rate": 3.0099083349853896e-05, "loss": 2.3783, "step": 34385 }, { "epoch": 0.92, "learning_rate": 3.0077892986951183e-05, "loss": 2.1658, "step": 34386 }, { "epoch": 0.92, "learning_rate": 3.0056709972004935e-05, "loss": 2.3896, "step": 34387 }, { "epoch": 0.92, "learning_rate": 3.0035534305175803e-05, "loss": 2.3656, "step": 34388 }, { "epoch": 0.92, "learning_rate": 3.001436598662388e-05, "loss": 2.4383, "step": 34389 }, { "epoch": 0.92, "learning_rate": 2.9993205016509817e-05, "loss": 2.5283, "step": 34390 }, { "epoch": 0.92, "learning_rate": 2.9972051394993706e-05, "loss": 2.6826, "step": 34391 }, { "epoch": 0.92, "learning_rate": 2.995090512223597e-05, "loss": 3.124, "step": 34392 }, { "epoch": 0.92, "learning_rate": 2.9929766198396824e-05, "loss": 2.4284, "step": 34393 }, { "epoch": 0.92, "learning_rate": 2.9908634623636244e-05, "loss": 2.6074, "step": 34394 }, { "epoch": 0.92, "learning_rate": 2.9887510398114327e-05, "loss": 2.0238, "step": 34395 }, { "epoch": 0.92, "learning_rate": 2.9866393521991274e-05, "loss": 2.2751, "step": 34396 }, { "epoch": 0.92, "learning_rate": 2.9845283995426964e-05, "loss": 2.2242, "step": 34397 }, { "epoch": 0.92, "learning_rate": 2.9824181818581486e-05, "loss": 2.7513, "step": 34398 }, { "epoch": 0.92, "learning_rate": 2.980308699161438e-05, "loss": 2.0794, "step": 34399 }, { "epoch": 0.92, "learning_rate": 2.978199951468574e-05, "loss": 2.2427, "step": 34400 }, { "epoch": 0.92, "learning_rate": 2.9760919387955222e-05, "loss": 2.7029, "step": 34401 }, { "epoch": 0.92, "learning_rate": 2.9739846611582466e-05, "loss": 2.7445, "step": 34402 }, { "epoch": 0.92, "learning_rate": 2.9718781185727016e-05, "loss": 2.2899, "step": 34403 }, { "epoch": 0.92, "learning_rate": 2.9697723110548748e-05, "loss": 2.2477, "step": 34404 }, { "epoch": 0.92, "learning_rate": 2.967667238620708e-05, "loss": 2.0356, "step": 34405 }, { "epoch": 0.92, "learning_rate": 2.9655629012861562e-05, "loss": 2.3374, "step": 34406 }, { "epoch": 0.92, "learning_rate": 2.9634592990671284e-05, "loss": 2.6499, "step": 34407 }, { "epoch": 0.92, "learning_rate": 2.9613564319796004e-05, "loss": 2.6305, "step": 34408 }, { "epoch": 0.92, "learning_rate": 2.959254300039482e-05, "loss": 2.2925, "step": 34409 }, { "epoch": 0.92, "learning_rate": 2.9571529032626942e-05, "loss": 2.377, "step": 34410 }, { "epoch": 0.92, "learning_rate": 2.955052241665179e-05, "loss": 3.0024, "step": 34411 }, { "epoch": 0.92, "learning_rate": 2.9529523152628468e-05, "loss": 2.5206, "step": 34412 }, { "epoch": 0.92, "learning_rate": 2.950853124071573e-05, "loss": 2.4222, "step": 34413 }, { "epoch": 0.92, "learning_rate": 2.948754668107312e-05, "loss": 2.5084, "step": 34414 }, { "epoch": 0.92, "learning_rate": 2.9466569473859174e-05, "loss": 2.5824, "step": 34415 }, { "epoch": 0.92, "learning_rate": 2.9445599619232877e-05, "loss": 2.6461, "step": 34416 }, { "epoch": 0.92, "learning_rate": 2.9424637117353437e-05, "loss": 2.4136, "step": 34417 }, { "epoch": 0.92, "learning_rate": 2.9403681968379283e-05, "loss": 2.2757, "step": 34418 }, { "epoch": 0.92, "learning_rate": 2.9382734172469395e-05, "loss": 2.334, "step": 34419 }, { "epoch": 0.92, "learning_rate": 2.9361793729782315e-05, "loss": 2.3674, "step": 34420 }, { "epoch": 0.93, "learning_rate": 2.9340860640476807e-05, "loss": 2.2887, "step": 34421 }, { "epoch": 0.93, "learning_rate": 2.93199349047113e-05, "loss": 2.5606, "step": 34422 }, { "epoch": 0.93, "learning_rate": 2.9299016522644552e-05, "loss": 2.615, "step": 34423 }, { "epoch": 0.93, "learning_rate": 2.9278105494434772e-05, "loss": 2.3485, "step": 34424 }, { "epoch": 0.93, "learning_rate": 2.925720182024072e-05, "loss": 2.7729, "step": 34425 }, { "epoch": 0.93, "learning_rate": 2.9236305500220383e-05, "loss": 2.2661, "step": 34426 }, { "epoch": 0.93, "learning_rate": 2.9215416534532303e-05, "loss": 2.4254, "step": 34427 }, { "epoch": 0.93, "learning_rate": 2.919453492333468e-05, "loss": 2.3464, "step": 34428 }, { "epoch": 0.93, "learning_rate": 2.9173660666785507e-05, "loss": 2.5531, "step": 34429 }, { "epoch": 0.93, "learning_rate": 2.9152793765043316e-05, "loss": 2.251, "step": 34430 }, { "epoch": 0.93, "learning_rate": 2.913193421826599e-05, "loss": 2.9119, "step": 34431 }, { "epoch": 0.93, "learning_rate": 2.9111082026611502e-05, "loss": 2.6299, "step": 34432 }, { "epoch": 0.93, "learning_rate": 2.9090237190237955e-05, "loss": 2.4153, "step": 34433 }, { "epoch": 0.93, "learning_rate": 2.9069399709303114e-05, "loss": 2.6757, "step": 34434 }, { "epoch": 0.93, "learning_rate": 2.9048569583964846e-05, "loss": 2.9035, "step": 34435 }, { "epoch": 0.93, "learning_rate": 2.902774681438114e-05, "loss": 2.5132, "step": 34436 }, { "epoch": 0.93, "learning_rate": 2.9006931400709535e-05, "loss": 2.5484, "step": 34437 }, { "epoch": 0.93, "learning_rate": 2.8986123343107795e-05, "loss": 2.5781, "step": 34438 }, { "epoch": 0.93, "learning_rate": 2.8965322641733793e-05, "loss": 2.5975, "step": 34439 }, { "epoch": 0.93, "learning_rate": 2.894452929674474e-05, "loss": 2.8242, "step": 34440 }, { "epoch": 0.93, "learning_rate": 2.8923743308298502e-05, "loss": 2.4794, "step": 34441 }, { "epoch": 0.93, "learning_rate": 2.890296467655207e-05, "loss": 2.5565, "step": 34442 }, { "epoch": 0.93, "learning_rate": 2.8882193401663315e-05, "loss": 2.4951, "step": 34443 }, { "epoch": 0.93, "learning_rate": 2.8861429483789448e-05, "loss": 2.1637, "step": 34444 }, { "epoch": 0.93, "learning_rate": 2.8840672923087785e-05, "loss": 2.1403, "step": 34445 }, { "epoch": 0.93, "learning_rate": 2.8819923719715535e-05, "loss": 2.569, "step": 34446 }, { "epoch": 0.93, "learning_rate": 2.8799181873830015e-05, "loss": 2.7681, "step": 34447 }, { "epoch": 0.93, "learning_rate": 2.87784473855881e-05, "loss": 2.1939, "step": 34448 }, { "epoch": 0.93, "learning_rate": 2.8757720255147112e-05, "loss": 2.5293, "step": 34449 }, { "epoch": 0.93, "learning_rate": 2.8737000482663923e-05, "loss": 2.551, "step": 34450 }, { "epoch": 0.93, "learning_rate": 2.8716288068295625e-05, "loss": 2.3824, "step": 34451 }, { "epoch": 0.93, "learning_rate": 2.86955830121991e-05, "loss": 1.983, "step": 34452 }, { "epoch": 0.93, "learning_rate": 2.8674885314531107e-05, "loss": 2.4122, "step": 34453 }, { "epoch": 0.93, "learning_rate": 2.8654194975448632e-05, "loss": 2.46, "step": 34454 }, { "epoch": 0.93, "learning_rate": 2.8633511995108218e-05, "loss": 2.4982, "step": 34455 }, { "epoch": 0.93, "learning_rate": 2.861283637366663e-05, "loss": 2.801, "step": 34456 }, { "epoch": 0.93, "learning_rate": 2.8592168111280735e-05, "loss": 2.279, "step": 34457 }, { "epoch": 0.93, "learning_rate": 2.857150720810675e-05, "loss": 2.8221, "step": 34458 }, { "epoch": 0.93, "learning_rate": 2.8550853664301323e-05, "loss": 2.5899, "step": 34459 }, { "epoch": 0.93, "learning_rate": 2.853020748002111e-05, "loss": 2.839, "step": 34460 }, { "epoch": 0.93, "learning_rate": 2.8509568655422204e-05, "loss": 2.7275, "step": 34461 }, { "epoch": 0.93, "learning_rate": 2.8488937190661145e-05, "loss": 2.5099, "step": 34462 }, { "epoch": 0.93, "learning_rate": 2.8468313085894147e-05, "loss": 2.6753, "step": 34463 }, { "epoch": 0.93, "learning_rate": 2.8447696341277528e-05, "loss": 2.4359, "step": 34464 }, { "epoch": 0.93, "learning_rate": 2.8427086956967496e-05, "loss": 2.4591, "step": 34465 }, { "epoch": 0.93, "learning_rate": 2.840648493312026e-05, "loss": 2.3459, "step": 34466 }, { "epoch": 0.93, "learning_rate": 2.8385890269891688e-05, "loss": 2.6119, "step": 34467 }, { "epoch": 0.93, "learning_rate": 2.8365302967438e-05, "loss": 3.1195, "step": 34468 }, { "epoch": 0.93, "learning_rate": 2.8344723025914952e-05, "loss": 2.6563, "step": 34469 }, { "epoch": 0.93, "learning_rate": 2.8324150445478536e-05, "loss": 2.3791, "step": 34470 }, { "epoch": 0.93, "learning_rate": 2.8303585226284845e-05, "loss": 2.5134, "step": 34471 }, { "epoch": 0.93, "learning_rate": 2.828302736848931e-05, "loss": 2.8546, "step": 34472 }, { "epoch": 0.93, "learning_rate": 2.826247687224781e-05, "loss": 2.3282, "step": 34473 }, { "epoch": 0.93, "learning_rate": 2.8241933737716107e-05, "loss": 2.7975, "step": 34474 }, { "epoch": 0.93, "learning_rate": 2.8221397965049857e-05, "loss": 2.96, "step": 34475 }, { "epoch": 0.93, "learning_rate": 2.8200869554404373e-05, "loss": 2.7134, "step": 34476 }, { "epoch": 0.93, "learning_rate": 2.8180348505935425e-05, "loss": 2.42, "step": 34477 }, { "epoch": 0.93, "learning_rate": 2.8159834819798447e-05, "loss": 2.2732, "step": 34478 }, { "epoch": 0.93, "learning_rate": 2.8139328496148864e-05, "loss": 2.4363, "step": 34479 }, { "epoch": 0.93, "learning_rate": 2.811882953514189e-05, "loss": 2.2786, "step": 34480 }, { "epoch": 0.93, "learning_rate": 2.8098337936932948e-05, "loss": 2.0764, "step": 34481 }, { "epoch": 0.93, "learning_rate": 2.8077853701677258e-05, "loss": 2.5453, "step": 34482 }, { "epoch": 0.93, "learning_rate": 2.8057376829529914e-05, "loss": 2.7539, "step": 34483 }, { "epoch": 0.93, "learning_rate": 2.803690732064623e-05, "loss": 1.9546, "step": 34484 }, { "epoch": 0.93, "learning_rate": 2.8016445175181092e-05, "loss": 2.0198, "step": 34485 }, { "epoch": 0.93, "learning_rate": 2.7995990393289595e-05, "loss": 2.3904, "step": 34486 }, { "epoch": 0.93, "learning_rate": 2.7975542975126723e-05, "loss": 2.7937, "step": 34487 }, { "epoch": 0.93, "learning_rate": 2.7955102920847354e-05, "loss": 2.425, "step": 34488 }, { "epoch": 0.93, "learning_rate": 2.793467023060614e-05, "loss": 2.8501, "step": 34489 }, { "epoch": 0.93, "learning_rate": 2.7914244904558294e-05, "loss": 2.5746, "step": 34490 }, { "epoch": 0.93, "learning_rate": 2.789382694285836e-05, "loss": 2.0855, "step": 34491 }, { "epoch": 0.93, "learning_rate": 2.7873416345660983e-05, "loss": 2.6952, "step": 34492 }, { "epoch": 0.93, "learning_rate": 2.7853013113120716e-05, "loss": 2.9099, "step": 34493 }, { "epoch": 0.93, "learning_rate": 2.7832617245392213e-05, "loss": 2.5382, "step": 34494 }, { "epoch": 0.93, "learning_rate": 2.781222874263001e-05, "loss": 2.5222, "step": 34495 }, { "epoch": 0.93, "learning_rate": 2.779184760498854e-05, "loss": 2.5806, "step": 34496 }, { "epoch": 0.93, "learning_rate": 2.777147383262224e-05, "loss": 2.5175, "step": 34497 }, { "epoch": 0.93, "learning_rate": 2.775110742568554e-05, "loss": 2.1067, "step": 34498 }, { "epoch": 0.93, "learning_rate": 2.773074838433254e-05, "loss": 2.6634, "step": 34499 }, { "epoch": 0.93, "learning_rate": 2.7710396708717557e-05, "loss": 2.3241, "step": 34500 }, { "epoch": 0.93, "learning_rate": 2.7690052398994802e-05, "loss": 2.6821, "step": 34501 }, { "epoch": 0.93, "learning_rate": 2.7669715455318266e-05, "loss": 2.7541, "step": 34502 }, { "epoch": 0.93, "learning_rate": 2.764938587784227e-05, "loss": 2.211, "step": 34503 }, { "epoch": 0.93, "learning_rate": 2.7629063666720576e-05, "loss": 2.3132, "step": 34504 }, { "epoch": 0.93, "learning_rate": 2.76087488221074e-05, "loss": 2.7835, "step": 34505 }, { "epoch": 0.93, "learning_rate": 2.758844134415639e-05, "loss": 2.6811, "step": 34506 }, { "epoch": 0.93, "learning_rate": 2.756814123302154e-05, "loss": 2.3954, "step": 34507 }, { "epoch": 0.93, "learning_rate": 2.7547848488856607e-05, "loss": 2.104, "step": 34508 }, { "epoch": 0.93, "learning_rate": 2.7527563111815257e-05, "loss": 1.9561, "step": 34509 }, { "epoch": 0.93, "learning_rate": 2.750728510205114e-05, "loss": 2.3091, "step": 34510 }, { "epoch": 0.93, "learning_rate": 2.748701445971824e-05, "loss": 2.7439, "step": 34511 }, { "epoch": 0.93, "learning_rate": 2.7466751184969663e-05, "loss": 2.4177, "step": 34512 }, { "epoch": 0.93, "learning_rate": 2.744649527795906e-05, "loss": 2.5483, "step": 34513 }, { "epoch": 0.93, "learning_rate": 2.7426246738840088e-05, "loss": 2.4182, "step": 34514 }, { "epoch": 0.93, "learning_rate": 2.7406005567765848e-05, "loss": 2.6696, "step": 34515 }, { "epoch": 0.93, "learning_rate": 2.7385771764889768e-05, "loss": 2.4559, "step": 34516 }, { "epoch": 0.93, "learning_rate": 2.7365545330365395e-05, "loss": 2.5639, "step": 34517 }, { "epoch": 0.93, "learning_rate": 2.7345326264345717e-05, "loss": 2.3441, "step": 34518 }, { "epoch": 0.93, "learning_rate": 2.7325114566983945e-05, "loss": 2.5804, "step": 34519 }, { "epoch": 0.93, "learning_rate": 2.730491023843318e-05, "loss": 2.6398, "step": 34520 }, { "epoch": 0.93, "learning_rate": 2.7284713278846518e-05, "loss": 2.364, "step": 34521 }, { "epoch": 0.93, "learning_rate": 2.7264523688376953e-05, "loss": 2.4369, "step": 34522 }, { "epoch": 0.93, "learning_rate": 2.7244341467177358e-05, "loss": 2.81, "step": 34523 }, { "epoch": 0.93, "learning_rate": 2.7224166615400837e-05, "loss": 2.482, "step": 34524 }, { "epoch": 0.93, "learning_rate": 2.7203999133200152e-05, "loss": 2.7028, "step": 34525 }, { "epoch": 0.93, "learning_rate": 2.7183839020727962e-05, "loss": 2.8997, "step": 34526 }, { "epoch": 0.93, "learning_rate": 2.7163686278137147e-05, "loss": 2.7228, "step": 34527 }, { "epoch": 0.93, "learning_rate": 2.7143540905580134e-05, "loss": 2.5718, "step": 34528 }, { "epoch": 0.93, "learning_rate": 2.7123402903209915e-05, "loss": 2.3402, "step": 34529 }, { "epoch": 0.93, "learning_rate": 2.7103272271178813e-05, "loss": 2.5078, "step": 34530 }, { "epoch": 0.93, "learning_rate": 2.7083149009639373e-05, "loss": 2.6669, "step": 34531 }, { "epoch": 0.93, "learning_rate": 2.706303311874403e-05, "loss": 2.6896, "step": 34532 }, { "epoch": 0.93, "learning_rate": 2.7042924598645323e-05, "loss": 2.7562, "step": 34533 }, { "epoch": 0.93, "learning_rate": 2.702282344949547e-05, "loss": 2.2348, "step": 34534 }, { "epoch": 0.93, "learning_rate": 2.700272967144657e-05, "loss": 1.8458, "step": 34535 }, { "epoch": 0.93, "learning_rate": 2.6982643264651164e-05, "loss": 2.8044, "step": 34536 }, { "epoch": 0.93, "learning_rate": 2.6962564229261244e-05, "loss": 2.3488, "step": 34537 }, { "epoch": 0.93, "learning_rate": 2.694249256542902e-05, "loss": 2.7327, "step": 34538 }, { "epoch": 0.93, "learning_rate": 2.6922428273306488e-05, "loss": 2.612, "step": 34539 }, { "epoch": 0.93, "learning_rate": 2.690237135304563e-05, "loss": 2.5609, "step": 34540 }, { "epoch": 0.93, "learning_rate": 2.6882321804798437e-05, "loss": 2.4623, "step": 34541 }, { "epoch": 0.93, "learning_rate": 2.686227962871679e-05, "loss": 2.4561, "step": 34542 }, { "epoch": 0.93, "learning_rate": 2.6842244824952566e-05, "loss": 2.7331, "step": 34543 }, { "epoch": 0.93, "learning_rate": 2.6822217393657643e-05, "loss": 2.4697, "step": 34544 }, { "epoch": 0.93, "learning_rate": 2.680219733498346e-05, "loss": 2.2467, "step": 34545 }, { "epoch": 0.93, "learning_rate": 2.6782184649081885e-05, "loss": 2.6081, "step": 34546 }, { "epoch": 0.93, "learning_rate": 2.6762179336104475e-05, "loss": 2.3645, "step": 34547 }, { "epoch": 0.93, "learning_rate": 2.6742181396202657e-05, "loss": 2.6128, "step": 34548 }, { "epoch": 0.93, "learning_rate": 2.6722190829528316e-05, "loss": 2.6501, "step": 34549 }, { "epoch": 0.93, "learning_rate": 2.6702207636232433e-05, "loss": 2.625, "step": 34550 }, { "epoch": 0.93, "learning_rate": 2.6682231816466674e-05, "loss": 2.6784, "step": 34551 }, { "epoch": 0.93, "learning_rate": 2.6662263370382465e-05, "loss": 2.8477, "step": 34552 }, { "epoch": 0.93, "learning_rate": 2.6642302298130806e-05, "loss": 2.5262, "step": 34553 }, { "epoch": 0.93, "learning_rate": 2.662234859986301e-05, "loss": 2.1388, "step": 34554 }, { "epoch": 0.93, "learning_rate": 2.66024022757303e-05, "loss": 2.6681, "step": 34555 }, { "epoch": 0.93, "learning_rate": 2.6582463325883767e-05, "loss": 2.4973, "step": 34556 }, { "epoch": 0.93, "learning_rate": 2.6562531750474627e-05, "loss": 2.5271, "step": 34557 }, { "epoch": 0.93, "learning_rate": 2.6542607549653542e-05, "loss": 2.8266, "step": 34558 }, { "epoch": 0.93, "learning_rate": 2.652269072357161e-05, "loss": 2.5395, "step": 34559 }, { "epoch": 0.93, "learning_rate": 2.6502781272379817e-05, "loss": 2.3661, "step": 34560 }, { "epoch": 0.93, "learning_rate": 2.6482879196228714e-05, "loss": 2.4053, "step": 34561 }, { "epoch": 0.93, "learning_rate": 2.6462984495269516e-05, "loss": 2.2425, "step": 34562 }, { "epoch": 0.93, "learning_rate": 2.6443097169652652e-05, "loss": 2.5983, "step": 34563 }, { "epoch": 0.93, "learning_rate": 2.642321721952867e-05, "loss": 2.2264, "step": 34564 }, { "epoch": 0.93, "learning_rate": 2.6403344645048565e-05, "loss": 2.5264, "step": 34565 }, { "epoch": 0.93, "learning_rate": 2.6383479446362546e-05, "loss": 2.2064, "step": 34566 }, { "epoch": 0.93, "learning_rate": 2.636362162362116e-05, "loss": 2.4151, "step": 34567 }, { "epoch": 0.93, "learning_rate": 2.634377117697495e-05, "loss": 2.7503, "step": 34568 }, { "epoch": 0.93, "learning_rate": 2.6323928106574245e-05, "loss": 2.3055, "step": 34569 }, { "epoch": 0.93, "learning_rate": 2.6304092412569368e-05, "loss": 2.478, "step": 34570 }, { "epoch": 0.93, "learning_rate": 2.6284264095110643e-05, "loss": 3.0333, "step": 34571 }, { "epoch": 0.93, "learning_rate": 2.6264443154348285e-05, "loss": 2.0565, "step": 34572 }, { "epoch": 0.93, "learning_rate": 2.624462959043239e-05, "loss": 2.6691, "step": 34573 }, { "epoch": 0.93, "learning_rate": 2.6224823403512953e-05, "loss": 2.7722, "step": 34574 }, { "epoch": 0.93, "learning_rate": 2.62050245937403e-05, "loss": 2.8398, "step": 34575 }, { "epoch": 0.93, "learning_rate": 2.618523316126431e-05, "loss": 2.8835, "step": 34576 }, { "epoch": 0.93, "learning_rate": 2.616544910623486e-05, "loss": 2.3115, "step": 34577 }, { "epoch": 0.93, "learning_rate": 2.6145672428801837e-05, "loss": 2.0166, "step": 34578 }, { "epoch": 0.93, "learning_rate": 2.6125903129115226e-05, "loss": 2.6423, "step": 34579 }, { "epoch": 0.93, "learning_rate": 2.6106141207324463e-05, "loss": 2.4581, "step": 34580 }, { "epoch": 0.93, "learning_rate": 2.6086386663579543e-05, "loss": 2.3932, "step": 34581 }, { "epoch": 0.93, "learning_rate": 2.6066639498030008e-05, "loss": 2.7816, "step": 34582 }, { "epoch": 0.93, "learning_rate": 2.6046899710825523e-05, "loss": 2.559, "step": 34583 }, { "epoch": 0.93, "learning_rate": 2.602716730211563e-05, "loss": 2.5225, "step": 34584 }, { "epoch": 0.93, "learning_rate": 2.600744227204965e-05, "loss": 2.9225, "step": 34585 }, { "epoch": 0.93, "learning_rate": 2.5987724620777255e-05, "loss": 2.3916, "step": 34586 }, { "epoch": 0.93, "learning_rate": 2.5968014348447756e-05, "loss": 2.607, "step": 34587 }, { "epoch": 0.93, "learning_rate": 2.5948311455210373e-05, "loss": 2.133, "step": 34588 }, { "epoch": 0.93, "learning_rate": 2.592861594121454e-05, "loss": 2.2409, "step": 34589 }, { "epoch": 0.93, "learning_rate": 2.590892780660925e-05, "loss": 1.7448, "step": 34590 }, { "epoch": 0.93, "learning_rate": 2.5889247051543718e-05, "loss": 2.6496, "step": 34591 }, { "epoch": 0.93, "learning_rate": 2.586957367616727e-05, "loss": 2.7264, "step": 34592 }, { "epoch": 0.93, "learning_rate": 2.584990768062867e-05, "loss": 2.5422, "step": 34593 }, { "epoch": 0.93, "learning_rate": 2.5830249065077026e-05, "loss": 2.6165, "step": 34594 }, { "epoch": 0.93, "learning_rate": 2.581059782966122e-05, "loss": 2.4842, "step": 34595 }, { "epoch": 0.93, "learning_rate": 2.579095397453024e-05, "loss": 2.3943, "step": 34596 }, { "epoch": 0.93, "learning_rate": 2.577131749983286e-05, "loss": 2.2388, "step": 34597 }, { "epoch": 0.93, "learning_rate": 2.575168840571762e-05, "loss": 2.3429, "step": 34598 }, { "epoch": 0.93, "learning_rate": 2.5732066692333524e-05, "loss": 2.2726, "step": 34599 }, { "epoch": 0.93, "learning_rate": 2.5712452359829e-05, "loss": 2.5409, "step": 34600 }, { "epoch": 0.93, "learning_rate": 2.5692845408352817e-05, "loss": 2.6139, "step": 34601 }, { "epoch": 0.93, "learning_rate": 2.5673245838053527e-05, "loss": 2.5848, "step": 34602 }, { "epoch": 0.93, "learning_rate": 2.5653653649079456e-05, "loss": 2.687, "step": 34603 }, { "epoch": 0.93, "learning_rate": 2.563406884157915e-05, "loss": 2.3249, "step": 34604 }, { "epoch": 0.93, "learning_rate": 2.5614491415700937e-05, "loss": 2.3324, "step": 34605 }, { "epoch": 0.93, "learning_rate": 2.559492137159314e-05, "loss": 2.2944, "step": 34606 }, { "epoch": 0.93, "learning_rate": 2.5575358709403972e-05, "loss": 2.559, "step": 34607 }, { "epoch": 0.93, "learning_rate": 2.5555803429281656e-05, "loss": 2.6513, "step": 34608 }, { "epoch": 0.93, "learning_rate": 2.5536255531374398e-05, "loss": 2.4569, "step": 34609 }, { "epoch": 0.93, "learning_rate": 2.5516715015830196e-05, "loss": 2.5311, "step": 34610 }, { "epoch": 0.93, "learning_rate": 2.549718188279726e-05, "loss": 2.6861, "step": 34611 }, { "epoch": 0.93, "learning_rate": 2.5477656132423367e-05, "loss": 2.4552, "step": 34612 }, { "epoch": 0.93, "learning_rate": 2.5458137764856505e-05, "loss": 2.2227, "step": 34613 }, { "epoch": 0.93, "learning_rate": 2.5438626780244557e-05, "loss": 2.4252, "step": 34614 }, { "epoch": 0.93, "learning_rate": 2.5419123178735294e-05, "loss": 2.5567, "step": 34615 }, { "epoch": 0.93, "learning_rate": 2.5399626960476708e-05, "loss": 2.5728, "step": 34616 }, { "epoch": 0.93, "learning_rate": 2.5380138125616126e-05, "loss": 1.9668, "step": 34617 }, { "epoch": 0.93, "learning_rate": 2.536065667430143e-05, "loss": 2.7486, "step": 34618 }, { "epoch": 0.93, "learning_rate": 2.534118260668017e-05, "loss": 2.5172, "step": 34619 }, { "epoch": 0.93, "learning_rate": 2.5321715922899892e-05, "loss": 2.3294, "step": 34620 }, { "epoch": 0.93, "learning_rate": 2.530225662310781e-05, "loss": 2.7779, "step": 34621 }, { "epoch": 0.93, "learning_rate": 2.5282804707451813e-05, "loss": 2.7125, "step": 34622 }, { "epoch": 0.93, "learning_rate": 2.5263360176078888e-05, "loss": 2.5425, "step": 34623 }, { "epoch": 0.93, "learning_rate": 2.5243923029136694e-05, "loss": 2.3357, "step": 34624 }, { "epoch": 0.93, "learning_rate": 2.522449326677212e-05, "loss": 2.4571, "step": 34625 }, { "epoch": 0.93, "learning_rate": 2.5205070889132485e-05, "loss": 2.5292, "step": 34626 }, { "epoch": 0.93, "learning_rate": 2.51856558963649e-05, "loss": 2.616, "step": 34627 }, { "epoch": 0.93, "learning_rate": 2.5166248288616578e-05, "loss": 2.1447, "step": 34628 }, { "epoch": 0.93, "learning_rate": 2.514684806603451e-05, "loss": 2.8668, "step": 34629 }, { "epoch": 0.93, "learning_rate": 2.5127455228765696e-05, "loss": 2.6198, "step": 34630 }, { "epoch": 0.93, "learning_rate": 2.5108069776956898e-05, "loss": 2.5461, "step": 34631 }, { "epoch": 0.93, "learning_rate": 2.508869171075512e-05, "loss": 2.1581, "step": 34632 }, { "epoch": 0.93, "learning_rate": 2.5069321030307013e-05, "loss": 2.7532, "step": 34633 }, { "epoch": 0.93, "learning_rate": 2.5049957735759355e-05, "loss": 2.8202, "step": 34634 }, { "epoch": 0.93, "learning_rate": 2.5030601827259136e-05, "loss": 2.4515, "step": 34635 }, { "epoch": 0.93, "learning_rate": 2.5011253304952685e-05, "loss": 2.311, "step": 34636 }, { "epoch": 0.93, "learning_rate": 2.4991912168986664e-05, "loss": 2.7927, "step": 34637 }, { "epoch": 0.93, "learning_rate": 2.4972578419507618e-05, "loss": 2.8642, "step": 34638 }, { "epoch": 0.93, "learning_rate": 2.495325205666199e-05, "loss": 2.2211, "step": 34639 }, { "epoch": 0.93, "learning_rate": 2.4933933080596105e-05, "loss": 2.5903, "step": 34640 }, { "epoch": 0.93, "learning_rate": 2.4914621491456513e-05, "loss": 2.468, "step": 34641 }, { "epoch": 0.93, "learning_rate": 2.4895317289389428e-05, "loss": 2.756, "step": 34642 }, { "epoch": 0.93, "learning_rate": 2.4876020474541073e-05, "loss": 2.3107, "step": 34643 }, { "epoch": 0.93, "learning_rate": 2.4856731047057658e-05, "loss": 2.5256, "step": 34644 }, { "epoch": 0.93, "learning_rate": 2.483744900708529e-05, "loss": 2.2995, "step": 34645 }, { "epoch": 0.93, "learning_rate": 2.4818174354770183e-05, "loss": 1.8054, "step": 34646 }, { "epoch": 0.93, "learning_rate": 2.4798907090258004e-05, "loss": 2.1109, "step": 34647 }, { "epoch": 0.93, "learning_rate": 2.4779647213695077e-05, "loss": 2.223, "step": 34648 }, { "epoch": 0.93, "learning_rate": 2.4760394725227286e-05, "loss": 2.5295, "step": 34649 }, { "epoch": 0.93, "learning_rate": 2.474114962500018e-05, "loss": 2.7863, "step": 34650 }, { "epoch": 0.93, "learning_rate": 2.4721911913159977e-05, "loss": 2.4187, "step": 34651 }, { "epoch": 0.93, "learning_rate": 2.4702681589852116e-05, "loss": 2.6803, "step": 34652 }, { "epoch": 0.93, "learning_rate": 2.4683458655222367e-05, "loss": 2.3844, "step": 34653 }, { "epoch": 0.93, "learning_rate": 2.4664243109416285e-05, "loss": 2.7214, "step": 34654 }, { "epoch": 0.93, "learning_rate": 2.4645034952579637e-05, "loss": 2.949, "step": 34655 }, { "epoch": 0.93, "learning_rate": 2.4625834184857755e-05, "loss": 2.6022, "step": 34656 }, { "epoch": 0.93, "learning_rate": 2.4606640806396296e-05, "loss": 2.0809, "step": 34657 }, { "epoch": 0.93, "learning_rate": 2.458745481734048e-05, "loss": 2.6312, "step": 34658 }, { "epoch": 0.93, "learning_rate": 2.456827621783575e-05, "loss": 1.8716, "step": 34659 }, { "epoch": 0.93, "learning_rate": 2.4549105008027205e-05, "loss": 1.9883, "step": 34660 }, { "epoch": 0.93, "learning_rate": 2.452994118806029e-05, "loss": 2.2885, "step": 34661 }, { "epoch": 0.93, "learning_rate": 2.4510784758080328e-05, "loss": 2.4451, "step": 34662 }, { "epoch": 0.93, "learning_rate": 2.4491635718232098e-05, "loss": 2.635, "step": 34663 }, { "epoch": 0.93, "learning_rate": 2.4472494068660813e-05, "loss": 2.7147, "step": 34664 }, { "epoch": 0.93, "learning_rate": 2.4453359809511688e-05, "loss": 2.8979, "step": 34665 }, { "epoch": 0.93, "learning_rate": 2.443423294092939e-05, "loss": 2.4279, "step": 34666 }, { "epoch": 0.93, "learning_rate": 2.4415113463058802e-05, "loss": 2.5691, "step": 34667 }, { "epoch": 0.93, "learning_rate": 2.4396001376045028e-05, "loss": 2.4389, "step": 34668 }, { "epoch": 0.93, "learning_rate": 2.4376896680032734e-05, "loss": 2.4501, "step": 34669 }, { "epoch": 0.93, "learning_rate": 2.435779937516669e-05, "loss": 2.4839, "step": 34670 }, { "epoch": 0.93, "learning_rate": 2.4338709461591447e-05, "loss": 2.6008, "step": 34671 }, { "epoch": 0.93, "learning_rate": 2.4319626939451666e-05, "loss": 2.4618, "step": 34672 }, { "epoch": 0.93, "learning_rate": 2.4300551808892014e-05, "loss": 2.2684, "step": 34673 }, { "epoch": 0.93, "learning_rate": 2.4281484070056924e-05, "loss": 2.7768, "step": 34674 }, { "epoch": 0.93, "learning_rate": 2.4262423723090952e-05, "loss": 2.4095, "step": 34675 }, { "epoch": 0.93, "learning_rate": 2.4243370768138317e-05, "loss": 2.2878, "step": 34676 }, { "epoch": 0.93, "learning_rate": 2.4224325205343456e-05, "loss": 2.1869, "step": 34677 }, { "epoch": 0.93, "learning_rate": 2.4205287034850698e-05, "loss": 2.0237, "step": 34678 }, { "epoch": 0.93, "learning_rate": 2.418625625680426e-05, "loss": 2.1205, "step": 34679 }, { "epoch": 0.93, "learning_rate": 2.4167232871348145e-05, "loss": 2.5784, "step": 34680 }, { "epoch": 0.93, "learning_rate": 2.414821687862667e-05, "loss": 2.5016, "step": 34681 }, { "epoch": 0.93, "learning_rate": 2.4129208278783843e-05, "loss": 2.6182, "step": 34682 }, { "epoch": 0.93, "learning_rate": 2.4110207071963764e-05, "loss": 2.5089, "step": 34683 }, { "epoch": 0.93, "learning_rate": 2.409121325831021e-05, "loss": 2.7047, "step": 34684 }, { "epoch": 0.93, "learning_rate": 2.407222683796717e-05, "loss": 2.4097, "step": 34685 }, { "epoch": 0.93, "learning_rate": 2.4053247811078425e-05, "loss": 2.4337, "step": 34686 }, { "epoch": 0.93, "learning_rate": 2.403427617778775e-05, "loss": 2.7116, "step": 34687 }, { "epoch": 0.93, "learning_rate": 2.4015311938239026e-05, "loss": 2.2806, "step": 34688 }, { "epoch": 0.93, "learning_rate": 2.3996355092575805e-05, "loss": 2.9235, "step": 34689 }, { "epoch": 0.93, "learning_rate": 2.397740564094164e-05, "loss": 2.691, "step": 34690 }, { "epoch": 0.93, "learning_rate": 2.3958463583480082e-05, "loss": 2.1738, "step": 34691 }, { "epoch": 0.93, "learning_rate": 2.3939528920334907e-05, "loss": 2.4199, "step": 34692 }, { "epoch": 0.93, "learning_rate": 2.392060165164922e-05, "loss": 3.1622, "step": 34693 }, { "epoch": 0.93, "learning_rate": 2.3901681777566576e-05, "loss": 1.8597, "step": 34694 }, { "epoch": 0.93, "learning_rate": 2.388276929823019e-05, "loss": 2.6669, "step": 34695 }, { "epoch": 0.93, "learning_rate": 2.3863864213783505e-05, "loss": 2.2312, "step": 34696 }, { "epoch": 0.93, "learning_rate": 2.384496652436974e-05, "loss": 2.4503, "step": 34697 }, { "epoch": 0.93, "learning_rate": 2.382607623013189e-05, "loss": 2.1625, "step": 34698 }, { "epoch": 0.93, "learning_rate": 2.380719333121317e-05, "loss": 2.6029, "step": 34699 }, { "epoch": 0.93, "learning_rate": 2.37883178277567e-05, "loss": 2.8915, "step": 34700 }, { "epoch": 0.93, "learning_rate": 2.3769449719905357e-05, "loss": 2.4019, "step": 34701 }, { "epoch": 0.93, "learning_rate": 2.3750589007802138e-05, "loss": 2.2899, "step": 34702 }, { "epoch": 0.93, "learning_rate": 2.3731735691589927e-05, "loss": 2.5304, "step": 34703 }, { "epoch": 0.93, "learning_rate": 2.3712889771411507e-05, "loss": 2.8629, "step": 34704 }, { "epoch": 0.93, "learning_rate": 2.3694051247409752e-05, "loss": 2.5891, "step": 34705 }, { "epoch": 0.93, "learning_rate": 2.3675220119727224e-05, "loss": 2.2965, "step": 34706 }, { "epoch": 0.93, "learning_rate": 2.3656396388506696e-05, "loss": 2.4255, "step": 34707 }, { "epoch": 0.93, "learning_rate": 2.363758005389083e-05, "loss": 2.8346, "step": 34708 }, { "epoch": 0.93, "learning_rate": 2.3618771116022066e-05, "loss": 2.9537, "step": 34709 }, { "epoch": 0.93, "learning_rate": 2.3599969575042956e-05, "loss": 2.4498, "step": 34710 }, { "epoch": 0.93, "learning_rate": 2.3581175431095947e-05, "loss": 2.564, "step": 34711 }, { "epoch": 0.93, "learning_rate": 2.3562388684323255e-05, "loss": 2.645, "step": 34712 }, { "epoch": 0.93, "learning_rate": 2.3543609334867432e-05, "loss": 2.4743, "step": 34713 }, { "epoch": 0.93, "learning_rate": 2.352483738287059e-05, "loss": 2.9788, "step": 34714 }, { "epoch": 0.93, "learning_rate": 2.3506072828474945e-05, "loss": 2.3833, "step": 34715 }, { "epoch": 0.93, "learning_rate": 2.348731567182294e-05, "loss": 2.0053, "step": 34716 }, { "epoch": 0.93, "learning_rate": 2.346856591305624e-05, "loss": 2.0699, "step": 34717 }, { "epoch": 0.93, "learning_rate": 2.3449823552317174e-05, "loss": 2.0889, "step": 34718 }, { "epoch": 0.93, "learning_rate": 2.343108858974763e-05, "loss": 2.4948, "step": 34719 }, { "epoch": 0.93, "learning_rate": 2.3412361025489603e-05, "loss": 2.3754, "step": 34720 }, { "epoch": 0.93, "learning_rate": 2.3393640859684982e-05, "loss": 2.582, "step": 34721 }, { "epoch": 0.93, "learning_rate": 2.3374928092475434e-05, "loss": 2.4578, "step": 34722 }, { "epoch": 0.93, "learning_rate": 2.335622272400284e-05, "loss": 2.9053, "step": 34723 }, { "epoch": 0.93, "learning_rate": 2.333752475440898e-05, "loss": 2.2901, "step": 34724 }, { "epoch": 0.93, "learning_rate": 2.331883418383529e-05, "loss": 2.6358, "step": 34725 }, { "epoch": 0.93, "learning_rate": 2.3300151012423554e-05, "loss": 2.6536, "step": 34726 }, { "epoch": 0.93, "learning_rate": 2.328147524031521e-05, "loss": 2.6652, "step": 34727 }, { "epoch": 0.93, "learning_rate": 2.326280686765181e-05, "loss": 2.6829, "step": 34728 }, { "epoch": 0.93, "learning_rate": 2.3244145894574907e-05, "loss": 2.6535, "step": 34729 }, { "epoch": 0.93, "learning_rate": 2.3225492321225615e-05, "loss": 2.3705, "step": 34730 }, { "epoch": 0.93, "learning_rate": 2.3206846147745374e-05, "loss": 1.951, "step": 34731 }, { "epoch": 0.93, "learning_rate": 2.3188207374275293e-05, "loss": 2.1722, "step": 34732 }, { "epoch": 0.93, "learning_rate": 2.3169576000956927e-05, "loss": 2.225, "step": 34733 }, { "epoch": 0.93, "learning_rate": 2.3150952027931048e-05, "loss": 2.878, "step": 34734 }, { "epoch": 0.93, "learning_rate": 2.3132335455339103e-05, "loss": 2.3791, "step": 34735 }, { "epoch": 0.93, "learning_rate": 2.3113726283321757e-05, "loss": 2.4401, "step": 34736 }, { "epoch": 0.93, "learning_rate": 2.3095124512020338e-05, "loss": 2.43, "step": 34737 }, { "epoch": 0.93, "learning_rate": 2.3076530141575513e-05, "loss": 2.3505, "step": 34738 }, { "epoch": 0.93, "learning_rate": 2.305794317212817e-05, "loss": 1.8867, "step": 34739 }, { "epoch": 0.93, "learning_rate": 2.3039363603819197e-05, "loss": 2.7269, "step": 34740 }, { "epoch": 0.93, "learning_rate": 2.302079143678937e-05, "loss": 2.6246, "step": 34741 }, { "epoch": 0.93, "learning_rate": 2.300222667117935e-05, "loss": 2.5726, "step": 34742 }, { "epoch": 0.93, "learning_rate": 2.298366930712992e-05, "loss": 2.8231, "step": 34743 }, { "epoch": 0.93, "learning_rate": 2.2965119344781404e-05, "loss": 2.5782, "step": 34744 }, { "epoch": 0.93, "learning_rate": 2.2946576784274476e-05, "loss": 2.0954, "step": 34745 }, { "epoch": 0.93, "learning_rate": 2.2928041625749574e-05, "loss": 2.8794, "step": 34746 }, { "epoch": 0.93, "learning_rate": 2.2909513869347255e-05, "loss": 2.915, "step": 34747 }, { "epoch": 0.93, "learning_rate": 2.2890993515207735e-05, "loss": 2.3114, "step": 34748 }, { "epoch": 0.93, "learning_rate": 2.2872480563471355e-05, "loss": 2.4927, "step": 34749 }, { "epoch": 0.93, "learning_rate": 2.2853975014278326e-05, "loss": 2.5431, "step": 34750 }, { "epoch": 0.93, "learning_rate": 2.283547686776899e-05, "loss": 2.2693, "step": 34751 }, { "epoch": 0.93, "learning_rate": 2.281698612408323e-05, "loss": 2.3463, "step": 34752 }, { "epoch": 0.93, "learning_rate": 2.2798502783361373e-05, "loss": 2.3644, "step": 34753 }, { "epoch": 0.93, "learning_rate": 2.2780026845743207e-05, "loss": 2.8312, "step": 34754 }, { "epoch": 0.93, "learning_rate": 2.2761558311368946e-05, "loss": 2.5943, "step": 34755 }, { "epoch": 0.93, "learning_rate": 2.274309718037859e-05, "loss": 2.6816, "step": 34756 }, { "epoch": 0.93, "learning_rate": 2.2724643452911587e-05, "loss": 2.4219, "step": 34757 }, { "epoch": 0.93, "learning_rate": 2.2706197129108043e-05, "loss": 2.273, "step": 34758 }, { "epoch": 0.93, "learning_rate": 2.2687758209107513e-05, "loss": 2.1458, "step": 34759 }, { "epoch": 0.93, "learning_rate": 2.2669326693049887e-05, "loss": 2.6483, "step": 34760 }, { "epoch": 0.93, "learning_rate": 2.2650902581074718e-05, "loss": 2.515, "step": 34761 }, { "epoch": 0.93, "learning_rate": 2.2632485873321675e-05, "loss": 2.7094, "step": 34762 }, { "epoch": 0.93, "learning_rate": 2.2614076569929976e-05, "loss": 2.662, "step": 34763 }, { "epoch": 0.93, "learning_rate": 2.259567467103951e-05, "loss": 2.3484, "step": 34764 }, { "epoch": 0.93, "learning_rate": 2.2577280176789393e-05, "loss": 2.5829, "step": 34765 }, { "epoch": 0.93, "learning_rate": 2.2558893087318844e-05, "loss": 2.6251, "step": 34766 }, { "epoch": 0.93, "learning_rate": 2.2540513402767637e-05, "loss": 2.4561, "step": 34767 }, { "epoch": 0.93, "learning_rate": 2.2522141123274666e-05, "loss": 2.2035, "step": 34768 }, { "epoch": 0.93, "learning_rate": 2.2503776248979145e-05, "loss": 2.6266, "step": 34769 }, { "epoch": 0.93, "learning_rate": 2.2485418780020416e-05, "loss": 2.4611, "step": 34770 }, { "epoch": 0.93, "learning_rate": 2.2467068716537252e-05, "loss": 2.7735, "step": 34771 }, { "epoch": 0.93, "learning_rate": 2.2448726058668767e-05, "loss": 2.2641, "step": 34772 }, { "epoch": 0.93, "learning_rate": 2.2430390806553958e-05, "loss": 2.1887, "step": 34773 }, { "epoch": 0.93, "learning_rate": 2.2412062960331825e-05, "loss": 2.909, "step": 34774 }, { "epoch": 0.93, "learning_rate": 2.2393742520141148e-05, "loss": 2.4256, "step": 34775 }, { "epoch": 0.93, "learning_rate": 2.23754294861207e-05, "loss": 1.9142, "step": 34776 }, { "epoch": 0.93, "learning_rate": 2.2357123858409155e-05, "loss": 2.834, "step": 34777 }, { "epoch": 0.93, "learning_rate": 2.2338825637145287e-05, "loss": 2.3635, "step": 34778 }, { "epoch": 0.93, "learning_rate": 2.2320534822467542e-05, "loss": 2.9073, "step": 34779 }, { "epoch": 0.93, "learning_rate": 2.2302251414514916e-05, "loss": 2.7148, "step": 34780 }, { "epoch": 0.93, "learning_rate": 2.2283975413425418e-05, "loss": 1.9134, "step": 34781 }, { "epoch": 0.93, "learning_rate": 2.2265706819337815e-05, "loss": 2.6563, "step": 34782 }, { "epoch": 0.93, "learning_rate": 2.224744563239045e-05, "loss": 2.454, "step": 34783 }, { "epoch": 0.93, "learning_rate": 2.2229191852721542e-05, "loss": 2.6897, "step": 34784 }, { "epoch": 0.93, "learning_rate": 2.2210945480469425e-05, "loss": 2.3059, "step": 34785 }, { "epoch": 0.93, "learning_rate": 2.219270651577243e-05, "loss": 2.7281, "step": 34786 }, { "epoch": 0.93, "learning_rate": 2.2174474958768677e-05, "loss": 2.3722, "step": 34787 }, { "epoch": 0.93, "learning_rate": 2.2156250809596378e-05, "loss": 2.262, "step": 34788 }, { "epoch": 0.93, "learning_rate": 2.213803406839343e-05, "loss": 2.798, "step": 34789 }, { "epoch": 0.93, "learning_rate": 2.2119824735297833e-05, "loss": 2.5128, "step": 34790 }, { "epoch": 0.93, "learning_rate": 2.2101622810447807e-05, "loss": 2.788, "step": 34791 }, { "epoch": 0.93, "learning_rate": 2.2083428293980802e-05, "loss": 2.3729, "step": 34792 }, { "epoch": 0.94, "learning_rate": 2.2065241186034923e-05, "loss": 2.4415, "step": 34793 }, { "epoch": 0.94, "learning_rate": 2.2047061486748175e-05, "loss": 2.3151, "step": 34794 }, { "epoch": 0.94, "learning_rate": 2.2028889196257895e-05, "loss": 2.5209, "step": 34795 }, { "epoch": 0.94, "learning_rate": 2.201072431470186e-05, "loss": 2.5792, "step": 34796 }, { "epoch": 0.94, "learning_rate": 2.1992566842217955e-05, "loss": 2.2257, "step": 34797 }, { "epoch": 0.94, "learning_rate": 2.1974416778943297e-05, "loss": 2.4461, "step": 34798 }, { "epoch": 0.94, "learning_rate": 2.1956274125015664e-05, "loss": 2.7259, "step": 34799 }, { "epoch": 0.94, "learning_rate": 2.193813888057239e-05, "loss": 2.2598, "step": 34800 }, { "epoch": 0.94, "learning_rate": 2.192001104575092e-05, "loss": 2.2161, "step": 34801 }, { "epoch": 0.94, "learning_rate": 2.1901890620688702e-05, "loss": 2.3397, "step": 34802 }, { "epoch": 0.94, "learning_rate": 2.1883777605522847e-05, "loss": 2.6138, "step": 34803 }, { "epoch": 0.94, "learning_rate": 2.186567200039058e-05, "loss": 2.6117, "step": 34804 }, { "epoch": 0.94, "learning_rate": 2.1847573805429122e-05, "loss": 2.3994, "step": 34805 }, { "epoch": 0.94, "learning_rate": 2.1829483020775477e-05, "loss": 2.3352, "step": 34806 }, { "epoch": 0.94, "learning_rate": 2.1811399646566977e-05, "loss": 2.5582, "step": 34807 }, { "epoch": 0.94, "learning_rate": 2.179332368294029e-05, "loss": 2.2997, "step": 34808 }, { "epoch": 0.94, "learning_rate": 2.1775255130032536e-05, "loss": 2.2994, "step": 34809 }, { "epoch": 0.94, "learning_rate": 2.1757193987980595e-05, "loss": 2.5918, "step": 34810 }, { "epoch": 0.94, "learning_rate": 2.1739140256921254e-05, "loss": 2.4619, "step": 34811 }, { "epoch": 0.94, "learning_rate": 2.1721093936991175e-05, "loss": 2.2951, "step": 34812 }, { "epoch": 0.94, "learning_rate": 2.1703055028327258e-05, "loss": 2.7534, "step": 34813 }, { "epoch": 0.94, "learning_rate": 2.168502353106616e-05, "loss": 2.6498, "step": 34814 }, { "epoch": 0.94, "learning_rate": 2.166699944534445e-05, "loss": 2.6164, "step": 34815 }, { "epoch": 0.94, "learning_rate": 2.1648982771298454e-05, "loss": 2.1988, "step": 34816 }, { "epoch": 0.94, "learning_rate": 2.1630973509064954e-05, "loss": 2.7561, "step": 34817 }, { "epoch": 0.94, "learning_rate": 2.161297165878029e-05, "loss": 2.7875, "step": 34818 }, { "epoch": 0.94, "learning_rate": 2.1594977220580793e-05, "loss": 2.5814, "step": 34819 }, { "epoch": 0.94, "learning_rate": 2.1576990194602797e-05, "loss": 2.2956, "step": 34820 }, { "epoch": 0.94, "learning_rate": 2.1559010580982753e-05, "loss": 2.3461, "step": 34821 }, { "epoch": 0.94, "learning_rate": 2.1541038379856658e-05, "loss": 1.8905, "step": 34822 }, { "epoch": 0.94, "learning_rate": 2.152307359136074e-05, "loss": 2.8026, "step": 34823 }, { "epoch": 0.94, "learning_rate": 2.1505116215631006e-05, "loss": 2.5734, "step": 34824 }, { "epoch": 0.94, "learning_rate": 2.148716625280356e-05, "loss": 2.6383, "step": 34825 }, { "epoch": 0.94, "learning_rate": 2.1469223703014406e-05, "loss": 2.6791, "step": 34826 }, { "epoch": 0.94, "learning_rate": 2.145128856639955e-05, "loss": 3.0665, "step": 34827 }, { "epoch": 0.94, "learning_rate": 2.1433360843094662e-05, "loss": 2.5581, "step": 34828 }, { "epoch": 0.94, "learning_rate": 2.1415440533235854e-05, "loss": 2.7062, "step": 34829 }, { "epoch": 0.94, "learning_rate": 2.1397527636958568e-05, "loss": 2.1696, "step": 34830 }, { "epoch": 0.94, "learning_rate": 2.1379622154398705e-05, "loss": 2.2793, "step": 34831 }, { "epoch": 0.94, "learning_rate": 2.1361724085691814e-05, "loss": 2.6585, "step": 34832 }, { "epoch": 0.94, "learning_rate": 2.134383343097357e-05, "loss": 2.2426, "step": 34833 }, { "epoch": 0.94, "learning_rate": 2.1325950190379527e-05, "loss": 2.51, "step": 34834 }, { "epoch": 0.94, "learning_rate": 2.1308074364045137e-05, "loss": 2.1365, "step": 34835 }, { "epoch": 0.94, "learning_rate": 2.1290205952105733e-05, "loss": 2.9299, "step": 34836 }, { "epoch": 0.94, "learning_rate": 2.1272344954696764e-05, "loss": 2.3995, "step": 34837 }, { "epoch": 0.94, "learning_rate": 2.1254491371953567e-05, "loss": 2.5226, "step": 34838 }, { "epoch": 0.94, "learning_rate": 2.123664520401114e-05, "loss": 1.9512, "step": 34839 }, { "epoch": 0.94, "learning_rate": 2.1218806451005157e-05, "loss": 2.5229, "step": 34840 }, { "epoch": 0.94, "learning_rate": 2.12009751130704e-05, "loss": 2.6204, "step": 34841 }, { "epoch": 0.94, "learning_rate": 2.1183151190342198e-05, "loss": 2.5657, "step": 34842 }, { "epoch": 0.94, "learning_rate": 2.116533468295534e-05, "loss": 2.4648, "step": 34843 }, { "epoch": 0.94, "learning_rate": 2.1147525591044824e-05, "loss": 2.4691, "step": 34844 }, { "epoch": 0.94, "learning_rate": 2.112972391474577e-05, "loss": 2.6072, "step": 34845 }, { "epoch": 0.94, "learning_rate": 2.1111929654192842e-05, "loss": 2.5031, "step": 34846 }, { "epoch": 0.94, "learning_rate": 2.1094142809520935e-05, "loss": 2.2659, "step": 34847 }, { "epoch": 0.94, "learning_rate": 2.107636338086494e-05, "loss": 2.6304, "step": 34848 }, { "epoch": 0.94, "learning_rate": 2.1058591368359305e-05, "loss": 1.8751, "step": 34849 }, { "epoch": 0.94, "learning_rate": 2.104082677213881e-05, "loss": 2.4676, "step": 34850 }, { "epoch": 0.94, "learning_rate": 2.1023069592337906e-05, "loss": 2.4115, "step": 34851 }, { "epoch": 0.94, "learning_rate": 2.100531982909104e-05, "loss": 2.2549, "step": 34852 }, { "epoch": 0.94, "learning_rate": 2.0987577482533104e-05, "loss": 2.8517, "step": 34853 }, { "epoch": 0.94, "learning_rate": 2.0969842552798213e-05, "loss": 2.5341, "step": 34854 }, { "epoch": 0.94, "learning_rate": 2.0952115040020704e-05, "loss": 2.5396, "step": 34855 }, { "epoch": 0.94, "learning_rate": 2.093439494433502e-05, "loss": 2.889, "step": 34856 }, { "epoch": 0.94, "learning_rate": 2.0916682265875175e-05, "loss": 2.7162, "step": 34857 }, { "epoch": 0.94, "learning_rate": 2.089897700477561e-05, "loss": 2.6033, "step": 34858 }, { "epoch": 0.94, "learning_rate": 2.088127916117033e-05, "loss": 2.6877, "step": 34859 }, { "epoch": 0.94, "learning_rate": 2.086358873519334e-05, "loss": 2.7174, "step": 34860 }, { "epoch": 0.94, "learning_rate": 2.0845905726978865e-05, "loss": 2.4284, "step": 34861 }, { "epoch": 0.94, "learning_rate": 2.0828230136660686e-05, "loss": 2.184, "step": 34862 }, { "epoch": 0.94, "learning_rate": 2.0810561964372808e-05, "loss": 2.3471, "step": 34863 }, { "epoch": 0.94, "learning_rate": 2.0792901210249127e-05, "loss": 2.3692, "step": 34864 }, { "epoch": 0.94, "learning_rate": 2.0775247874423197e-05, "loss": 2.5915, "step": 34865 }, { "epoch": 0.94, "learning_rate": 2.0757601957029027e-05, "loss": 2.5969, "step": 34866 }, { "epoch": 0.94, "learning_rate": 2.0739963458200172e-05, "loss": 2.5443, "step": 34867 }, { "epoch": 0.94, "learning_rate": 2.0722332378070195e-05, "loss": 2.7959, "step": 34868 }, { "epoch": 0.94, "learning_rate": 2.070470871677288e-05, "loss": 2.4284, "step": 34869 }, { "epoch": 0.94, "learning_rate": 2.068709247444156e-05, "loss": 2.4698, "step": 34870 }, { "epoch": 0.94, "learning_rate": 2.0669483651209687e-05, "loss": 2.1217, "step": 34871 }, { "epoch": 0.94, "learning_rate": 2.0651882247210816e-05, "loss": 2.2232, "step": 34872 }, { "epoch": 0.94, "learning_rate": 2.0634288262578073e-05, "loss": 2.5652, "step": 34873 }, { "epoch": 0.94, "learning_rate": 2.0616701697445006e-05, "loss": 2.6439, "step": 34874 }, { "epoch": 0.94, "learning_rate": 2.0599122551944626e-05, "loss": 2.7846, "step": 34875 }, { "epoch": 0.94, "learning_rate": 2.058155082621027e-05, "loss": 2.8065, "step": 34876 }, { "epoch": 0.94, "learning_rate": 2.0563986520374833e-05, "loss": 2.6978, "step": 34877 }, { "epoch": 0.94, "learning_rate": 2.054642963457165e-05, "loss": 2.2334, "step": 34878 }, { "epoch": 0.94, "learning_rate": 2.0528880168933506e-05, "loss": 2.9687, "step": 34879 }, { "epoch": 0.94, "learning_rate": 2.0511338123593625e-05, "loss": 2.6944, "step": 34880 }, { "epoch": 0.94, "learning_rate": 2.049380349868457e-05, "loss": 2.5706, "step": 34881 }, { "epoch": 0.94, "learning_rate": 2.0476276294339457e-05, "loss": 2.4784, "step": 34882 }, { "epoch": 0.94, "learning_rate": 2.0458756510690957e-05, "loss": 2.5576, "step": 34883 }, { "epoch": 0.94, "learning_rate": 2.044124414787163e-05, "loss": 2.3633, "step": 34884 }, { "epoch": 0.94, "learning_rate": 2.042373920601437e-05, "loss": 2.4753, "step": 34885 }, { "epoch": 0.94, "learning_rate": 2.0406241685251846e-05, "loss": 2.5569, "step": 34886 }, { "epoch": 0.94, "learning_rate": 2.03887515857164e-05, "loss": 2.4663, "step": 34887 }, { "epoch": 0.94, "learning_rate": 2.0371268907540707e-05, "loss": 2.6479, "step": 34888 }, { "epoch": 0.94, "learning_rate": 2.035379365085699e-05, "loss": 2.6293, "step": 34889 }, { "epoch": 0.94, "learning_rate": 2.033632581579792e-05, "loss": 2.2253, "step": 34890 }, { "epoch": 0.94, "learning_rate": 2.0318865402495613e-05, "loss": 2.2034, "step": 34891 }, { "epoch": 0.94, "learning_rate": 2.030141241108252e-05, "loss": 2.3414, "step": 34892 }, { "epoch": 0.94, "learning_rate": 2.028396684169076e-05, "loss": 2.3008, "step": 34893 }, { "epoch": 0.94, "learning_rate": 2.0266528694452447e-05, "loss": 2.2545, "step": 34894 }, { "epoch": 0.94, "learning_rate": 2.0249097969499807e-05, "loss": 2.3428, "step": 34895 }, { "epoch": 0.94, "learning_rate": 2.023167466696485e-05, "loss": 2.1814, "step": 34896 }, { "epoch": 0.94, "learning_rate": 2.0214258786979577e-05, "loss": 1.8754, "step": 34897 }, { "epoch": 0.94, "learning_rate": 2.0196850329675665e-05, "loss": 2.4787, "step": 34898 }, { "epoch": 0.94, "learning_rate": 2.017944929518556e-05, "loss": 2.6972, "step": 34899 }, { "epoch": 0.94, "learning_rate": 2.01620556836406e-05, "loss": 2.3245, "step": 34900 }, { "epoch": 0.94, "learning_rate": 2.014466949517291e-05, "loss": 2.4678, "step": 34901 }, { "epoch": 0.94, "learning_rate": 2.0127290729913816e-05, "loss": 2.5372, "step": 34902 }, { "epoch": 0.94, "learning_rate": 2.0109919387995223e-05, "loss": 2.4289, "step": 34903 }, { "epoch": 0.94, "learning_rate": 2.009255546954869e-05, "loss": 2.4484, "step": 34904 }, { "epoch": 0.94, "learning_rate": 2.0075198974705778e-05, "loss": 2.307, "step": 34905 }, { "epoch": 0.94, "learning_rate": 2.0057849903598045e-05, "loss": 2.5297, "step": 34906 }, { "epoch": 0.94, "learning_rate": 2.0040508256356836e-05, "loss": 2.7337, "step": 34907 }, { "epoch": 0.94, "learning_rate": 2.002317403311349e-05, "loss": 2.5048, "step": 34908 }, { "epoch": 0.94, "learning_rate": 2.0005847233999343e-05, "loss": 2.1979, "step": 34909 }, { "epoch": 0.94, "learning_rate": 1.9988527859145733e-05, "loss": 2.5594, "step": 34910 }, { "epoch": 0.94, "learning_rate": 1.9971215908683783e-05, "loss": 2.2856, "step": 34911 }, { "epoch": 0.94, "learning_rate": 1.9953911382744714e-05, "loss": 2.4839, "step": 34912 }, { "epoch": 0.94, "learning_rate": 1.9936614281459653e-05, "loss": 2.6805, "step": 34913 }, { "epoch": 0.94, "learning_rate": 1.991932460495949e-05, "loss": 2.6578, "step": 34914 }, { "epoch": 0.94, "learning_rate": 1.990204235337545e-05, "loss": 2.4332, "step": 34915 }, { "epoch": 0.94, "learning_rate": 1.9884767526838098e-05, "loss": 2.2411, "step": 34916 }, { "epoch": 0.94, "learning_rate": 1.9867500125478667e-05, "loss": 2.391, "step": 34917 }, { "epoch": 0.94, "learning_rate": 1.9850240149427713e-05, "loss": 2.3441, "step": 34918 }, { "epoch": 0.94, "learning_rate": 1.9832987598816243e-05, "loss": 2.5485, "step": 34919 }, { "epoch": 0.94, "learning_rate": 1.9815742473774823e-05, "loss": 2.3393, "step": 34920 }, { "epoch": 0.94, "learning_rate": 1.9798504774434012e-05, "loss": 2.5052, "step": 34921 }, { "epoch": 0.94, "learning_rate": 1.9781274500924486e-05, "loss": 2.4315, "step": 34922 }, { "epoch": 0.94, "learning_rate": 1.9764051653376803e-05, "loss": 2.7729, "step": 34923 }, { "epoch": 0.94, "learning_rate": 1.9746836231921304e-05, "loss": 2.6169, "step": 34924 }, { "epoch": 0.94, "learning_rate": 1.9729628236688668e-05, "loss": 2.4174, "step": 34925 }, { "epoch": 0.94, "learning_rate": 1.971242766780912e-05, "loss": 2.2552, "step": 34926 }, { "epoch": 0.94, "learning_rate": 1.9695234525412888e-05, "loss": 2.3909, "step": 34927 }, { "epoch": 0.94, "learning_rate": 1.9678048809630312e-05, "loss": 2.5994, "step": 34928 }, { "epoch": 0.94, "learning_rate": 1.966087052059162e-05, "loss": 2.0276, "step": 34929 }, { "epoch": 0.94, "learning_rate": 1.9643699658426828e-05, "loss": 2.0426, "step": 34930 }, { "epoch": 0.94, "learning_rate": 1.9626536223266156e-05, "loss": 2.4484, "step": 34931 }, { "epoch": 0.94, "learning_rate": 1.9609380215239503e-05, "loss": 2.4095, "step": 34932 }, { "epoch": 0.94, "learning_rate": 1.9592231634476877e-05, "loss": 2.3791, "step": 34933 }, { "epoch": 0.94, "learning_rate": 1.9575090481108393e-05, "loss": 2.5417, "step": 34934 }, { "epoch": 0.94, "learning_rate": 1.9557956755263617e-05, "loss": 2.4193, "step": 34935 }, { "epoch": 0.94, "learning_rate": 1.9540830457072554e-05, "loss": 2.0647, "step": 34936 }, { "epoch": 0.94, "learning_rate": 1.952371158666477e-05, "loss": 2.5137, "step": 34937 }, { "epoch": 0.94, "learning_rate": 1.950660014417005e-05, "loss": 2.4935, "step": 34938 }, { "epoch": 0.94, "learning_rate": 1.9489496129718176e-05, "loss": 2.3232, "step": 34939 }, { "epoch": 0.94, "learning_rate": 1.947239954343849e-05, "loss": 2.1601, "step": 34940 }, { "epoch": 0.94, "learning_rate": 1.9455310385460558e-05, "loss": 2.1185, "step": 34941 }, { "epoch": 0.94, "learning_rate": 1.9438228655913935e-05, "loss": 2.0987, "step": 34942 }, { "epoch": 0.94, "learning_rate": 1.942115435492797e-05, "loss": 2.4058, "step": 34943 }, { "epoch": 0.94, "learning_rate": 1.9404087482632117e-05, "loss": 2.3071, "step": 34944 }, { "epoch": 0.94, "learning_rate": 1.9387028039155486e-05, "loss": 2.5056, "step": 34945 }, { "epoch": 0.94, "learning_rate": 1.936997602462731e-05, "loss": 2.7655, "step": 34946 }, { "epoch": 0.94, "learning_rate": 1.9352931439177158e-05, "loss": 2.5322, "step": 34947 }, { "epoch": 0.94, "learning_rate": 1.9335894282933696e-05, "loss": 2.4868, "step": 34948 }, { "epoch": 0.94, "learning_rate": 1.9318864556026163e-05, "loss": 2.6459, "step": 34949 }, { "epoch": 0.94, "learning_rate": 1.9301842258583557e-05, "loss": 2.5721, "step": 34950 }, { "epoch": 0.94, "learning_rate": 1.9284827390734895e-05, "loss": 2.418, "step": 34951 }, { "epoch": 0.94, "learning_rate": 1.9267819952609066e-05, "loss": 2.5717, "step": 34952 }, { "epoch": 0.94, "learning_rate": 1.9250819944334973e-05, "loss": 2.2967, "step": 34953 }, { "epoch": 0.94, "learning_rate": 1.9233827366041178e-05, "loss": 2.6323, "step": 34954 }, { "epoch": 0.94, "learning_rate": 1.9216842217856688e-05, "loss": 2.5284, "step": 34955 }, { "epoch": 0.94, "learning_rate": 1.919986449991007e-05, "loss": 2.3629, "step": 34956 }, { "epoch": 0.94, "learning_rate": 1.918289421232977e-05, "loss": 1.9581, "step": 34957 }, { "epoch": 0.94, "learning_rate": 1.9165931355244582e-05, "loss": 2.6058, "step": 34958 }, { "epoch": 0.94, "learning_rate": 1.9148975928782954e-05, "loss": 2.3039, "step": 34959 }, { "epoch": 0.94, "learning_rate": 1.9132027933073337e-05, "loss": 2.5378, "step": 34960 }, { "epoch": 0.94, "learning_rate": 1.911508736824419e-05, "loss": 2.5573, "step": 34961 }, { "epoch": 0.94, "learning_rate": 1.9098154234423626e-05, "loss": 2.7328, "step": 34962 }, { "epoch": 0.94, "learning_rate": 1.90812285317401e-05, "loss": 2.7725, "step": 34963 }, { "epoch": 0.94, "learning_rate": 1.9064310260321848e-05, "loss": 2.2619, "step": 34964 }, { "epoch": 0.94, "learning_rate": 1.9047399420296983e-05, "loss": 2.623, "step": 34965 }, { "epoch": 0.94, "learning_rate": 1.903049601179374e-05, "loss": 2.4581, "step": 34966 }, { "epoch": 0.94, "learning_rate": 1.9013600034940015e-05, "loss": 2.5312, "step": 34967 }, { "epoch": 0.94, "learning_rate": 1.8996711489863816e-05, "loss": 2.3407, "step": 34968 }, { "epoch": 0.94, "learning_rate": 1.8979830376693264e-05, "loss": 2.3516, "step": 34969 }, { "epoch": 0.94, "learning_rate": 1.8962956695556034e-05, "loss": 2.1004, "step": 34970 }, { "epoch": 0.94, "learning_rate": 1.8946090446580135e-05, "loss": 2.8328, "step": 34971 }, { "epoch": 0.94, "learning_rate": 1.892923162989313e-05, "loss": 2.8406, "step": 34972 }, { "epoch": 0.94, "learning_rate": 1.8912380245622916e-05, "loss": 2.6404, "step": 34973 }, { "epoch": 0.94, "learning_rate": 1.8895536293897174e-05, "loss": 2.4133, "step": 34974 }, { "epoch": 0.94, "learning_rate": 1.8878699774843355e-05, "loss": 2.4376, "step": 34975 }, { "epoch": 0.94, "learning_rate": 1.8861870688589134e-05, "loss": 2.6581, "step": 34976 }, { "epoch": 0.94, "learning_rate": 1.8845049035261962e-05, "loss": 2.5441, "step": 34977 }, { "epoch": 0.94, "learning_rate": 1.8828234814989298e-05, "loss": 2.2398, "step": 34978 }, { "epoch": 0.94, "learning_rate": 1.881142802789848e-05, "loss": 2.8853, "step": 34979 }, { "epoch": 0.94, "learning_rate": 1.8794628674116966e-05, "loss": 2.4077, "step": 34980 }, { "epoch": 0.94, "learning_rate": 1.8777836753771872e-05, "loss": 2.6864, "step": 34981 }, { "epoch": 0.94, "learning_rate": 1.876105226699043e-05, "loss": 2.6579, "step": 34982 }, { "epoch": 0.94, "learning_rate": 1.8744275213899876e-05, "loss": 2.5378, "step": 34983 }, { "epoch": 0.94, "learning_rate": 1.8727505594627104e-05, "loss": 2.442, "step": 34984 }, { "epoch": 0.94, "learning_rate": 1.8710743409299457e-05, "loss": 2.1902, "step": 34985 }, { "epoch": 0.94, "learning_rate": 1.869398865804384e-05, "loss": 2.5551, "step": 34986 }, { "epoch": 0.94, "learning_rate": 1.8677241340986916e-05, "loss": 2.392, "step": 34987 }, { "epoch": 0.94, "learning_rate": 1.866050145825604e-05, "loss": 2.8565, "step": 34988 }, { "epoch": 0.94, "learning_rate": 1.864376900997755e-05, "loss": 2.4434, "step": 34989 }, { "epoch": 0.94, "learning_rate": 1.862704399627846e-05, "loss": 2.3271, "step": 34990 }, { "epoch": 0.94, "learning_rate": 1.861032641728544e-05, "loss": 2.808, "step": 34991 }, { "epoch": 0.94, "learning_rate": 1.8593616273125057e-05, "loss": 2.4869, "step": 34992 }, { "epoch": 0.94, "learning_rate": 1.8576913563924213e-05, "loss": 2.203, "step": 34993 }, { "epoch": 0.94, "learning_rate": 1.8560218289809028e-05, "loss": 2.3416, "step": 34994 }, { "epoch": 0.94, "learning_rate": 1.8543530450906177e-05, "loss": 2.5048, "step": 34995 }, { "epoch": 0.94, "learning_rate": 1.8526850047342115e-05, "loss": 2.7487, "step": 34996 }, { "epoch": 0.94, "learning_rate": 1.8510177079243075e-05, "loss": 2.2973, "step": 34997 }, { "epoch": 0.94, "learning_rate": 1.849351154673551e-05, "loss": 2.4321, "step": 34998 }, { "epoch": 0.94, "learning_rate": 1.847685344994565e-05, "loss": 2.5243, "step": 34999 }, { "epoch": 0.94, "learning_rate": 1.8460202788999625e-05, "loss": 2.3269, "step": 35000 }, { "epoch": 0.94, "learning_rate": 1.844355956402366e-05, "loss": 1.7869, "step": 35001 }, { "epoch": 0.94, "learning_rate": 1.8426923775143876e-05, "loss": 2.3427, "step": 35002 }, { "epoch": 0.94, "learning_rate": 1.8410295422486067e-05, "loss": 2.3879, "step": 35003 }, { "epoch": 0.94, "learning_rate": 1.8393674506176463e-05, "loss": 2.646, "step": 35004 }, { "epoch": 0.94, "learning_rate": 1.8377061026340848e-05, "loss": 2.7438, "step": 35005 }, { "epoch": 0.94, "learning_rate": 1.8360454983105123e-05, "loss": 2.4074, "step": 35006 }, { "epoch": 0.94, "learning_rate": 1.834385637659519e-05, "loss": 2.6877, "step": 35007 }, { "epoch": 0.94, "learning_rate": 1.8327265206936506e-05, "loss": 2.336, "step": 35008 }, { "epoch": 0.94, "learning_rate": 1.8310681474255186e-05, "loss": 1.9583, "step": 35009 }, { "epoch": 0.94, "learning_rate": 1.8294105178676357e-05, "loss": 2.2864, "step": 35010 }, { "epoch": 0.94, "learning_rate": 1.827753632032603e-05, "loss": 2.4152, "step": 35011 }, { "epoch": 0.94, "learning_rate": 1.826097489932965e-05, "loss": 2.4219, "step": 35012 }, { "epoch": 0.94, "learning_rate": 1.8244420915812465e-05, "loss": 2.2129, "step": 35013 }, { "epoch": 0.94, "learning_rate": 1.8227874369900143e-05, "loss": 2.572, "step": 35014 }, { "epoch": 0.94, "learning_rate": 1.821133526171792e-05, "loss": 2.4278, "step": 35015 }, { "epoch": 0.94, "learning_rate": 1.819480359139103e-05, "loss": 2.2744, "step": 35016 }, { "epoch": 0.94, "learning_rate": 1.8178279359044704e-05, "loss": 2.7395, "step": 35017 }, { "epoch": 0.94, "learning_rate": 1.8161762564804285e-05, "loss": 2.1237, "step": 35018 }, { "epoch": 0.94, "learning_rate": 1.814525320879479e-05, "loss": 2.7713, "step": 35019 }, { "epoch": 0.94, "learning_rate": 1.8128751291141444e-05, "loss": 2.7407, "step": 35020 }, { "epoch": 0.94, "learning_rate": 1.811225681196904e-05, "loss": 2.6346, "step": 35021 }, { "epoch": 0.94, "learning_rate": 1.8095769771402594e-05, "loss": 2.833, "step": 35022 }, { "epoch": 0.94, "learning_rate": 1.8079290169566998e-05, "loss": 2.5309, "step": 35023 }, { "epoch": 0.94, "learning_rate": 1.806281800658727e-05, "loss": 2.5473, "step": 35024 }, { "epoch": 0.94, "learning_rate": 1.804635328258808e-05, "loss": 2.9269, "step": 35025 }, { "epoch": 0.94, "learning_rate": 1.8029895997694113e-05, "loss": 2.2553, "step": 35026 }, { "epoch": 0.94, "learning_rate": 1.8013446152030042e-05, "loss": 2.4716, "step": 35027 }, { "epoch": 0.94, "learning_rate": 1.7997003745720663e-05, "loss": 2.5426, "step": 35028 }, { "epoch": 0.94, "learning_rate": 1.798056877889043e-05, "loss": 2.3961, "step": 35029 }, { "epoch": 0.94, "learning_rate": 1.796414125166368e-05, "loss": 2.3236, "step": 35030 }, { "epoch": 0.94, "learning_rate": 1.7947721164165097e-05, "loss": 2.3147, "step": 35031 }, { "epoch": 0.94, "learning_rate": 1.793130851651903e-05, "loss": 2.2255, "step": 35032 }, { "epoch": 0.94, "learning_rate": 1.7914903308849817e-05, "loss": 2.6671, "step": 35033 }, { "epoch": 0.94, "learning_rate": 1.7898505541281696e-05, "loss": 2.4255, "step": 35034 }, { "epoch": 0.94, "learning_rate": 1.7882115213938788e-05, "loss": 2.5979, "step": 35035 }, { "epoch": 0.94, "learning_rate": 1.786573232694555e-05, "loss": 2.1653, "step": 35036 }, { "epoch": 0.94, "learning_rate": 1.784935688042588e-05, "loss": 2.0492, "step": 35037 }, { "epoch": 0.94, "learning_rate": 1.78329888745038e-05, "loss": 2.9479, "step": 35038 }, { "epoch": 0.94, "learning_rate": 1.781662830930364e-05, "loss": 2.5054, "step": 35039 }, { "epoch": 0.94, "learning_rate": 1.7800275184948866e-05, "loss": 2.7169, "step": 35040 }, { "epoch": 0.94, "learning_rate": 1.778392950156382e-05, "loss": 2.5494, "step": 35041 }, { "epoch": 0.94, "learning_rate": 1.7767591259271965e-05, "loss": 2.3332, "step": 35042 }, { "epoch": 0.94, "learning_rate": 1.7751260458197195e-05, "loss": 2.4023, "step": 35043 }, { "epoch": 0.94, "learning_rate": 1.77349370984633e-05, "loss": 2.2801, "step": 35044 }, { "epoch": 0.94, "learning_rate": 1.771862118019396e-05, "loss": 2.6909, "step": 35045 }, { "epoch": 0.94, "learning_rate": 1.7702312703512746e-05, "loss": 2.5445, "step": 35046 }, { "epoch": 0.94, "learning_rate": 1.7686011668543224e-05, "loss": 2.8103, "step": 35047 }, { "epoch": 0.94, "learning_rate": 1.7669718075408735e-05, "loss": 2.9195, "step": 35048 }, { "epoch": 0.94, "learning_rate": 1.7653431924232856e-05, "loss": 2.5635, "step": 35049 }, { "epoch": 0.94, "learning_rate": 1.7637153215139036e-05, "loss": 2.1769, "step": 35050 }, { "epoch": 0.94, "learning_rate": 1.76208819482504e-05, "loss": 2.6302, "step": 35051 }, { "epoch": 0.94, "learning_rate": 1.760461812369052e-05, "loss": 2.5884, "step": 35052 }, { "epoch": 0.94, "learning_rate": 1.758836174158229e-05, "loss": 2.1434, "step": 35053 }, { "epoch": 0.94, "learning_rate": 1.7572112802048955e-05, "loss": 2.3805, "step": 35054 }, { "epoch": 0.94, "learning_rate": 1.7555871305213743e-05, "loss": 2.7513, "step": 35055 }, { "epoch": 0.94, "learning_rate": 1.7539637251199447e-05, "loss": 2.3705, "step": 35056 }, { "epoch": 0.94, "learning_rate": 1.75234106401293e-05, "loss": 2.2244, "step": 35057 }, { "epoch": 0.94, "learning_rate": 1.7507191472126206e-05, "loss": 2.7197, "step": 35058 }, { "epoch": 0.94, "learning_rate": 1.7490979747312953e-05, "loss": 2.6698, "step": 35059 }, { "epoch": 0.94, "learning_rate": 1.7474775465812443e-05, "loss": 2.1126, "step": 35060 }, { "epoch": 0.94, "learning_rate": 1.7458578627747246e-05, "loss": 2.8649, "step": 35061 }, { "epoch": 0.94, "learning_rate": 1.7442389233240264e-05, "loss": 2.7474, "step": 35062 }, { "epoch": 0.94, "learning_rate": 1.7426207282414065e-05, "loss": 2.5943, "step": 35063 }, { "epoch": 0.94, "learning_rate": 1.7410032775391214e-05, "loss": 2.4253, "step": 35064 }, { "epoch": 0.94, "learning_rate": 1.739386571229429e-05, "loss": 2.4517, "step": 35065 }, { "epoch": 0.94, "learning_rate": 1.737770609324585e-05, "loss": 2.4331, "step": 35066 }, { "epoch": 0.94, "learning_rate": 1.7361553918368132e-05, "loss": 2.4513, "step": 35067 }, { "epoch": 0.94, "learning_rate": 1.734540918778371e-05, "loss": 2.8425, "step": 35068 }, { "epoch": 0.94, "learning_rate": 1.7329271901614596e-05, "loss": 2.7517, "step": 35069 }, { "epoch": 0.94, "learning_rate": 1.7313142059983357e-05, "loss": 2.5, "step": 35070 }, { "epoch": 0.94, "learning_rate": 1.7297019663012115e-05, "loss": 2.7917, "step": 35071 }, { "epoch": 0.94, "learning_rate": 1.7280904710822887e-05, "loss": 1.992, "step": 35072 }, { "epoch": 0.94, "learning_rate": 1.7264797203537907e-05, "loss": 2.3453, "step": 35073 }, { "epoch": 0.94, "learning_rate": 1.724869714127908e-05, "loss": 2.545, "step": 35074 }, { "epoch": 0.94, "learning_rate": 1.7232604524168415e-05, "loss": 2.2583, "step": 35075 }, { "epoch": 0.94, "learning_rate": 1.721651935232782e-05, "loss": 2.5621, "step": 35076 }, { "epoch": 0.94, "learning_rate": 1.720044162587919e-05, "loss": 2.598, "step": 35077 }, { "epoch": 0.94, "learning_rate": 1.7184371344944215e-05, "loss": 2.2229, "step": 35078 }, { "epoch": 0.94, "learning_rate": 1.7168308509644903e-05, "loss": 2.5743, "step": 35079 }, { "epoch": 0.94, "learning_rate": 1.7152253120102712e-05, "loss": 2.0432, "step": 35080 }, { "epoch": 0.94, "learning_rate": 1.7136205176439322e-05, "loss": 2.8332, "step": 35081 }, { "epoch": 0.94, "learning_rate": 1.7120164678776307e-05, "loss": 2.2531, "step": 35082 }, { "epoch": 0.94, "learning_rate": 1.710413162723512e-05, "loss": 2.8652, "step": 35083 }, { "epoch": 0.94, "learning_rate": 1.7088106021937445e-05, "loss": 2.4412, "step": 35084 }, { "epoch": 0.94, "learning_rate": 1.7072087863004516e-05, "loss": 2.0602, "step": 35085 }, { "epoch": 0.94, "learning_rate": 1.7056077150557682e-05, "loss": 2.3844, "step": 35086 }, { "epoch": 0.94, "learning_rate": 1.7040073884718398e-05, "loss": 2.3023, "step": 35087 }, { "epoch": 0.94, "learning_rate": 1.7024078065607572e-05, "loss": 2.4839, "step": 35088 }, { "epoch": 0.94, "learning_rate": 1.7008089693346775e-05, "loss": 2.6405, "step": 35089 }, { "epoch": 0.94, "learning_rate": 1.699210876805679e-05, "loss": 2.4634, "step": 35090 }, { "epoch": 0.94, "learning_rate": 1.6976135289858863e-05, "loss": 2.8306, "step": 35091 }, { "epoch": 0.94, "learning_rate": 1.6960169258874115e-05, "loss": 2.3773, "step": 35092 }, { "epoch": 0.94, "learning_rate": 1.6944210675223336e-05, "loss": 2.2309, "step": 35093 }, { "epoch": 0.94, "learning_rate": 1.6928259539027434e-05, "loss": 2.4056, "step": 35094 }, { "epoch": 0.94, "learning_rate": 1.69123158504072e-05, "loss": 2.568, "step": 35095 }, { "epoch": 0.94, "learning_rate": 1.6896379609483535e-05, "loss": 2.1836, "step": 35096 }, { "epoch": 0.94, "learning_rate": 1.6880450816377234e-05, "loss": 2.4636, "step": 35097 }, { "epoch": 0.94, "learning_rate": 1.6864529471208867e-05, "loss": 2.8103, "step": 35098 }, { "epoch": 0.94, "learning_rate": 1.6848615574099004e-05, "loss": 2.423, "step": 35099 }, { "epoch": 0.94, "learning_rate": 1.683270912516821e-05, "loss": 2.239, "step": 35100 }, { "epoch": 0.94, "learning_rate": 1.6816810124537173e-05, "loss": 2.3351, "step": 35101 }, { "epoch": 0.94, "learning_rate": 1.680091857232613e-05, "loss": 2.7683, "step": 35102 }, { "epoch": 0.94, "learning_rate": 1.6785034468655424e-05, "loss": 2.7127, "step": 35103 }, { "epoch": 0.94, "learning_rate": 1.676915781364563e-05, "loss": 2.198, "step": 35104 }, { "epoch": 0.94, "learning_rate": 1.6753288607416872e-05, "loss": 2.1889, "step": 35105 }, { "epoch": 0.94, "learning_rate": 1.673742685008961e-05, "loss": 2.7752, "step": 35106 }, { "epoch": 0.94, "learning_rate": 1.6721572541783635e-05, "loss": 2.6387, "step": 35107 }, { "epoch": 0.94, "learning_rate": 1.6705725682619187e-05, "loss": 2.4306, "step": 35108 }, { "epoch": 0.94, "learning_rate": 1.6689886272716392e-05, "loss": 2.285, "step": 35109 }, { "epoch": 0.94, "learning_rate": 1.6674054312195264e-05, "loss": 2.4486, "step": 35110 }, { "epoch": 0.94, "learning_rate": 1.6658229801175707e-05, "loss": 2.5004, "step": 35111 }, { "epoch": 0.94, "learning_rate": 1.6642412739777625e-05, "loss": 2.4039, "step": 35112 }, { "epoch": 0.94, "learning_rate": 1.66266031281207e-05, "loss": 2.3361, "step": 35113 }, { "epoch": 0.94, "learning_rate": 1.6610800966324944e-05, "loss": 2.3461, "step": 35114 }, { "epoch": 0.94, "learning_rate": 1.6595006254509937e-05, "loss": 2.5028, "step": 35115 }, { "epoch": 0.94, "learning_rate": 1.6579218992795132e-05, "loss": 2.4923, "step": 35116 }, { "epoch": 0.94, "learning_rate": 1.6563439181300655e-05, "loss": 2.5116, "step": 35117 }, { "epoch": 0.94, "learning_rate": 1.6547666820145524e-05, "loss": 2.4921, "step": 35118 }, { "epoch": 0.94, "learning_rate": 1.653190190944953e-05, "loss": 2.4892, "step": 35119 }, { "epoch": 0.94, "learning_rate": 1.651614444933203e-05, "loss": 2.5429, "step": 35120 }, { "epoch": 0.94, "learning_rate": 1.6500394439912357e-05, "loss": 2.641, "step": 35121 }, { "epoch": 0.94, "learning_rate": 1.6484651881309874e-05, "loss": 2.4542, "step": 35122 }, { "epoch": 0.94, "learning_rate": 1.6468916773643815e-05, "loss": 2.414, "step": 35123 }, { "epoch": 0.94, "learning_rate": 1.6453189117033418e-05, "loss": 2.8308, "step": 35124 }, { "epoch": 0.94, "learning_rate": 1.643746891159781e-05, "loss": 2.0626, "step": 35125 }, { "epoch": 0.94, "learning_rate": 1.6421756157456112e-05, "loss": 2.6035, "step": 35126 }, { "epoch": 0.94, "learning_rate": 1.640605085472746e-05, "loss": 2.4503, "step": 35127 }, { "epoch": 0.94, "learning_rate": 1.6390353003530535e-05, "loss": 2.2064, "step": 35128 }, { "epoch": 0.94, "learning_rate": 1.6374662603984348e-05, "loss": 2.6776, "step": 35129 }, { "epoch": 0.94, "learning_rate": 1.635897965620814e-05, "loss": 2.3412, "step": 35130 }, { "epoch": 0.94, "learning_rate": 1.634330416032026e-05, "loss": 2.4738, "step": 35131 }, { "epoch": 0.94, "learning_rate": 1.6327636116439726e-05, "loss": 2.2918, "step": 35132 }, { "epoch": 0.94, "learning_rate": 1.6311975524685107e-05, "loss": 2.3638, "step": 35133 }, { "epoch": 0.94, "learning_rate": 1.62963223851752e-05, "loss": 2.7037, "step": 35134 }, { "epoch": 0.94, "learning_rate": 1.628067669802835e-05, "loss": 2.3727, "step": 35135 }, { "epoch": 0.94, "learning_rate": 1.6265038463363246e-05, "loss": 2.3836, "step": 35136 }, { "epoch": 0.94, "learning_rate": 1.6249407681298344e-05, "loss": 2.0744, "step": 35137 }, { "epoch": 0.94, "learning_rate": 1.6233784351952107e-05, "loss": 2.6636, "step": 35138 }, { "epoch": 0.94, "learning_rate": 1.6218168475442774e-05, "loss": 2.5771, "step": 35139 }, { "epoch": 0.94, "learning_rate": 1.6202560051888805e-05, "loss": 2.7358, "step": 35140 }, { "epoch": 0.94, "learning_rate": 1.6186959081408327e-05, "loss": 2.3243, "step": 35141 }, { "epoch": 0.94, "learning_rate": 1.6171365564119355e-05, "loss": 2.4306, "step": 35142 }, { "epoch": 0.94, "learning_rate": 1.6155779500140464e-05, "loss": 2.5281, "step": 35143 }, { "epoch": 0.94, "learning_rate": 1.6140200889589453e-05, "loss": 2.388, "step": 35144 }, { "epoch": 0.94, "learning_rate": 1.612462973258433e-05, "loss": 2.4854, "step": 35145 }, { "epoch": 0.94, "learning_rate": 1.6109066029243225e-05, "loss": 2.4635, "step": 35146 }, { "epoch": 0.94, "learning_rate": 1.6093509779683825e-05, "loss": 2.829, "step": 35147 }, { "epoch": 0.94, "learning_rate": 1.607796098402403e-05, "loss": 2.5234, "step": 35148 }, { "epoch": 0.94, "learning_rate": 1.6062419642381753e-05, "loss": 2.3035, "step": 35149 }, { "epoch": 0.94, "learning_rate": 1.6046885754874674e-05, "loss": 2.3773, "step": 35150 }, { "epoch": 0.94, "learning_rate": 1.6031359321620475e-05, "loss": 2.3516, "step": 35151 }, { "epoch": 0.94, "learning_rate": 1.601584034273684e-05, "loss": 2.6281, "step": 35152 }, { "epoch": 0.94, "learning_rate": 1.6000328818341237e-05, "loss": 2.6347, "step": 35153 }, { "epoch": 0.94, "learning_rate": 1.598482474855123e-05, "loss": 2.5157, "step": 35154 }, { "epoch": 0.94, "learning_rate": 1.5969328133484173e-05, "loss": 2.3671, "step": 35155 }, { "epoch": 0.94, "learning_rate": 1.5953838973257638e-05, "loss": 2.374, "step": 35156 }, { "epoch": 0.94, "learning_rate": 1.593835726798898e-05, "loss": 2.5987, "step": 35157 }, { "epoch": 0.94, "learning_rate": 1.592288301779521e-05, "loss": 2.572, "step": 35158 }, { "epoch": 0.94, "learning_rate": 1.5907416222793904e-05, "loss": 2.5679, "step": 35159 }, { "epoch": 0.94, "learning_rate": 1.5891956883101964e-05, "loss": 2.4775, "step": 35160 }, { "epoch": 0.94, "learning_rate": 1.5876504998836637e-05, "loss": 2.4391, "step": 35161 }, { "epoch": 0.94, "learning_rate": 1.5861060570115048e-05, "loss": 2.5399, "step": 35162 }, { "epoch": 0.94, "learning_rate": 1.5845623597053994e-05, "loss": 2.3953, "step": 35163 }, { "epoch": 0.94, "learning_rate": 1.5830194079770598e-05, "loss": 2.3701, "step": 35164 }, { "epoch": 0.95, "learning_rate": 1.5814772018381774e-05, "loss": 2.3775, "step": 35165 }, { "epoch": 0.95, "learning_rate": 1.57993574130042e-05, "loss": 2.5141, "step": 35166 }, { "epoch": 0.95, "learning_rate": 1.5783950263754676e-05, "loss": 2.8143, "step": 35167 }, { "epoch": 0.95, "learning_rate": 1.5768550570749997e-05, "loss": 2.3761, "step": 35168 }, { "epoch": 0.95, "learning_rate": 1.5753158334106842e-05, "loss": 2.631, "step": 35169 }, { "epoch": 0.95, "learning_rate": 1.5737773553941902e-05, "loss": 2.6728, "step": 35170 }, { "epoch": 0.95, "learning_rate": 1.5722396230371528e-05, "loss": 2.8196, "step": 35171 }, { "epoch": 0.95, "learning_rate": 1.570702636351229e-05, "loss": 2.5977, "step": 35172 }, { "epoch": 0.95, "learning_rate": 1.569166395348076e-05, "loss": 2.6402, "step": 35173 }, { "epoch": 0.95, "learning_rate": 1.5676309000393073e-05, "loss": 2.4609, "step": 35174 }, { "epoch": 0.95, "learning_rate": 1.566096150436569e-05, "loss": 2.4295, "step": 35175 }, { "epoch": 0.95, "learning_rate": 1.5645621465514958e-05, "loss": 2.4556, "step": 35176 }, { "epoch": 0.95, "learning_rate": 1.563028888395701e-05, "loss": 2.2575, "step": 35177 }, { "epoch": 0.95, "learning_rate": 1.5614963759807867e-05, "loss": 2.6678, "step": 35178 }, { "epoch": 0.95, "learning_rate": 1.5599646093183983e-05, "loss": 2.6321, "step": 35179 }, { "epoch": 0.95, "learning_rate": 1.558433588420105e-05, "loss": 2.5209, "step": 35180 }, { "epoch": 0.95, "learning_rate": 1.5569033132975197e-05, "loss": 2.4261, "step": 35181 }, { "epoch": 0.95, "learning_rate": 1.5553737839622328e-05, "loss": 2.4361, "step": 35182 }, { "epoch": 0.95, "learning_rate": 1.5538450004258353e-05, "loss": 2.9525, "step": 35183 }, { "epoch": 0.95, "learning_rate": 1.5523169626999177e-05, "loss": 2.4911, "step": 35184 }, { "epoch": 0.95, "learning_rate": 1.550789670796038e-05, "loss": 2.2017, "step": 35185 }, { "epoch": 0.95, "learning_rate": 1.549263124725775e-05, "loss": 2.1789, "step": 35186 }, { "epoch": 0.95, "learning_rate": 1.5477373245006975e-05, "loss": 2.1531, "step": 35187 }, { "epoch": 0.95, "learning_rate": 1.5462122701323523e-05, "loss": 2.3618, "step": 35188 }, { "epoch": 0.95, "learning_rate": 1.5446879616323072e-05, "loss": 2.4336, "step": 35189 }, { "epoch": 0.95, "learning_rate": 1.543164399012098e-05, "loss": 2.8219, "step": 35190 }, { "epoch": 0.95, "learning_rate": 1.541641582283271e-05, "loss": 2.4204, "step": 35191 }, { "epoch": 0.95, "learning_rate": 1.540119511457383e-05, "loss": 2.4849, "step": 35192 }, { "epoch": 0.95, "learning_rate": 1.5385981865459254e-05, "loss": 1.9818, "step": 35193 }, { "epoch": 0.95, "learning_rate": 1.5370776075604555e-05, "loss": 2.5498, "step": 35194 }, { "epoch": 0.95, "learning_rate": 1.535557774512475e-05, "loss": 2.3085, "step": 35195 }, { "epoch": 0.95, "learning_rate": 1.5340386874135082e-05, "loss": 2.4032, "step": 35196 }, { "epoch": 0.95, "learning_rate": 1.5325203462750682e-05, "loss": 2.3608, "step": 35197 }, { "epoch": 0.95, "learning_rate": 1.5310027511086454e-05, "loss": 2.5766, "step": 35198 }, { "epoch": 0.95, "learning_rate": 1.5294859019257314e-05, "loss": 2.7052, "step": 35199 }, { "epoch": 0.95, "learning_rate": 1.5279697987378382e-05, "loss": 2.5534, "step": 35200 }, { "epoch": 0.95, "learning_rate": 1.5264544415564352e-05, "loss": 2.3794, "step": 35201 }, { "epoch": 0.95, "learning_rate": 1.5249398303930017e-05, "loss": 3.0053, "step": 35202 }, { "epoch": 0.95, "learning_rate": 1.5234259652590399e-05, "loss": 2.258, "step": 35203 }, { "epoch": 0.95, "learning_rate": 1.5219128461659847e-05, "loss": 2.5922, "step": 35204 }, { "epoch": 0.95, "learning_rate": 1.5204004731253052e-05, "loss": 2.4643, "step": 35205 }, { "epoch": 0.95, "learning_rate": 1.5188888461484807e-05, "loss": 2.2277, "step": 35206 }, { "epoch": 0.95, "learning_rate": 1.5173779652469355e-05, "loss": 2.409, "step": 35207 }, { "epoch": 0.95, "learning_rate": 1.5158678304321271e-05, "loss": 2.2479, "step": 35208 }, { "epoch": 0.95, "learning_rate": 1.514358441715491e-05, "loss": 2.4783, "step": 35209 }, { "epoch": 0.95, "learning_rate": 1.5128497991084733e-05, "loss": 2.7346, "step": 35210 }, { "epoch": 0.95, "learning_rate": 1.5113419026225094e-05, "loss": 2.2818, "step": 35211 }, { "epoch": 0.95, "learning_rate": 1.5098347522690014e-05, "loss": 2.2307, "step": 35212 }, { "epoch": 0.95, "learning_rate": 1.5083283480593735e-05, "loss": 2.4209, "step": 35213 }, { "epoch": 0.95, "learning_rate": 1.5068226900050496e-05, "loss": 2.4364, "step": 35214 }, { "epoch": 0.95, "learning_rate": 1.505317778117421e-05, "loss": 2.2831, "step": 35215 }, { "epoch": 0.95, "learning_rate": 1.5038136124079005e-05, "loss": 2.675, "step": 35216 }, { "epoch": 0.95, "learning_rate": 1.5023101928878791e-05, "loss": 2.3493, "step": 35217 }, { "epoch": 0.95, "learning_rate": 1.5008075195687365e-05, "loss": 2.3607, "step": 35218 }, { "epoch": 0.95, "learning_rate": 1.4993055924618859e-05, "loss": 2.3677, "step": 35219 }, { "epoch": 0.95, "learning_rate": 1.4978044115786737e-05, "loss": 2.692, "step": 35220 }, { "epoch": 0.95, "learning_rate": 1.4963039769304798e-05, "loss": 2.9293, "step": 35221 }, { "epoch": 0.95, "learning_rate": 1.4948042885286839e-05, "loss": 2.5836, "step": 35222 }, { "epoch": 0.95, "learning_rate": 1.4933053463846324e-05, "loss": 2.6863, "step": 35223 }, { "epoch": 0.95, "learning_rate": 1.4918071505096942e-05, "loss": 2.2142, "step": 35224 }, { "epoch": 0.95, "learning_rate": 1.4903097009152155e-05, "loss": 2.4042, "step": 35225 }, { "epoch": 0.95, "learning_rate": 1.488812997612532e-05, "loss": 2.6456, "step": 35226 }, { "epoch": 0.95, "learning_rate": 1.4873170406129899e-05, "loss": 2.6121, "step": 35227 }, { "epoch": 0.95, "learning_rate": 1.4858218299279136e-05, "loss": 2.5708, "step": 35228 }, { "epoch": 0.95, "learning_rate": 1.4843273655686495e-05, "loss": 2.1308, "step": 35229 }, { "epoch": 0.95, "learning_rate": 1.482833647546511e-05, "loss": 2.5854, "step": 35230 }, { "epoch": 0.95, "learning_rate": 1.481340675872811e-05, "loss": 2.7035, "step": 35231 }, { "epoch": 0.95, "learning_rate": 1.4798484505588627e-05, "loss": 2.6171, "step": 35232 }, { "epoch": 0.95, "learning_rate": 1.4783569716159573e-05, "loss": 2.51, "step": 35233 }, { "epoch": 0.95, "learning_rate": 1.4768662390554189e-05, "loss": 2.6508, "step": 35234 }, { "epoch": 0.95, "learning_rate": 1.4753762528885162e-05, "loss": 2.4349, "step": 35235 }, { "epoch": 0.95, "learning_rate": 1.4738870131265514e-05, "loss": 2.4445, "step": 35236 }, { "epoch": 0.95, "learning_rate": 1.4723985197808044e-05, "loss": 2.6811, "step": 35237 }, { "epoch": 0.95, "learning_rate": 1.4709107728625548e-05, "loss": 2.5361, "step": 35238 }, { "epoch": 0.95, "learning_rate": 1.4694237723830606e-05, "loss": 2.3782, "step": 35239 }, { "epoch": 0.95, "learning_rate": 1.4679375183536014e-05, "loss": 2.4316, "step": 35240 }, { "epoch": 0.95, "learning_rate": 1.4664520107854351e-05, "loss": 2.2827, "step": 35241 }, { "epoch": 0.95, "learning_rate": 1.4649672496898082e-05, "loss": 2.1575, "step": 35242 }, { "epoch": 0.95, "learning_rate": 1.4634832350779781e-05, "loss": 2.0145, "step": 35243 }, { "epoch": 0.95, "learning_rate": 1.4619999669611806e-05, "loss": 1.9458, "step": 35244 }, { "epoch": 0.95, "learning_rate": 1.460517445350651e-05, "loss": 2.8915, "step": 35245 }, { "epoch": 0.95, "learning_rate": 1.4590356702576247e-05, "loss": 2.1944, "step": 35246 }, { "epoch": 0.95, "learning_rate": 1.4575546416933261e-05, "loss": 2.5456, "step": 35247 }, { "epoch": 0.95, "learning_rate": 1.4560743596689685e-05, "loss": 2.5339, "step": 35248 }, { "epoch": 0.95, "learning_rate": 1.4545948241957874e-05, "loss": 2.069, "step": 35249 }, { "epoch": 0.95, "learning_rate": 1.4531160352849738e-05, "loss": 2.4404, "step": 35250 }, { "epoch": 0.95, "learning_rate": 1.4516379929477408e-05, "loss": 2.4391, "step": 35251 }, { "epoch": 0.95, "learning_rate": 1.4501606971952685e-05, "loss": 1.9688, "step": 35252 }, { "epoch": 0.95, "learning_rate": 1.4486841480387591e-05, "loss": 2.5721, "step": 35253 }, { "epoch": 0.95, "learning_rate": 1.4472083454894037e-05, "loss": 2.5305, "step": 35254 }, { "epoch": 0.95, "learning_rate": 1.4457332895583707e-05, "loss": 2.3517, "step": 35255 }, { "epoch": 0.95, "learning_rate": 1.4442589802568518e-05, "loss": 2.3906, "step": 35256 }, { "epoch": 0.95, "learning_rate": 1.4427854175960153e-05, "loss": 2.4656, "step": 35257 }, { "epoch": 0.95, "learning_rate": 1.441312601586997e-05, "loss": 2.3826, "step": 35258 }, { "epoch": 0.95, "learning_rate": 1.439840532240988e-05, "loss": 2.3762, "step": 35259 }, { "epoch": 0.95, "learning_rate": 1.4383692095691237e-05, "loss": 2.5243, "step": 35260 }, { "epoch": 0.95, "learning_rate": 1.4368986335825396e-05, "loss": 2.3434, "step": 35261 }, { "epoch": 0.95, "learning_rate": 1.4354288042924046e-05, "loss": 2.1827, "step": 35262 }, { "epoch": 0.95, "learning_rate": 1.4339597217098321e-05, "loss": 2.6586, "step": 35263 }, { "epoch": 0.95, "learning_rate": 1.4324913858459575e-05, "loss": 2.1399, "step": 35264 }, { "epoch": 0.95, "learning_rate": 1.4310237967119167e-05, "loss": 2.6562, "step": 35265 }, { "epoch": 0.95, "learning_rate": 1.4295569543188113e-05, "loss": 2.4784, "step": 35266 }, { "epoch": 0.95, "learning_rate": 1.4280908586777552e-05, "loss": 2.4752, "step": 35267 }, { "epoch": 0.95, "learning_rate": 1.4266255097998615e-05, "loss": 2.0844, "step": 35268 }, { "epoch": 0.95, "learning_rate": 1.4251609076962324e-05, "loss": 2.3199, "step": 35269 }, { "epoch": 0.95, "learning_rate": 1.4236970523779702e-05, "loss": 2.5759, "step": 35270 }, { "epoch": 0.95, "learning_rate": 1.4222339438561438e-05, "loss": 2.4627, "step": 35271 }, { "epoch": 0.95, "learning_rate": 1.4207715821418443e-05, "loss": 2.2148, "step": 35272 }, { "epoch": 0.95, "learning_rate": 1.4193099672461629e-05, "loss": 2.3092, "step": 35273 }, { "epoch": 0.95, "learning_rate": 1.4178490991801573e-05, "loss": 2.6988, "step": 35274 }, { "epoch": 0.95, "learning_rate": 1.4163889779549077e-05, "loss": 2.3635, "step": 35275 }, { "epoch": 0.95, "learning_rate": 1.4149296035814719e-05, "loss": 2.5713, "step": 35276 }, { "epoch": 0.95, "learning_rate": 1.4134709760709075e-05, "loss": 2.2956, "step": 35277 }, { "epoch": 0.95, "learning_rate": 1.4120130954342614e-05, "loss": 2.4747, "step": 35278 }, { "epoch": 0.95, "learning_rate": 1.4105559616825691e-05, "loss": 2.4388, "step": 35279 }, { "epoch": 0.95, "learning_rate": 1.4090995748268776e-05, "loss": 2.1661, "step": 35280 }, { "epoch": 0.95, "learning_rate": 1.4076439348782221e-05, "loss": 2.1449, "step": 35281 }, { "epoch": 0.95, "learning_rate": 1.4061890418476386e-05, "loss": 2.2852, "step": 35282 }, { "epoch": 0.95, "learning_rate": 1.4047348957461293e-05, "loss": 2.1118, "step": 35283 }, { "epoch": 0.95, "learning_rate": 1.4032814965847296e-05, "loss": 2.7607, "step": 35284 }, { "epoch": 0.95, "learning_rate": 1.401828844374442e-05, "loss": 2.7551, "step": 35285 }, { "epoch": 0.95, "learning_rate": 1.4003769391262689e-05, "loss": 2.2868, "step": 35286 }, { "epoch": 0.95, "learning_rate": 1.3989257808512012e-05, "loss": 2.0528, "step": 35287 }, { "epoch": 0.95, "learning_rate": 1.3974753695602527e-05, "loss": 2.179, "step": 35288 }, { "epoch": 0.95, "learning_rate": 1.3960257052644143e-05, "loss": 2.6059, "step": 35289 }, { "epoch": 0.95, "learning_rate": 1.394576787974644e-05, "loss": 2.2399, "step": 35290 }, { "epoch": 0.95, "learning_rate": 1.3931286177019332e-05, "loss": 2.3537, "step": 35291 }, { "epoch": 0.95, "learning_rate": 1.3916811944572505e-05, "loss": 2.6218, "step": 35292 }, { "epoch": 0.95, "learning_rate": 1.3902345182515653e-05, "loss": 2.5993, "step": 35293 }, { "epoch": 0.95, "learning_rate": 1.388788589095824e-05, "loss": 2.8843, "step": 35294 }, { "epoch": 0.95, "learning_rate": 1.387343407000996e-05, "loss": 2.0393, "step": 35295 }, { "epoch": 0.95, "learning_rate": 1.3858989719780168e-05, "loss": 2.4248, "step": 35296 }, { "epoch": 0.95, "learning_rate": 1.3844552840378555e-05, "loss": 2.12, "step": 35297 }, { "epoch": 0.95, "learning_rate": 1.3830123431914144e-05, "loss": 2.8551, "step": 35298 }, { "epoch": 0.95, "learning_rate": 1.3815701494496401e-05, "loss": 2.3809, "step": 35299 }, { "epoch": 0.95, "learning_rate": 1.3801287028234689e-05, "loss": 2.5357, "step": 35300 }, { "epoch": 0.95, "learning_rate": 1.3786880033238026e-05, "loss": 2.2453, "step": 35301 }, { "epoch": 0.95, "learning_rate": 1.377248050961566e-05, "loss": 2.8822, "step": 35302 }, { "epoch": 0.95, "learning_rate": 1.3758088457476725e-05, "loss": 2.1982, "step": 35303 }, { "epoch": 0.95, "learning_rate": 1.3743703876930136e-05, "loss": 2.5998, "step": 35304 }, { "epoch": 0.95, "learning_rate": 1.3729326768084915e-05, "loss": 2.5944, "step": 35305 }, { "epoch": 0.95, "learning_rate": 1.3714957131049977e-05, "loss": 2.6333, "step": 35306 }, { "epoch": 0.95, "learning_rate": 1.3700594965934232e-05, "loss": 2.3549, "step": 35307 }, { "epoch": 0.95, "learning_rate": 1.3686240272846374e-05, "loss": 2.5038, "step": 35308 }, { "epoch": 0.95, "learning_rate": 1.3671893051895201e-05, "loss": 2.6545, "step": 35309 }, { "epoch": 0.95, "learning_rate": 1.3657553303189629e-05, "loss": 2.6094, "step": 35310 }, { "epoch": 0.95, "learning_rate": 1.3643221026837904e-05, "loss": 2.6178, "step": 35311 }, { "epoch": 0.95, "learning_rate": 1.3628896222948828e-05, "loss": 2.2016, "step": 35312 }, { "epoch": 0.95, "learning_rate": 1.3614578891630868e-05, "loss": 2.3194, "step": 35313 }, { "epoch": 0.95, "learning_rate": 1.3600269032992607e-05, "loss": 2.5743, "step": 35314 }, { "epoch": 0.95, "learning_rate": 1.358596664714229e-05, "loss": 2.2391, "step": 35315 }, { "epoch": 0.95, "learning_rate": 1.3571671734188384e-05, "loss": 2.9336, "step": 35316 }, { "epoch": 0.95, "learning_rate": 1.3557384294239028e-05, "loss": 2.7071, "step": 35317 }, { "epoch": 0.95, "learning_rate": 1.3543104327402688e-05, "loss": 2.3581, "step": 35318 }, { "epoch": 0.95, "learning_rate": 1.3528831833787391e-05, "loss": 1.7978, "step": 35319 }, { "epoch": 0.95, "learning_rate": 1.3514566813501272e-05, "loss": 2.4222, "step": 35320 }, { "epoch": 0.95, "learning_rate": 1.3500309266652355e-05, "loss": 2.6009, "step": 35321 }, { "epoch": 0.95, "learning_rate": 1.3486059193348888e-05, "loss": 2.2506, "step": 35322 }, { "epoch": 0.95, "learning_rate": 1.347181659369856e-05, "loss": 2.6049, "step": 35323 }, { "epoch": 0.95, "learning_rate": 1.34575814678094e-05, "loss": 2.0032, "step": 35324 }, { "epoch": 0.95, "learning_rate": 1.3443353815789206e-05, "loss": 2.3385, "step": 35325 }, { "epoch": 0.95, "learning_rate": 1.3429133637745784e-05, "loss": 2.7489, "step": 35326 }, { "epoch": 0.95, "learning_rate": 1.3414920933786933e-05, "loss": 2.7982, "step": 35327 }, { "epoch": 0.95, "learning_rate": 1.3400715704020128e-05, "loss": 2.4914, "step": 35328 }, { "epoch": 0.95, "learning_rate": 1.3386517948553278e-05, "loss": 2.4374, "step": 35329 }, { "epoch": 0.95, "learning_rate": 1.3372327667493634e-05, "loss": 2.458, "step": 35330 }, { "epoch": 0.95, "learning_rate": 1.3358144860948884e-05, "loss": 2.1874, "step": 35331 }, { "epoch": 0.95, "learning_rate": 1.33439695290265e-05, "loss": 2.4161, "step": 35332 }, { "epoch": 0.95, "learning_rate": 1.3329801671833842e-05, "loss": 2.3151, "step": 35333 }, { "epoch": 0.95, "learning_rate": 1.3315641289477932e-05, "loss": 2.2651, "step": 35334 }, { "epoch": 0.95, "learning_rate": 1.3301488382066573e-05, "loss": 2.5165, "step": 35335 }, { "epoch": 0.95, "learning_rate": 1.3287342949706682e-05, "loss": 2.3897, "step": 35336 }, { "epoch": 0.95, "learning_rate": 1.3273204992505506e-05, "loss": 2.2672, "step": 35337 }, { "epoch": 0.95, "learning_rate": 1.3259074510570068e-05, "loss": 2.3398, "step": 35338 }, { "epoch": 0.95, "learning_rate": 1.3244951504007508e-05, "loss": 2.7942, "step": 35339 }, { "epoch": 0.95, "learning_rate": 1.3230835972924738e-05, "loss": 2.2074, "step": 35340 }, { "epoch": 0.95, "learning_rate": 1.3216727917428672e-05, "loss": 2.1953, "step": 35341 }, { "epoch": 0.95, "learning_rate": 1.3202627337626338e-05, "loss": 2.4518, "step": 35342 }, { "epoch": 0.95, "learning_rate": 1.3188534233624539e-05, "loss": 2.295, "step": 35343 }, { "epoch": 0.95, "learning_rate": 1.3174448605529854e-05, "loss": 1.9935, "step": 35344 }, { "epoch": 0.95, "learning_rate": 1.31603704534492e-05, "loss": 2.4278, "step": 35345 }, { "epoch": 0.95, "learning_rate": 1.3146299777489157e-05, "loss": 2.3341, "step": 35346 }, { "epoch": 0.95, "learning_rate": 1.3132236577756196e-05, "loss": 1.9125, "step": 35347 }, { "epoch": 0.95, "learning_rate": 1.311818085435712e-05, "loss": 2.3903, "step": 35348 }, { "epoch": 0.95, "learning_rate": 1.3104132607398178e-05, "loss": 2.4089, "step": 35349 }, { "epoch": 0.95, "learning_rate": 1.309009183698584e-05, "loss": 2.3983, "step": 35350 }, { "epoch": 0.95, "learning_rate": 1.3076058543226688e-05, "loss": 2.3929, "step": 35351 }, { "epoch": 0.95, "learning_rate": 1.3062032726226747e-05, "loss": 2.5656, "step": 35352 }, { "epoch": 0.95, "learning_rate": 1.3048014386092377e-05, "loss": 2.2663, "step": 35353 }, { "epoch": 0.95, "learning_rate": 1.3034003522929828e-05, "loss": 2.4035, "step": 35354 }, { "epoch": 0.95, "learning_rate": 1.3020000136845234e-05, "loss": 2.4503, "step": 35355 }, { "epoch": 0.95, "learning_rate": 1.3006004227944735e-05, "loss": 2.185, "step": 35356 }, { "epoch": 0.95, "learning_rate": 1.2992015796334244e-05, "loss": 2.6345, "step": 35357 }, { "epoch": 0.95, "learning_rate": 1.297803484211979e-05, "loss": 2.8268, "step": 35358 }, { "epoch": 0.95, "learning_rate": 1.2964061365407288e-05, "loss": 2.8184, "step": 35359 }, { "epoch": 0.95, "learning_rate": 1.2950095366302428e-05, "loss": 2.844, "step": 35360 }, { "epoch": 0.95, "learning_rate": 1.293613684491135e-05, "loss": 2.5252, "step": 35361 }, { "epoch": 0.95, "learning_rate": 1.2922185801339637e-05, "loss": 2.363, "step": 35362 }, { "epoch": 0.95, "learning_rate": 1.2908242235692868e-05, "loss": 2.5023, "step": 35363 }, { "epoch": 0.95, "learning_rate": 1.289430614807685e-05, "loss": 2.6084, "step": 35364 }, { "epoch": 0.95, "learning_rate": 1.2880377538597055e-05, "loss": 2.7702, "step": 35365 }, { "epoch": 0.95, "learning_rate": 1.2866456407359062e-05, "loss": 2.193, "step": 35366 }, { "epoch": 0.95, "learning_rate": 1.2852542754468344e-05, "loss": 2.4561, "step": 35367 }, { "epoch": 0.95, "learning_rate": 1.283863658003015e-05, "loss": 2.1621, "step": 35368 }, { "epoch": 0.95, "learning_rate": 1.2824737884150062e-05, "loss": 2.5765, "step": 35369 }, { "epoch": 0.95, "learning_rate": 1.281084666693333e-05, "loss": 2.763, "step": 35370 }, { "epoch": 0.95, "learning_rate": 1.2796962928484978e-05, "loss": 2.5517, "step": 35371 }, { "epoch": 0.95, "learning_rate": 1.2783086668910482e-05, "loss": 2.0866, "step": 35372 }, { "epoch": 0.95, "learning_rate": 1.2769217888314644e-05, "loss": 2.1767, "step": 35373 }, { "epoch": 0.95, "learning_rate": 1.2755356586802824e-05, "loss": 2.408, "step": 35374 }, { "epoch": 0.95, "learning_rate": 1.2741502764480051e-05, "loss": 2.4557, "step": 35375 }, { "epoch": 0.95, "learning_rate": 1.2727656421450906e-05, "loss": 2.5432, "step": 35376 }, { "epoch": 0.95, "learning_rate": 1.2713817557820639e-05, "loss": 2.816, "step": 35377 }, { "epoch": 0.95, "learning_rate": 1.2699986173694055e-05, "loss": 2.2909, "step": 35378 }, { "epoch": 0.95, "learning_rate": 1.2686162269175739e-05, "loss": 2.712, "step": 35379 }, { "epoch": 0.95, "learning_rate": 1.2672345844370603e-05, "loss": 2.6518, "step": 35380 }, { "epoch": 0.95, "learning_rate": 1.2658536899383233e-05, "loss": 2.3292, "step": 35381 }, { "epoch": 0.95, "learning_rate": 1.2644735434318322e-05, "loss": 2.5742, "step": 35382 }, { "epoch": 0.95, "learning_rate": 1.2630941449280343e-05, "loss": 2.5005, "step": 35383 }, { "epoch": 0.95, "learning_rate": 1.2617154944373766e-05, "loss": 2.0627, "step": 35384 }, { "epoch": 0.95, "learning_rate": 1.2603375919703175e-05, "loss": 2.582, "step": 35385 }, { "epoch": 0.95, "learning_rate": 1.258960437537282e-05, "loss": 2.6578, "step": 35386 }, { "epoch": 0.95, "learning_rate": 1.2575840311487063e-05, "loss": 2.9627, "step": 35387 }, { "epoch": 0.95, "learning_rate": 1.2562083728150263e-05, "loss": 2.4451, "step": 35388 }, { "epoch": 0.95, "learning_rate": 1.2548334625466673e-05, "loss": 2.6458, "step": 35389 }, { "epoch": 0.95, "learning_rate": 1.2534593003540207e-05, "loss": 2.6587, "step": 35390 }, { "epoch": 0.95, "learning_rate": 1.2520858862475226e-05, "loss": 2.0786, "step": 35391 }, { "epoch": 0.95, "learning_rate": 1.2507132202375648e-05, "loss": 2.5017, "step": 35392 }, { "epoch": 0.95, "learning_rate": 1.249341302334539e-05, "loss": 2.076, "step": 35393 }, { "epoch": 0.95, "learning_rate": 1.2479701325488591e-05, "loss": 2.1225, "step": 35394 }, { "epoch": 0.95, "learning_rate": 1.2465997108908944e-05, "loss": 2.685, "step": 35395 }, { "epoch": 0.95, "learning_rate": 1.2452300373710368e-05, "loss": 2.4344, "step": 35396 }, { "epoch": 0.95, "learning_rate": 1.2438611119996779e-05, "loss": 2.5422, "step": 35397 }, { "epoch": 0.95, "learning_rate": 1.2424929347871539e-05, "loss": 2.4872, "step": 35398 }, { "epoch": 0.95, "learning_rate": 1.2411255057438454e-05, "loss": 2.2675, "step": 35399 }, { "epoch": 0.95, "learning_rate": 1.2397588248801217e-05, "loss": 2.6671, "step": 35400 }, { "epoch": 0.95, "learning_rate": 1.2383928922063192e-05, "loss": 2.347, "step": 35401 }, { "epoch": 0.95, "learning_rate": 1.2370277077328073e-05, "loss": 2.614, "step": 35402 }, { "epoch": 0.95, "learning_rate": 1.2356632714699112e-05, "loss": 2.5772, "step": 35403 }, { "epoch": 0.95, "learning_rate": 1.2342995834279668e-05, "loss": 2.3377, "step": 35404 }, { "epoch": 0.95, "learning_rate": 1.2329366436173217e-05, "loss": 2.57, "step": 35405 }, { "epoch": 0.95, "learning_rate": 1.2315744520482786e-05, "loss": 2.0023, "step": 35406 }, { "epoch": 0.95, "learning_rate": 1.2302130087311847e-05, "loss": 2.3463, "step": 35407 }, { "epoch": 0.95, "learning_rate": 1.2288523136763207e-05, "loss": 2.3439, "step": 35408 }, { "epoch": 0.95, "learning_rate": 1.227492366894023e-05, "loss": 2.1286, "step": 35409 }, { "epoch": 0.95, "learning_rate": 1.2261331683945942e-05, "loss": 2.5642, "step": 35410 }, { "epoch": 0.95, "learning_rate": 1.224774718188304e-05, "loss": 2.2925, "step": 35411 }, { "epoch": 0.95, "learning_rate": 1.2234170162854663e-05, "loss": 2.9693, "step": 35412 }, { "epoch": 0.95, "learning_rate": 1.2220600626963618e-05, "loss": 2.1339, "step": 35413 }, { "epoch": 0.95, "learning_rate": 1.2207038574312712e-05, "loss": 2.5593, "step": 35414 }, { "epoch": 0.95, "learning_rate": 1.219348400500475e-05, "loss": 1.8547, "step": 35415 }, { "epoch": 0.95, "learning_rate": 1.217993691914232e-05, "loss": 2.5231, "step": 35416 }, { "epoch": 0.95, "learning_rate": 1.2166397316828004e-05, "loss": 2.5309, "step": 35417 }, { "epoch": 0.95, "learning_rate": 1.2152865198164498e-05, "loss": 2.5488, "step": 35418 }, { "epoch": 0.95, "learning_rate": 1.2139340563254276e-05, "loss": 2.2322, "step": 35419 }, { "epoch": 0.95, "learning_rate": 1.21258234121997e-05, "loss": 2.4613, "step": 35420 }, { "epoch": 0.95, "learning_rate": 1.2112313745103465e-05, "loss": 2.5824, "step": 35421 }, { "epoch": 0.95, "learning_rate": 1.2098811562067603e-05, "loss": 2.5263, "step": 35422 }, { "epoch": 0.95, "learning_rate": 1.2085316863194585e-05, "loss": 2.4152, "step": 35423 }, { "epoch": 0.95, "learning_rate": 1.2071829648586553e-05, "loss": 2.304, "step": 35424 }, { "epoch": 0.95, "learning_rate": 1.2058349918345646e-05, "loss": 2.4137, "step": 35425 }, { "epoch": 0.95, "learning_rate": 1.2044877672574117e-05, "loss": 2.4086, "step": 35426 }, { "epoch": 0.95, "learning_rate": 1.2031412911373996e-05, "loss": 2.4949, "step": 35427 }, { "epoch": 0.95, "learning_rate": 1.20179556348472e-05, "loss": 2.7602, "step": 35428 }, { "epoch": 0.95, "learning_rate": 1.2004505843095759e-05, "loss": 2.3518, "step": 35429 }, { "epoch": 0.95, "learning_rate": 1.1991063536221592e-05, "loss": 2.5911, "step": 35430 }, { "epoch": 0.95, "learning_rate": 1.1977628714326393e-05, "loss": 2.4587, "step": 35431 }, { "epoch": 0.95, "learning_rate": 1.1964201377512086e-05, "loss": 2.0629, "step": 35432 }, { "epoch": 0.95, "learning_rate": 1.195078152588036e-05, "loss": 2.6919, "step": 35433 }, { "epoch": 0.95, "learning_rate": 1.1937369159532918e-05, "loss": 2.2777, "step": 35434 }, { "epoch": 0.95, "learning_rate": 1.1923964278571231e-05, "loss": 2.7481, "step": 35435 }, { "epoch": 0.95, "learning_rate": 1.1910566883096886e-05, "loss": 2.3714, "step": 35436 }, { "epoch": 0.95, "learning_rate": 1.1897176973211576e-05, "loss": 2.281, "step": 35437 }, { "epoch": 0.95, "learning_rate": 1.1883794549016558e-05, "loss": 2.2391, "step": 35438 }, { "epoch": 0.95, "learning_rate": 1.1870419610613193e-05, "loss": 2.3399, "step": 35439 }, { "epoch": 0.95, "learning_rate": 1.1857052158102844e-05, "loss": 2.1306, "step": 35440 }, { "epoch": 0.95, "learning_rate": 1.1843692191586875e-05, "loss": 2.5076, "step": 35441 }, { "epoch": 0.95, "learning_rate": 1.1830339711166427e-05, "loss": 2.2774, "step": 35442 }, { "epoch": 0.95, "learning_rate": 1.1816994716942641e-05, "loss": 2.8695, "step": 35443 }, { "epoch": 0.95, "learning_rate": 1.180365720901666e-05, "loss": 2.2054, "step": 35444 }, { "epoch": 0.95, "learning_rate": 1.1790327187489403e-05, "loss": 2.0263, "step": 35445 }, { "epoch": 0.95, "learning_rate": 1.1777004652462009e-05, "loss": 2.2775, "step": 35446 }, { "epoch": 0.95, "learning_rate": 1.1763689604035399e-05, "loss": 2.9907, "step": 35447 }, { "epoch": 0.95, "learning_rate": 1.1750382042310381e-05, "loss": 2.9627, "step": 35448 }, { "epoch": 0.95, "learning_rate": 1.1737081967387763e-05, "loss": 2.6362, "step": 35449 }, { "epoch": 0.95, "learning_rate": 1.1723789379368355e-05, "loss": 2.4607, "step": 35450 }, { "epoch": 0.95, "learning_rate": 1.1710504278352851e-05, "loss": 2.4552, "step": 35451 }, { "epoch": 0.95, "learning_rate": 1.1697226664441841e-05, "loss": 2.7034, "step": 35452 }, { "epoch": 0.95, "learning_rate": 1.1683956537735907e-05, "loss": 2.263, "step": 35453 }, { "epoch": 0.95, "learning_rate": 1.1670693898335638e-05, "loss": 2.6098, "step": 35454 }, { "epoch": 0.95, "learning_rate": 1.165743874634151e-05, "loss": 2.0761, "step": 35455 }, { "epoch": 0.95, "learning_rate": 1.1644191081853994e-05, "loss": 2.3191, "step": 35456 }, { "epoch": 0.95, "learning_rate": 1.1630950904973236e-05, "loss": 2.4377, "step": 35457 }, { "epoch": 0.95, "learning_rate": 1.1617718215799822e-05, "loss": 2.5211, "step": 35458 }, { "epoch": 0.95, "learning_rate": 1.1604493014433782e-05, "loss": 2.2819, "step": 35459 }, { "epoch": 0.95, "learning_rate": 1.1591275300975479e-05, "loss": 2.3104, "step": 35460 }, { "epoch": 0.95, "learning_rate": 1.1578065075524947e-05, "loss": 2.501, "step": 35461 }, { "epoch": 0.95, "learning_rate": 1.1564862338182213e-05, "loss": 2.4379, "step": 35462 }, { "epoch": 0.95, "learning_rate": 1.1551667089047425e-05, "loss": 2.6873, "step": 35463 }, { "epoch": 0.95, "learning_rate": 1.1538479328220497e-05, "loss": 2.6411, "step": 35464 }, { "epoch": 0.95, "learning_rate": 1.1525299055801353e-05, "loss": 2.2831, "step": 35465 }, { "epoch": 0.95, "learning_rate": 1.1512126271889689e-05, "loss": 2.4238, "step": 35466 }, { "epoch": 0.95, "learning_rate": 1.1498960976585537e-05, "loss": 1.9028, "step": 35467 }, { "epoch": 0.95, "learning_rate": 1.1485803169988485e-05, "loss": 2.6098, "step": 35468 }, { "epoch": 0.95, "learning_rate": 1.147265285219834e-05, "loss": 2.4647, "step": 35469 }, { "epoch": 0.95, "learning_rate": 1.1459510023314578e-05, "loss": 2.499, "step": 35470 }, { "epoch": 0.95, "learning_rate": 1.1446374683436789e-05, "loss": 2.5226, "step": 35471 }, { "epoch": 0.95, "learning_rate": 1.1433246832664556e-05, "loss": 2.0786, "step": 35472 }, { "epoch": 0.95, "learning_rate": 1.1420126471097359e-05, "loss": 2.2274, "step": 35473 }, { "epoch": 0.95, "learning_rate": 1.1407013598834448e-05, "loss": 2.3075, "step": 35474 }, { "epoch": 0.95, "learning_rate": 1.1393908215975412e-05, "loss": 2.2156, "step": 35475 }, { "epoch": 0.95, "learning_rate": 1.1380810322619283e-05, "loss": 2.3546, "step": 35476 }, { "epoch": 0.95, "learning_rate": 1.1367719918865427e-05, "loss": 2.4053, "step": 35477 }, { "epoch": 0.95, "learning_rate": 1.1354637004812984e-05, "loss": 2.4959, "step": 35478 }, { "epoch": 0.95, "learning_rate": 1.1341561580560878e-05, "loss": 2.5136, "step": 35479 }, { "epoch": 0.95, "learning_rate": 1.1328493646208582e-05, "loss": 2.9311, "step": 35480 }, { "epoch": 0.95, "learning_rate": 1.1315433201854686e-05, "loss": 2.6428, "step": 35481 }, { "epoch": 0.95, "learning_rate": 1.1302380247598443e-05, "loss": 2.7564, "step": 35482 }, { "epoch": 0.95, "learning_rate": 1.1289334783538551e-05, "loss": 2.1452, "step": 35483 }, { "epoch": 0.95, "learning_rate": 1.1276296809773935e-05, "loss": 2.6316, "step": 35484 }, { "epoch": 0.95, "learning_rate": 1.1263266326403177e-05, "loss": 2.7728, "step": 35485 }, { "epoch": 0.95, "learning_rate": 1.1250243333525312e-05, "loss": 2.1932, "step": 35486 }, { "epoch": 0.95, "learning_rate": 1.1237227831238705e-05, "loss": 2.6922, "step": 35487 }, { "epoch": 0.95, "learning_rate": 1.1224219819642167e-05, "loss": 2.9092, "step": 35488 }, { "epoch": 0.95, "learning_rate": 1.1211219298834175e-05, "loss": 2.653, "step": 35489 }, { "epoch": 0.95, "learning_rate": 1.1198226268913203e-05, "loss": 2.5189, "step": 35490 }, { "epoch": 0.95, "learning_rate": 1.1185240729977619e-05, "loss": 2.1198, "step": 35491 }, { "epoch": 0.95, "learning_rate": 1.11722626821259e-05, "loss": 2.6742, "step": 35492 }, { "epoch": 0.95, "learning_rate": 1.1159292125456411e-05, "loss": 2.2404, "step": 35493 }, { "epoch": 0.95, "learning_rate": 1.1146329060067184e-05, "loss": 2.8524, "step": 35494 }, { "epoch": 0.95, "learning_rate": 1.1133373486056698e-05, "loss": 2.0825, "step": 35495 }, { "epoch": 0.95, "learning_rate": 1.1120425403522982e-05, "loss": 2.2548, "step": 35496 }, { "epoch": 0.95, "learning_rate": 1.1107484812564073e-05, "loss": 2.9168, "step": 35497 }, { "epoch": 0.95, "learning_rate": 1.1094551713278112e-05, "loss": 2.6032, "step": 35498 }, { "epoch": 0.95, "learning_rate": 1.1081626105762909e-05, "loss": 2.1874, "step": 35499 }, { "epoch": 0.95, "learning_rate": 1.1068707990116611e-05, "loss": 2.7771, "step": 35500 }, { "epoch": 0.95, "learning_rate": 1.1055797366436916e-05, "loss": 2.781, "step": 35501 }, { "epoch": 0.95, "learning_rate": 1.1042894234821854e-05, "loss": 2.2613, "step": 35502 }, { "epoch": 0.95, "learning_rate": 1.1029998595368795e-05, "loss": 2.321, "step": 35503 }, { "epoch": 0.95, "learning_rate": 1.1017110448175882e-05, "loss": 2.1687, "step": 35504 }, { "epoch": 0.95, "learning_rate": 1.1004229793340259e-05, "loss": 2.2435, "step": 35505 }, { "epoch": 0.95, "learning_rate": 1.099135663095996e-05, "loss": 2.6489, "step": 35506 }, { "epoch": 0.95, "learning_rate": 1.0978490961132349e-05, "loss": 2.301, "step": 35507 }, { "epoch": 0.95, "learning_rate": 1.0965632783954793e-05, "loss": 2.3011, "step": 35508 }, { "epoch": 0.95, "learning_rate": 1.0952782099524772e-05, "loss": 2.5263, "step": 35509 }, { "epoch": 0.95, "learning_rate": 1.093993890793965e-05, "loss": 2.2175, "step": 35510 }, { "epoch": 0.95, "learning_rate": 1.0927103209296795e-05, "loss": 2.2609, "step": 35511 }, { "epoch": 0.95, "learning_rate": 1.0914275003693241e-05, "loss": 2.2744, "step": 35512 }, { "epoch": 0.95, "learning_rate": 1.0901454291226464e-05, "loss": 2.0698, "step": 35513 }, { "epoch": 0.95, "learning_rate": 1.0888641071993277e-05, "loss": 2.4223, "step": 35514 }, { "epoch": 0.95, "learning_rate": 1.0875835346091046e-05, "loss": 2.7304, "step": 35515 }, { "epoch": 0.95, "learning_rate": 1.086303711361658e-05, "loss": 2.6903, "step": 35516 }, { "epoch": 0.95, "learning_rate": 1.0850246374666917e-05, "loss": 2.3904, "step": 35517 }, { "epoch": 0.95, "learning_rate": 1.0837463129338976e-05, "loss": 2.7817, "step": 35518 }, { "epoch": 0.95, "learning_rate": 1.0824687377729458e-05, "loss": 2.5656, "step": 35519 }, { "epoch": 0.95, "learning_rate": 1.0811919119935399e-05, "loss": 1.9269, "step": 35520 }, { "epoch": 0.95, "learning_rate": 1.0799158356053384e-05, "loss": 2.348, "step": 35521 }, { "epoch": 0.95, "learning_rate": 1.0786405086180006e-05, "loss": 2.9239, "step": 35522 }, { "epoch": 0.95, "learning_rate": 1.0773659310412075e-05, "loss": 2.5733, "step": 35523 }, { "epoch": 0.95, "learning_rate": 1.076092102884596e-05, "loss": 2.3865, "step": 35524 }, { "epoch": 0.95, "learning_rate": 1.0748190241578248e-05, "loss": 2.8907, "step": 35525 }, { "epoch": 0.95, "learning_rate": 1.0735466948705308e-05, "loss": 2.518, "step": 35526 }, { "epoch": 0.95, "learning_rate": 1.072275115032373e-05, "loss": 2.557, "step": 35527 }, { "epoch": 0.95, "learning_rate": 1.0710042846529766e-05, "loss": 2.3778, "step": 35528 }, { "epoch": 0.95, "learning_rate": 1.0697342037419566e-05, "loss": 2.5736, "step": 35529 }, { "epoch": 0.95, "learning_rate": 1.0684648723089385e-05, "loss": 2.6816, "step": 35530 }, { "epoch": 0.95, "learning_rate": 1.067196290363548e-05, "loss": 2.1822, "step": 35531 }, { "epoch": 0.95, "learning_rate": 1.0659284579153883e-05, "loss": 2.5712, "step": 35532 }, { "epoch": 0.95, "learning_rate": 1.064661374974063e-05, "loss": 2.4501, "step": 35533 }, { "epoch": 0.95, "learning_rate": 1.0633950415491867e-05, "loss": 2.5482, "step": 35534 }, { "epoch": 0.95, "learning_rate": 1.0621294576503404e-05, "loss": 2.5658, "step": 35535 }, { "epoch": 0.95, "learning_rate": 1.0608646232871166e-05, "loss": 2.475, "step": 35536 }, { "epoch": 0.96, "learning_rate": 1.0596005384690855e-05, "loss": 2.5228, "step": 35537 }, { "epoch": 0.96, "learning_rate": 1.058337203205828e-05, "loss": 2.1462, "step": 35538 }, { "epoch": 0.96, "learning_rate": 1.0570746175069257e-05, "loss": 2.3741, "step": 35539 }, { "epoch": 0.96, "learning_rate": 1.0558127813819263e-05, "loss": 2.5867, "step": 35540 }, { "epoch": 0.96, "learning_rate": 1.054551694840411e-05, "loss": 2.4795, "step": 35541 }, { "epoch": 0.96, "learning_rate": 1.0532913578919278e-05, "loss": 2.184, "step": 35542 }, { "epoch": 0.96, "learning_rate": 1.0520317705460024e-05, "loss": 2.9059, "step": 35543 }, { "epoch": 0.96, "learning_rate": 1.0507729328122051e-05, "loss": 2.073, "step": 35544 }, { "epoch": 0.96, "learning_rate": 1.0495148447000503e-05, "loss": 2.2232, "step": 35545 }, { "epoch": 0.96, "learning_rate": 1.0482575062190968e-05, "loss": 2.4799, "step": 35546 }, { "epoch": 0.96, "learning_rate": 1.0470009173788487e-05, "loss": 2.7082, "step": 35547 }, { "epoch": 0.96, "learning_rate": 1.04574507818882e-05, "loss": 2.8452, "step": 35548 }, { "epoch": 0.96, "learning_rate": 1.0444899886585479e-05, "loss": 2.5065, "step": 35549 }, { "epoch": 0.96, "learning_rate": 1.0432356487975247e-05, "loss": 2.7233, "step": 35550 }, { "epoch": 0.96, "learning_rate": 1.0419820586152428e-05, "loss": 2.1519, "step": 35551 }, { "epoch": 0.96, "learning_rate": 1.040729218121228e-05, "loss": 2.1315, "step": 35552 }, { "epoch": 0.96, "learning_rate": 1.0394771273249615e-05, "loss": 2.763, "step": 35553 }, { "epoch": 0.96, "learning_rate": 1.0382257862359134e-05, "loss": 2.6268, "step": 35554 }, { "epoch": 0.96, "learning_rate": 1.0369751948635763e-05, "loss": 2.6277, "step": 35555 }, { "epoch": 0.96, "learning_rate": 1.0357253532174204e-05, "loss": 2.2061, "step": 35556 }, { "epoch": 0.96, "learning_rate": 1.0344762613069158e-05, "loss": 2.9055, "step": 35557 }, { "epoch": 0.96, "learning_rate": 1.0332279191415218e-05, "loss": 2.4781, "step": 35558 }, { "epoch": 0.96, "learning_rate": 1.0319803267307082e-05, "loss": 2.7352, "step": 35559 }, { "epoch": 0.96, "learning_rate": 1.0307334840839122e-05, "loss": 2.0068, "step": 35560 }, { "epoch": 0.96, "learning_rate": 1.0294873912105928e-05, "loss": 2.2212, "step": 35561 }, { "epoch": 0.96, "learning_rate": 1.028242048120176e-05, "loss": 2.138, "step": 35562 }, { "epoch": 0.96, "learning_rate": 1.0269974548221095e-05, "loss": 2.405, "step": 35563 }, { "epoch": 0.96, "learning_rate": 1.0257536113257971e-05, "loss": 2.1945, "step": 35564 }, { "epoch": 0.96, "learning_rate": 1.0245105176406976e-05, "loss": 2.7299, "step": 35565 }, { "epoch": 0.96, "learning_rate": 1.023268173776215e-05, "loss": 2.4679, "step": 35566 }, { "epoch": 0.96, "learning_rate": 1.0220265797417417e-05, "loss": 2.1422, "step": 35567 }, { "epoch": 0.96, "learning_rate": 1.0207857355467143e-05, "loss": 2.2355, "step": 35568 }, { "epoch": 0.96, "learning_rate": 1.0195456412005144e-05, "loss": 2.4749, "step": 35569 }, { "epoch": 0.96, "learning_rate": 1.0183062967125345e-05, "loss": 2.7664, "step": 35570 }, { "epoch": 0.96, "learning_rate": 1.0170677020921671e-05, "loss": 2.3094, "step": 35571 }, { "epoch": 0.96, "learning_rate": 1.0158298573488045e-05, "loss": 2.5976, "step": 35572 }, { "epoch": 0.96, "learning_rate": 1.0145927624918172e-05, "loss": 2.6678, "step": 35573 }, { "epoch": 0.96, "learning_rate": 1.0133564175305864e-05, "loss": 2.3883, "step": 35574 }, { "epoch": 0.96, "learning_rate": 1.0121208224744605e-05, "loss": 2.9132, "step": 35575 }, { "epoch": 0.96, "learning_rate": 1.0108859773328094e-05, "loss": 2.2573, "step": 35576 }, { "epoch": 0.96, "learning_rate": 1.0096518821149924e-05, "loss": 2.4396, "step": 35577 }, { "epoch": 0.96, "learning_rate": 1.0084185368303468e-05, "loss": 2.1568, "step": 35578 }, { "epoch": 0.96, "learning_rate": 1.0071859414882311e-05, "loss": 2.2964, "step": 35579 }, { "epoch": 0.96, "learning_rate": 1.005954096097983e-05, "loss": 2.5996, "step": 35580 }, { "epoch": 0.96, "learning_rate": 1.0047230006689278e-05, "loss": 2.205, "step": 35581 }, { "epoch": 0.96, "learning_rate": 1.0034926552103917e-05, "loss": 2.4185, "step": 35582 }, { "epoch": 0.96, "learning_rate": 1.0022630597316896e-05, "loss": 2.0558, "step": 35583 }, { "epoch": 0.96, "learning_rate": 1.0010342142421358e-05, "loss": 1.9926, "step": 35584 }, { "epoch": 0.96, "learning_rate": 9.998061187510565e-06, "loss": 2.5565, "step": 35585 }, { "epoch": 0.96, "learning_rate": 9.985787732677443e-06, "loss": 2.4522, "step": 35586 }, { "epoch": 0.96, "learning_rate": 9.973521778015027e-06, "loss": 2.3378, "step": 35587 }, { "epoch": 0.96, "learning_rate": 9.961263323616243e-06, "loss": 2.2598, "step": 35588 }, { "epoch": 0.96, "learning_rate": 9.949012369573906e-06, "loss": 2.4116, "step": 35589 }, { "epoch": 0.96, "learning_rate": 9.936768915980831e-06, "loss": 2.3966, "step": 35590 }, { "epoch": 0.96, "learning_rate": 9.924532962929722e-06, "loss": 2.5951, "step": 35591 }, { "epoch": 0.96, "learning_rate": 9.912304510513392e-06, "loss": 2.3118, "step": 35592 }, { "epoch": 0.96, "learning_rate": 9.900083558824436e-06, "loss": 2.4363, "step": 35593 }, { "epoch": 0.96, "learning_rate": 9.887870107955444e-06, "loss": 2.4789, "step": 35594 }, { "epoch": 0.96, "learning_rate": 9.875664157998898e-06, "loss": 2.4998, "step": 35595 }, { "epoch": 0.96, "learning_rate": 9.863465709047393e-06, "loss": 2.7242, "step": 35596 }, { "epoch": 0.96, "learning_rate": 9.851274761193186e-06, "loss": 2.4386, "step": 35597 }, { "epoch": 0.96, "learning_rate": 9.839091314528759e-06, "loss": 2.2717, "step": 35598 }, { "epoch": 0.96, "learning_rate": 9.82691536914626e-06, "loss": 2.4072, "step": 35599 }, { "epoch": 0.96, "learning_rate": 9.814746925138062e-06, "loss": 2.5031, "step": 35600 }, { "epoch": 0.96, "learning_rate": 9.802585982596312e-06, "loss": 2.3032, "step": 35601 }, { "epoch": 0.96, "learning_rate": 9.79043254161316e-06, "loss": 2.4792, "step": 35602 }, { "epoch": 0.96, "learning_rate": 9.77828660228064e-06, "loss": 2.8225, "step": 35603 }, { "epoch": 0.96, "learning_rate": 9.766148164690792e-06, "loss": 2.3716, "step": 35604 }, { "epoch": 0.96, "learning_rate": 9.754017228935541e-06, "loss": 2.6032, "step": 35605 }, { "epoch": 0.96, "learning_rate": 9.741893795106815e-06, "loss": 2.6011, "step": 35606 }, { "epoch": 0.96, "learning_rate": 9.72977786329654e-06, "loss": 2.8, "step": 35607 }, { "epoch": 0.96, "learning_rate": 9.71766943359631e-06, "loss": 2.3728, "step": 35608 }, { "epoch": 0.96, "learning_rate": 9.70556850609805e-06, "loss": 2.4399, "step": 35609 }, { "epoch": 0.96, "learning_rate": 9.693475080893355e-06, "loss": 2.4116, "step": 35610 }, { "epoch": 0.96, "learning_rate": 9.681389158073705e-06, "loss": 1.9832, "step": 35611 }, { "epoch": 0.96, "learning_rate": 9.66931073773103e-06, "loss": 2.1989, "step": 35612 }, { "epoch": 0.96, "learning_rate": 9.657239819956477e-06, "loss": 2.9499, "step": 35613 }, { "epoch": 0.96, "learning_rate": 9.645176404841526e-06, "loss": 2.8162, "step": 35614 }, { "epoch": 0.96, "learning_rate": 9.633120492477887e-06, "loss": 2.3185, "step": 35615 }, { "epoch": 0.96, "learning_rate": 9.621072082956484e-06, "loss": 2.8415, "step": 35616 }, { "epoch": 0.96, "learning_rate": 9.6090311763688e-06, "loss": 2.389, "step": 35617 }, { "epoch": 0.96, "learning_rate": 9.596997772806093e-06, "loss": 2.787, "step": 35618 }, { "epoch": 0.96, "learning_rate": 9.584971872359405e-06, "loss": 2.5751, "step": 35619 }, { "epoch": 0.96, "learning_rate": 9.572953475119994e-06, "loss": 2.3662, "step": 35620 }, { "epoch": 0.96, "learning_rate": 9.560942581178677e-06, "loss": 2.1047, "step": 35621 }, { "epoch": 0.96, "learning_rate": 9.548939190626604e-06, "loss": 2.3911, "step": 35622 }, { "epoch": 0.96, "learning_rate": 9.536943303554812e-06, "loss": 2.3617, "step": 35623 }, { "epoch": 0.96, "learning_rate": 9.524954920053896e-06, "loss": 2.2458, "step": 35624 }, { "epoch": 0.96, "learning_rate": 9.512974040215006e-06, "loss": 2.5614, "step": 35625 }, { "epoch": 0.96, "learning_rate": 9.501000664128735e-06, "loss": 2.5082, "step": 35626 }, { "epoch": 0.96, "learning_rate": 9.489034791885676e-06, "loss": 2.7942, "step": 35627 }, { "epoch": 0.96, "learning_rate": 9.477076423576757e-06, "loss": 2.5594, "step": 35628 }, { "epoch": 0.96, "learning_rate": 9.465125559292242e-06, "loss": 2.4309, "step": 35629 }, { "epoch": 0.96, "learning_rate": 9.453182199122945e-06, "loss": 2.5337, "step": 35630 }, { "epoch": 0.96, "learning_rate": 9.441246343159238e-06, "loss": 2.2467, "step": 35631 }, { "epoch": 0.96, "learning_rate": 9.429317991491494e-06, "loss": 2.4544, "step": 35632 }, { "epoch": 0.96, "learning_rate": 9.417397144210194e-06, "loss": 2.1237, "step": 35633 }, { "epoch": 0.96, "learning_rate": 9.405483801405602e-06, "loss": 2.4436, "step": 35634 }, { "epoch": 0.96, "learning_rate": 9.393577963167976e-06, "loss": 2.29, "step": 35635 }, { "epoch": 0.96, "learning_rate": 9.38167962958747e-06, "loss": 2.6863, "step": 35636 }, { "epoch": 0.96, "learning_rate": 9.369788800754232e-06, "loss": 2.0297, "step": 35637 }, { "epoch": 0.96, "learning_rate": 9.3579054767583e-06, "loss": 2.2728, "step": 35638 }, { "epoch": 0.96, "learning_rate": 9.346029657689936e-06, "loss": 2.9466, "step": 35639 }, { "epoch": 0.96, "learning_rate": 9.334161343638847e-06, "loss": 2.5722, "step": 35640 }, { "epoch": 0.96, "learning_rate": 9.322300534695071e-06, "loss": 2.6706, "step": 35641 }, { "epoch": 0.96, "learning_rate": 9.310447230948427e-06, "loss": 2.4242, "step": 35642 }, { "epoch": 0.96, "learning_rate": 9.29860143248873e-06, "loss": 2.2637, "step": 35643 }, { "epoch": 0.96, "learning_rate": 9.286763139405575e-06, "loss": 2.5221, "step": 35644 }, { "epoch": 0.96, "learning_rate": 9.27493235178889e-06, "loss": 3.0305, "step": 35645 }, { "epoch": 0.96, "learning_rate": 9.26310906972816e-06, "loss": 2.8072, "step": 35646 }, { "epoch": 0.96, "learning_rate": 9.25129329331309e-06, "loss": 1.8948, "step": 35647 }, { "epoch": 0.96, "learning_rate": 9.239485022633053e-06, "loss": 2.9876, "step": 35648 }, { "epoch": 0.96, "learning_rate": 9.227684257777424e-06, "loss": 2.5069, "step": 35649 }, { "epoch": 0.96, "learning_rate": 9.215890998835797e-06, "loss": 2.6317, "step": 35650 }, { "epoch": 0.96, "learning_rate": 9.204105245897431e-06, "loss": 2.6921, "step": 35651 }, { "epoch": 0.96, "learning_rate": 9.192326999051703e-06, "loss": 2.8851, "step": 35652 }, { "epoch": 0.96, "learning_rate": 9.180556258387763e-06, "loss": 2.494, "step": 35653 }, { "epoch": 0.96, "learning_rate": 9.168793023994648e-06, "loss": 2.3608, "step": 35654 }, { "epoch": 0.96, "learning_rate": 9.157037295961735e-06, "loss": 2.5629, "step": 35655 }, { "epoch": 0.96, "learning_rate": 9.14528907437795e-06, "loss": 2.4846, "step": 35656 }, { "epoch": 0.96, "learning_rate": 9.133548359332223e-06, "loss": 2.1259, "step": 35657 }, { "epoch": 0.96, "learning_rate": 9.121815150913704e-06, "loss": 2.493, "step": 35658 }, { "epoch": 0.96, "learning_rate": 9.1100894492111e-06, "loss": 2.5921, "step": 35659 }, { "epoch": 0.96, "learning_rate": 9.098371254313343e-06, "loss": 2.7382, "step": 35660 }, { "epoch": 0.96, "learning_rate": 9.086660566309135e-06, "loss": 2.6283, "step": 35661 }, { "epoch": 0.96, "learning_rate": 9.074957385287186e-06, "loss": 2.6474, "step": 35662 }, { "epoch": 0.96, "learning_rate": 9.0632617113362e-06, "loss": 2.5951, "step": 35663 }, { "epoch": 0.96, "learning_rate": 9.051573544544777e-06, "loss": 2.2713, "step": 35664 }, { "epoch": 0.96, "learning_rate": 9.03989288500151e-06, "loss": 2.2484, "step": 35665 }, { "epoch": 0.96, "learning_rate": 9.028219732794884e-06, "loss": 2.3084, "step": 35666 }, { "epoch": 0.96, "learning_rate": 9.016554088013273e-06, "loss": 2.5004, "step": 35667 }, { "epoch": 0.96, "learning_rate": 9.004895950745051e-06, "loss": 2.4015, "step": 35668 }, { "epoch": 0.96, "learning_rate": 8.993245321078591e-06, "loss": 2.3876, "step": 35669 }, { "epoch": 0.96, "learning_rate": 8.981602199102156e-06, "loss": 2.3958, "step": 35670 }, { "epoch": 0.96, "learning_rate": 8.969966584903788e-06, "loss": 2.4661, "step": 35671 }, { "epoch": 0.96, "learning_rate": 8.95833847857186e-06, "loss": 2.0362, "step": 35672 }, { "epoch": 0.96, "learning_rate": 8.946717880194411e-06, "loss": 2.3696, "step": 35673 }, { "epoch": 0.96, "learning_rate": 8.935104789859483e-06, "loss": 2.3046, "step": 35674 }, { "epoch": 0.96, "learning_rate": 8.923499207654895e-06, "loss": 2.8099, "step": 35675 }, { "epoch": 0.96, "learning_rate": 8.911901133668799e-06, "loss": 2.6235, "step": 35676 }, { "epoch": 0.96, "learning_rate": 8.900310567988789e-06, "loss": 2.5664, "step": 35677 }, { "epoch": 0.96, "learning_rate": 8.88872751070302e-06, "loss": 2.5068, "step": 35678 }, { "epoch": 0.96, "learning_rate": 8.877151961898976e-06, "loss": 2.3868, "step": 35679 }, { "epoch": 0.96, "learning_rate": 8.865583921664477e-06, "loss": 2.4145, "step": 35680 }, { "epoch": 0.96, "learning_rate": 8.854023390087007e-06, "loss": 2.5581, "step": 35681 }, { "epoch": 0.96, "learning_rate": 8.842470367254385e-06, "loss": 2.2411, "step": 35682 }, { "epoch": 0.96, "learning_rate": 8.830924853253875e-06, "loss": 2.6761, "step": 35683 }, { "epoch": 0.96, "learning_rate": 8.819386848173183e-06, "loss": 2.2887, "step": 35684 }, { "epoch": 0.96, "learning_rate": 8.807856352099576e-06, "loss": 2.519, "step": 35685 }, { "epoch": 0.96, "learning_rate": 8.796333365120424e-06, "loss": 2.451, "step": 35686 }, { "epoch": 0.96, "learning_rate": 8.784817887323104e-06, "loss": 2.7588, "step": 35687 }, { "epoch": 0.96, "learning_rate": 8.773309918794658e-06, "loss": 2.3367, "step": 35688 }, { "epoch": 0.96, "learning_rate": 8.76180945962246e-06, "loss": 2.4278, "step": 35689 }, { "epoch": 0.96, "learning_rate": 8.750316509893663e-06, "loss": 2.9529, "step": 35690 }, { "epoch": 0.96, "learning_rate": 8.738831069695085e-06, "loss": 2.3864, "step": 35691 }, { "epoch": 0.96, "learning_rate": 8.727353139113991e-06, "loss": 2.3759, "step": 35692 }, { "epoch": 0.96, "learning_rate": 8.715882718237312e-06, "loss": 2.1007, "step": 35693 }, { "epoch": 0.96, "learning_rate": 8.704419807151864e-06, "loss": 1.8716, "step": 35694 }, { "epoch": 0.96, "learning_rate": 8.69296440594447e-06, "loss": 2.3746, "step": 35695 }, { "epoch": 0.96, "learning_rate": 8.681516514701947e-06, "loss": 2.283, "step": 35696 }, { "epoch": 0.96, "learning_rate": 8.670076133510896e-06, "loss": 2.7299, "step": 35697 }, { "epoch": 0.96, "learning_rate": 8.658643262458354e-06, "loss": 2.0683, "step": 35698 }, { "epoch": 0.96, "learning_rate": 8.647217901630478e-06, "loss": 2.4087, "step": 35699 }, { "epoch": 0.96, "learning_rate": 8.635800051114196e-06, "loss": 2.4516, "step": 35700 }, { "epoch": 0.96, "learning_rate": 8.624389710995883e-06, "loss": 2.2007, "step": 35701 }, { "epoch": 0.96, "learning_rate": 8.612986881361806e-06, "loss": 2.1254, "step": 35702 }, { "epoch": 0.96, "learning_rate": 8.601591562298561e-06, "loss": 2.4966, "step": 35703 }, { "epoch": 0.96, "learning_rate": 8.590203753892411e-06, "loss": 2.796, "step": 35704 }, { "epoch": 0.96, "learning_rate": 8.578823456229622e-06, "loss": 2.364, "step": 35705 }, { "epoch": 0.96, "learning_rate": 8.567450669396459e-06, "loss": 1.8681, "step": 35706 }, { "epoch": 0.96, "learning_rate": 8.556085393478962e-06, "loss": 2.4004, "step": 35707 }, { "epoch": 0.96, "learning_rate": 8.544727628563398e-06, "loss": 2.4765, "step": 35708 }, { "epoch": 0.96, "learning_rate": 8.533377374735584e-06, "loss": 2.8435, "step": 35709 }, { "epoch": 0.96, "learning_rate": 8.522034632081788e-06, "loss": 2.4854, "step": 35710 }, { "epoch": 0.96, "learning_rate": 8.510699400687716e-06, "loss": 2.8383, "step": 35711 }, { "epoch": 0.96, "learning_rate": 8.49937168063941e-06, "loss": 2.5397, "step": 35712 }, { "epoch": 0.96, "learning_rate": 8.488051472022473e-06, "loss": 2.5027, "step": 35713 }, { "epoch": 0.96, "learning_rate": 8.476738774922942e-06, "loss": 2.3864, "step": 35714 }, { "epoch": 0.96, "learning_rate": 8.465433589426308e-06, "loss": 2.6948, "step": 35715 }, { "epoch": 0.96, "learning_rate": 8.454135915618277e-06, "loss": 2.5191, "step": 35716 }, { "epoch": 0.96, "learning_rate": 8.442845753584339e-06, "loss": 2.1212, "step": 35717 }, { "epoch": 0.96, "learning_rate": 8.4315631034102e-06, "loss": 2.359, "step": 35718 }, { "epoch": 0.96, "learning_rate": 8.42028796518135e-06, "loss": 2.8856, "step": 35719 }, { "epoch": 0.96, "learning_rate": 8.409020338983053e-06, "loss": 2.3233, "step": 35720 }, { "epoch": 0.96, "learning_rate": 8.397760224900685e-06, "loss": 2.6135, "step": 35721 }, { "epoch": 0.96, "learning_rate": 8.386507623019624e-06, "loss": 2.3528, "step": 35722 }, { "epoch": 0.96, "learning_rate": 8.375262533425131e-06, "loss": 2.7387, "step": 35723 }, { "epoch": 0.96, "learning_rate": 8.364024956202366e-06, "loss": 2.5739, "step": 35724 }, { "epoch": 0.96, "learning_rate": 8.352794891436477e-06, "loss": 2.6652, "step": 35725 }, { "epoch": 0.96, "learning_rate": 8.341572339212511e-06, "loss": 2.5962, "step": 35726 }, { "epoch": 0.96, "learning_rate": 8.33035729961551e-06, "loss": 2.3794, "step": 35727 }, { "epoch": 0.96, "learning_rate": 8.319149772730406e-06, "loss": 2.428, "step": 35728 }, { "epoch": 0.96, "learning_rate": 8.30794975864213e-06, "loss": 2.6702, "step": 35729 }, { "epoch": 0.96, "learning_rate": 8.296757257435506e-06, "loss": 2.5568, "step": 35730 }, { "epoch": 0.96, "learning_rate": 8.285572269195352e-06, "loss": 2.1956, "step": 35731 }, { "epoch": 0.96, "learning_rate": 8.27439479400649e-06, "loss": 2.4443, "step": 35732 }, { "epoch": 0.96, "learning_rate": 8.26322483195341e-06, "loss": 2.5774, "step": 35733 }, { "epoch": 0.96, "learning_rate": 8.252062383120928e-06, "loss": 2.3725, "step": 35734 }, { "epoch": 0.96, "learning_rate": 8.240907447593426e-06, "loss": 2.3073, "step": 35735 }, { "epoch": 0.96, "learning_rate": 8.229760025455501e-06, "loss": 2.4093, "step": 35736 }, { "epoch": 0.96, "learning_rate": 8.218620116791531e-06, "loss": 2.6972, "step": 35737 }, { "epoch": 0.96, "learning_rate": 8.207487721686113e-06, "loss": 2.2099, "step": 35738 }, { "epoch": 0.96, "learning_rate": 8.196362840223403e-06, "loss": 2.737, "step": 35739 }, { "epoch": 0.96, "learning_rate": 8.185245472487779e-06, "loss": 2.4344, "step": 35740 }, { "epoch": 0.96, "learning_rate": 8.174135618563393e-06, "loss": 2.3259, "step": 35741 }, { "epoch": 0.96, "learning_rate": 8.163033278534404e-06, "loss": 2.6857, "step": 35742 }, { "epoch": 0.96, "learning_rate": 8.151938452484964e-06, "loss": 2.3936, "step": 35743 }, { "epoch": 0.96, "learning_rate": 8.140851140499116e-06, "loss": 2.5208, "step": 35744 }, { "epoch": 0.96, "learning_rate": 8.129771342660796e-06, "loss": 2.4982, "step": 35745 }, { "epoch": 0.96, "learning_rate": 8.118699059054158e-06, "loss": 2.4185, "step": 35746 }, { "epoch": 0.96, "learning_rate": 8.1076342897628e-06, "loss": 2.3871, "step": 35747 }, { "epoch": 0.96, "learning_rate": 8.096577034870656e-06, "loss": 2.359, "step": 35748 }, { "epoch": 0.96, "learning_rate": 8.085527294461547e-06, "loss": 2.4332, "step": 35749 }, { "epoch": 0.96, "learning_rate": 8.074485068619075e-06, "loss": 2.3701, "step": 35750 }, { "epoch": 0.96, "learning_rate": 8.06345035742706e-06, "loss": 2.8126, "step": 35751 }, { "epoch": 0.96, "learning_rate": 8.052423160968992e-06, "loss": 2.4666, "step": 35752 }, { "epoch": 0.96, "learning_rate": 8.041403479328358e-06, "loss": 2.7784, "step": 35753 }, { "epoch": 0.96, "learning_rate": 8.03039131258887e-06, "loss": 2.4222, "step": 35754 }, { "epoch": 0.96, "learning_rate": 8.019386660833572e-06, "loss": 2.2681, "step": 35755 }, { "epoch": 0.96, "learning_rate": 8.008389524146064e-06, "loss": 2.3769, "step": 35756 }, { "epoch": 0.96, "learning_rate": 7.997399902609836e-06, "loss": 2.7098, "step": 35757 }, { "epoch": 0.96, "learning_rate": 7.98641779630782e-06, "loss": 2.3332, "step": 35758 }, { "epoch": 0.96, "learning_rate": 7.975443205323396e-06, "loss": 2.3689, "step": 35759 }, { "epoch": 0.96, "learning_rate": 7.964476129739607e-06, "loss": 2.329, "step": 35760 }, { "epoch": 0.96, "learning_rate": 7.953516569639608e-06, "loss": 2.5708, "step": 35761 }, { "epoch": 0.96, "learning_rate": 7.942564525106443e-06, "loss": 2.4387, "step": 35762 }, { "epoch": 0.96, "learning_rate": 7.931619996222938e-06, "loss": 2.5966, "step": 35763 }, { "epoch": 0.96, "learning_rate": 7.920682983072247e-06, "loss": 2.6335, "step": 35764 }, { "epoch": 0.96, "learning_rate": 7.909753485737081e-06, "loss": 2.5721, "step": 35765 }, { "epoch": 0.96, "learning_rate": 7.898831504300152e-06, "loss": 2.478, "step": 35766 }, { "epoch": 0.96, "learning_rate": 7.887917038844395e-06, "loss": 2.4769, "step": 35767 }, { "epoch": 0.96, "learning_rate": 7.877010089452409e-06, "loss": 2.6874, "step": 35768 }, { "epoch": 0.96, "learning_rate": 7.866110656206682e-06, "loss": 2.3242, "step": 35769 }, { "epoch": 0.96, "learning_rate": 7.85521873919004e-06, "loss": 2.7657, "step": 35770 }, { "epoch": 0.96, "learning_rate": 7.84433433848497e-06, "loss": 2.3441, "step": 35771 }, { "epoch": 0.96, "learning_rate": 7.833457454173743e-06, "loss": 2.4424, "step": 35772 }, { "epoch": 0.96, "learning_rate": 7.822588086338845e-06, "loss": 2.3995, "step": 35773 }, { "epoch": 0.96, "learning_rate": 7.811726235062656e-06, "loss": 2.1452, "step": 35774 }, { "epoch": 0.96, "learning_rate": 7.800871900427442e-06, "loss": 2.8891, "step": 35775 }, { "epoch": 0.96, "learning_rate": 7.790025082515361e-06, "loss": 2.3871, "step": 35776 }, { "epoch": 0.96, "learning_rate": 7.779185781408792e-06, "loss": 2.79, "step": 35777 }, { "epoch": 0.96, "learning_rate": 7.768353997189559e-06, "loss": 2.2975, "step": 35778 }, { "epoch": 0.96, "learning_rate": 7.757529729940038e-06, "loss": 2.2159, "step": 35779 }, { "epoch": 0.96, "learning_rate": 7.746712979742054e-06, "loss": 2.4091, "step": 35780 }, { "epoch": 0.96, "learning_rate": 7.735903746677542e-06, "loss": 2.2322, "step": 35781 }, { "epoch": 0.96, "learning_rate": 7.725102030828324e-06, "loss": 2.473, "step": 35782 }, { "epoch": 0.96, "learning_rate": 7.714307832276447e-06, "loss": 2.5893, "step": 35783 }, { "epoch": 0.96, "learning_rate": 7.703521151103621e-06, "loss": 2.041, "step": 35784 }, { "epoch": 0.96, "learning_rate": 7.692741987391339e-06, "loss": 2.9071, "step": 35785 }, { "epoch": 0.96, "learning_rate": 7.681970341221534e-06, "loss": 2.4855, "step": 35786 }, { "epoch": 0.96, "learning_rate": 7.671206212675807e-06, "loss": 2.6667, "step": 35787 }, { "epoch": 0.96, "learning_rate": 7.660449601835428e-06, "loss": 2.3089, "step": 35788 }, { "epoch": 0.96, "learning_rate": 7.649700508782221e-06, "loss": 2.5586, "step": 35789 }, { "epoch": 0.96, "learning_rate": 7.63895893359734e-06, "loss": 2.456, "step": 35790 }, { "epoch": 0.96, "learning_rate": 7.628224876362389e-06, "loss": 2.2534, "step": 35791 }, { "epoch": 0.96, "learning_rate": 7.617498337158524e-06, "loss": 2.6293, "step": 35792 }, { "epoch": 0.96, "learning_rate": 7.606779316067125e-06, "loss": 2.5864, "step": 35793 }, { "epoch": 0.96, "learning_rate": 7.596067813169238e-06, "loss": 2.4485, "step": 35794 }, { "epoch": 0.96, "learning_rate": 7.585363828546243e-06, "loss": 2.2741, "step": 35795 }, { "epoch": 0.96, "learning_rate": 7.574667362278964e-06, "loss": 2.5318, "step": 35796 }, { "epoch": 0.96, "learning_rate": 7.56397841444878e-06, "loss": 2.5612, "step": 35797 }, { "epoch": 0.96, "learning_rate": 7.553296985136293e-06, "loss": 2.0528, "step": 35798 }, { "epoch": 0.96, "learning_rate": 7.542623074422661e-06, "loss": 2.1291, "step": 35799 }, { "epoch": 0.96, "learning_rate": 7.531956682388708e-06, "loss": 2.3298, "step": 35800 }, { "epoch": 0.96, "learning_rate": 7.521297809115146e-06, "loss": 3.0136, "step": 35801 }, { "epoch": 0.96, "learning_rate": 7.510646454682802e-06, "loss": 2.5098, "step": 35802 }, { "epoch": 0.96, "learning_rate": 7.500002619172386e-06, "loss": 2.0219, "step": 35803 }, { "epoch": 0.96, "learning_rate": 7.489366302664502e-06, "loss": 2.2835, "step": 35804 }, { "epoch": 0.96, "learning_rate": 7.478737505239752e-06, "loss": 2.2237, "step": 35805 }, { "epoch": 0.96, "learning_rate": 7.468116226978627e-06, "loss": 2.7437, "step": 35806 }, { "epoch": 0.96, "learning_rate": 7.457502467961619e-06, "loss": 2.055, "step": 35807 }, { "epoch": 0.96, "learning_rate": 7.446896228269107e-06, "loss": 2.3885, "step": 35808 }, { "epoch": 0.96, "learning_rate": 7.436297507981471e-06, "loss": 2.5367, "step": 35809 }, { "epoch": 0.96, "learning_rate": 7.42570630717887e-06, "loss": 2.2413, "step": 35810 }, { "epoch": 0.96, "learning_rate": 7.4151226259419055e-06, "loss": 2.7199, "step": 35811 }, { "epoch": 0.96, "learning_rate": 7.404546464350292e-06, "loss": 2.558, "step": 35812 }, { "epoch": 0.96, "learning_rate": 7.393977822484521e-06, "loss": 2.197, "step": 35813 }, { "epoch": 0.96, "learning_rate": 7.383416700424417e-06, "loss": 2.5536, "step": 35814 }, { "epoch": 0.96, "learning_rate": 7.372863098250138e-06, "loss": 2.5477, "step": 35815 }, { "epoch": 0.96, "learning_rate": 7.3623170160415085e-06, "loss": 2.5674, "step": 35816 }, { "epoch": 0.96, "learning_rate": 7.351778453878577e-06, "loss": 2.6309, "step": 35817 }, { "epoch": 0.96, "learning_rate": 7.3412474118410565e-06, "loss": 2.2718, "step": 35818 }, { "epoch": 0.96, "learning_rate": 7.330723890008884e-06, "loss": 2.5024, "step": 35819 }, { "epoch": 0.96, "learning_rate": 7.3202078884615496e-06, "loss": 2.5918, "step": 35820 }, { "epoch": 0.96, "learning_rate": 7.30969940727888e-06, "loss": 2.5177, "step": 35821 }, { "epoch": 0.96, "learning_rate": 7.299198446540478e-06, "loss": 2.5198, "step": 35822 }, { "epoch": 0.96, "learning_rate": 7.288705006325836e-06, "loss": 2.5093, "step": 35823 }, { "epoch": 0.96, "learning_rate": 7.2782190867145545e-06, "loss": 2.6573, "step": 35824 }, { "epoch": 0.96, "learning_rate": 7.267740687785907e-06, "loss": 2.2475, "step": 35825 }, { "epoch": 0.96, "learning_rate": 7.257269809619383e-06, "loss": 2.5412, "step": 35826 }, { "epoch": 0.96, "learning_rate": 7.246806452294363e-06, "loss": 2.42, "step": 35827 }, { "epoch": 0.96, "learning_rate": 7.236350615890008e-06, "loss": 2.6562, "step": 35828 }, { "epoch": 0.96, "learning_rate": 7.225902300485476e-06, "loss": 2.2989, "step": 35829 }, { "epoch": 0.96, "learning_rate": 7.215461506160259e-06, "loss": 2.3444, "step": 35830 }, { "epoch": 0.96, "learning_rate": 7.205028232993072e-06, "loss": 2.5241, "step": 35831 }, { "epoch": 0.96, "learning_rate": 7.194602481063073e-06, "loss": 2.1935, "step": 35832 }, { "epoch": 0.96, "learning_rate": 7.18418425044931e-06, "loss": 2.7442, "step": 35833 }, { "epoch": 0.96, "learning_rate": 7.17377354123061e-06, "loss": 2.4099, "step": 35834 }, { "epoch": 0.96, "learning_rate": 7.16337035348591e-06, "loss": 2.8438, "step": 35835 }, { "epoch": 0.96, "learning_rate": 7.152974687294034e-06, "loss": 2.3341, "step": 35836 }, { "epoch": 0.96, "learning_rate": 7.142586542733698e-06, "loss": 2.5711, "step": 35837 }, { "epoch": 0.96, "learning_rate": 7.132205919883727e-06, "loss": 2.3117, "step": 35838 }, { "epoch": 0.96, "learning_rate": 7.121832818822616e-06, "loss": 2.299, "step": 35839 }, { "epoch": 0.96, "learning_rate": 7.111467239628855e-06, "loss": 2.2489, "step": 35840 }, { "epoch": 0.96, "learning_rate": 7.101109182381271e-06, "loss": 2.5623, "step": 35841 }, { "epoch": 0.96, "learning_rate": 7.0907586471580245e-06, "loss": 2.4739, "step": 35842 }, { "epoch": 0.96, "learning_rate": 7.080415634037829e-06, "loss": 2.3731, "step": 35843 }, { "epoch": 0.96, "learning_rate": 7.0700801430988444e-06, "loss": 2.1492, "step": 35844 }, { "epoch": 0.96, "learning_rate": 7.059752174419342e-06, "loss": 2.3448, "step": 35845 }, { "epoch": 0.96, "learning_rate": 7.049431728077704e-06, "loss": 2.335, "step": 35846 }, { "epoch": 0.96, "learning_rate": 7.039118804151978e-06, "loss": 2.3236, "step": 35847 }, { "epoch": 0.96, "learning_rate": 7.028813402720435e-06, "loss": 2.5554, "step": 35848 }, { "epoch": 0.96, "learning_rate": 7.0185155238610135e-06, "loss": 2.177, "step": 35849 }, { "epoch": 0.96, "learning_rate": 7.008225167651761e-06, "loss": 2.4219, "step": 35850 }, { "epoch": 0.96, "learning_rate": 6.997942334170837e-06, "loss": 2.6559, "step": 35851 }, { "epoch": 0.96, "learning_rate": 6.9876670234958475e-06, "loss": 2.3969, "step": 35852 }, { "epoch": 0.96, "learning_rate": 6.977399235704729e-06, "loss": 2.1008, "step": 35853 }, { "epoch": 0.96, "learning_rate": 6.96713897087542e-06, "loss": 2.5998, "step": 35854 }, { "epoch": 0.96, "learning_rate": 6.9568862290853015e-06, "loss": 1.7498, "step": 35855 }, { "epoch": 0.96, "learning_rate": 6.946641010412425e-06, "loss": 2.903, "step": 35856 }, { "epoch": 0.96, "learning_rate": 6.936403314934281e-06, "loss": 2.6935, "step": 35857 }, { "epoch": 0.96, "learning_rate": 6.9261731427283645e-06, "loss": 2.606, "step": 35858 }, { "epoch": 0.96, "learning_rate": 6.915950493872281e-06, "loss": 2.5684, "step": 35859 }, { "epoch": 0.96, "learning_rate": 6.9057353684433e-06, "loss": 2.4052, "step": 35860 }, { "epoch": 0.96, "learning_rate": 6.8955277665190275e-06, "loss": 2.1624, "step": 35861 }, { "epoch": 0.96, "learning_rate": 6.885327688176513e-06, "loss": 2.3681, "step": 35862 }, { "epoch": 0.96, "learning_rate": 6.87513513349336e-06, "loss": 2.4841, "step": 35863 }, { "epoch": 0.96, "learning_rate": 6.864950102546619e-06, "loss": 2.4155, "step": 35864 }, { "epoch": 0.96, "learning_rate": 6.85477259541345e-06, "loss": 2.4287, "step": 35865 }, { "epoch": 0.96, "learning_rate": 6.844602612170903e-06, "loss": 2.7979, "step": 35866 }, { "epoch": 0.96, "learning_rate": 6.834440152896137e-06, "loss": 2.4529, "step": 35867 }, { "epoch": 0.96, "learning_rate": 6.824285217666093e-06, "loss": 2.3147, "step": 35868 }, { "epoch": 0.96, "learning_rate": 6.8141378065575965e-06, "loss": 2.2943, "step": 35869 }, { "epoch": 0.96, "learning_rate": 6.8039979196478084e-06, "loss": 2.5317, "step": 35870 }, { "epoch": 0.96, "learning_rate": 6.793865557013224e-06, "loss": 2.5687, "step": 35871 }, { "epoch": 0.96, "learning_rate": 6.78374071873078e-06, "loss": 2.4771, "step": 35872 }, { "epoch": 0.96, "learning_rate": 6.773623404877194e-06, "loss": 2.221, "step": 35873 }, { "epoch": 0.96, "learning_rate": 6.763513615529071e-06, "loss": 2.3418, "step": 35874 }, { "epoch": 0.96, "learning_rate": 6.753411350762906e-06, "loss": 3.0261, "step": 35875 }, { "epoch": 0.96, "learning_rate": 6.743316610655415e-06, "loss": 2.1198, "step": 35876 }, { "epoch": 0.96, "learning_rate": 6.733229395282869e-06, "loss": 2.1752, "step": 35877 }, { "epoch": 0.96, "learning_rate": 6.723149704721987e-06, "loss": 2.6503, "step": 35878 }, { "epoch": 0.96, "learning_rate": 6.713077539048817e-06, "loss": 2.9341, "step": 35879 }, { "epoch": 0.96, "learning_rate": 6.703012898339744e-06, "loss": 2.4609, "step": 35880 }, { "epoch": 0.96, "learning_rate": 6.69295578267104e-06, "loss": 2.6363, "step": 35881 }, { "epoch": 0.96, "learning_rate": 6.682906192118976e-06, "loss": 2.521, "step": 35882 }, { "epoch": 0.96, "learning_rate": 6.672864126759715e-06, "loss": 2.9513, "step": 35883 }, { "epoch": 0.96, "learning_rate": 6.6628295866691945e-06, "loss": 2.4316, "step": 35884 }, { "epoch": 0.96, "learning_rate": 6.652802571923355e-06, "loss": 2.643, "step": 35885 }, { "epoch": 0.96, "learning_rate": 6.642783082598469e-06, "loss": 2.6846, "step": 35886 }, { "epoch": 0.96, "learning_rate": 6.6327711187701426e-06, "loss": 2.4855, "step": 35887 }, { "epoch": 0.96, "learning_rate": 6.622766680514314e-06, "loss": 2.6865, "step": 35888 }, { "epoch": 0.96, "learning_rate": 6.612769767906923e-06, "loss": 2.0145, "step": 35889 }, { "epoch": 0.96, "learning_rate": 6.602780381023577e-06, "loss": 2.6475, "step": 35890 }, { "epoch": 0.96, "learning_rate": 6.59279851993988e-06, "loss": 2.4242, "step": 35891 }, { "epoch": 0.96, "learning_rate": 6.5828241847316615e-06, "loss": 2.4128, "step": 35892 }, { "epoch": 0.96, "learning_rate": 6.572857375474306e-06, "loss": 2.6831, "step": 35893 }, { "epoch": 0.96, "learning_rate": 6.562898092243308e-06, "loss": 2.8754, "step": 35894 }, { "epoch": 0.96, "learning_rate": 6.552946335114274e-06, "loss": 2.1783, "step": 35895 }, { "epoch": 0.96, "learning_rate": 6.543002104162366e-06, "loss": 2.6423, "step": 35896 }, { "epoch": 0.96, "learning_rate": 6.5330653994631895e-06, "loss": 2.8205, "step": 35897 }, { "epoch": 0.96, "learning_rate": 6.523136221091908e-06, "loss": 2.1604, "step": 35898 }, { "epoch": 0.96, "learning_rate": 6.5132145691236825e-06, "loss": 2.3009, "step": 35899 }, { "epoch": 0.96, "learning_rate": 6.5033004436337866e-06, "loss": 2.5022, "step": 35900 }, { "epoch": 0.96, "learning_rate": 6.4933938446970485e-06, "loss": 2.8597, "step": 35901 }, { "epoch": 0.96, "learning_rate": 6.483494772388965e-06, "loss": 2.3242, "step": 35902 }, { "epoch": 0.96, "learning_rate": 6.473603226784252e-06, "loss": 2.6404, "step": 35903 }, { "epoch": 0.96, "learning_rate": 6.463719207957852e-06, "loss": 2.0328, "step": 35904 }, { "epoch": 0.96, "learning_rate": 6.453842715984704e-06, "loss": 2.3809, "step": 35905 }, { "epoch": 0.96, "learning_rate": 6.443973750939636e-06, "loss": 2.4597, "step": 35906 }, { "epoch": 0.96, "learning_rate": 6.434112312897367e-06, "loss": 2.7241, "step": 35907 }, { "epoch": 0.96, "learning_rate": 6.4242584019326144e-06, "loss": 2.466, "step": 35908 }, { "epoch": 0.97, "learning_rate": 6.414412018120097e-06, "loss": 2.7641, "step": 35909 }, { "epoch": 0.97, "learning_rate": 6.404573161534311e-06, "loss": 2.4623, "step": 35910 }, { "epoch": 0.97, "learning_rate": 6.394741832249862e-06, "loss": 2.5753, "step": 35911 }, { "epoch": 0.97, "learning_rate": 6.384918030341247e-06, "loss": 2.5481, "step": 35912 }, { "epoch": 0.97, "learning_rate": 6.3751017558828504e-06, "loss": 2.182, "step": 35913 }, { "epoch": 0.97, "learning_rate": 6.365293008948947e-06, "loss": 2.4665, "step": 35914 }, { "epoch": 0.97, "learning_rate": 6.355491789613921e-06, "loss": 2.5516, "step": 35915 }, { "epoch": 0.97, "learning_rate": 6.345698097952158e-06, "loss": 2.0495, "step": 35916 }, { "epoch": 0.97, "learning_rate": 6.335911934037708e-06, "loss": 2.1124, "step": 35917 }, { "epoch": 0.97, "learning_rate": 6.326133297944736e-06, "loss": 2.665, "step": 35918 }, { "epoch": 0.97, "learning_rate": 6.316362189747293e-06, "loss": 2.4168, "step": 35919 }, { "epoch": 0.97, "learning_rate": 6.306598609519431e-06, "loss": 2.7992, "step": 35920 }, { "epoch": 0.97, "learning_rate": 6.296842557335203e-06, "loss": 2.4527, "step": 35921 }, { "epoch": 0.97, "learning_rate": 6.287094033268326e-06, "loss": 2.3538, "step": 35922 }, { "epoch": 0.97, "learning_rate": 6.277353037392852e-06, "loss": 2.3542, "step": 35923 }, { "epoch": 0.97, "learning_rate": 6.267619569782501e-06, "loss": 2.8034, "step": 35924 }, { "epoch": 0.97, "learning_rate": 6.25789363051088e-06, "loss": 2.3178, "step": 35925 }, { "epoch": 0.97, "learning_rate": 6.2481752196519305e-06, "loss": 2.5978, "step": 35926 }, { "epoch": 0.97, "learning_rate": 6.238464337279037e-06, "loss": 2.2374, "step": 35927 }, { "epoch": 0.97, "learning_rate": 6.22876098346592e-06, "loss": 2.3361, "step": 35928 }, { "epoch": 0.97, "learning_rate": 6.219065158286075e-06, "loss": 2.4527, "step": 35929 }, { "epoch": 0.97, "learning_rate": 6.209376861812776e-06, "loss": 2.4398, "step": 35930 }, { "epoch": 0.97, "learning_rate": 6.199696094119745e-06, "loss": 2.3862, "step": 35931 }, { "epoch": 0.97, "learning_rate": 6.190022855280031e-06, "loss": 2.5485, "step": 35932 }, { "epoch": 0.97, "learning_rate": 6.180357145367133e-06, "loss": 2.5191, "step": 35933 }, { "epoch": 0.97, "learning_rate": 6.170698964453991e-06, "loss": 1.8542, "step": 35934 }, { "epoch": 0.97, "learning_rate": 6.161048312614104e-06, "loss": 2.5758, "step": 35935 }, { "epoch": 0.97, "learning_rate": 6.151405189920412e-06, "loss": 2.5318, "step": 35936 }, { "epoch": 0.97, "learning_rate": 6.1417695964459675e-06, "loss": 2.3708, "step": 35937 }, { "epoch": 0.97, "learning_rate": 6.132141532263824e-06, "loss": 2.3627, "step": 35938 }, { "epoch": 0.97, "learning_rate": 6.1225209974468125e-06, "loss": 2.4443, "step": 35939 }, { "epoch": 0.97, "learning_rate": 6.112907992067873e-06, "loss": 2.4928, "step": 35940 }, { "epoch": 0.97, "learning_rate": 6.103302516199949e-06, "loss": 2.3046, "step": 35941 }, { "epoch": 0.97, "learning_rate": 6.093704569915648e-06, "loss": 3.1062, "step": 35942 }, { "epoch": 0.97, "learning_rate": 6.0841141532878005e-06, "loss": 2.4057, "step": 35943 }, { "epoch": 0.97, "learning_rate": 6.0745312663890166e-06, "loss": 2.0574, "step": 35944 }, { "epoch": 0.97, "learning_rate": 6.064955909291902e-06, "loss": 2.7462, "step": 35945 }, { "epoch": 0.97, "learning_rate": 6.055388082068958e-06, "loss": 1.9674, "step": 35946 }, { "epoch": 0.97, "learning_rate": 6.045827784792679e-06, "loss": 2.5741, "step": 35947 }, { "epoch": 0.97, "learning_rate": 6.036275017535453e-06, "loss": 2.5326, "step": 35948 }, { "epoch": 0.97, "learning_rate": 6.026729780369778e-06, "loss": 2.7375, "step": 35949 }, { "epoch": 0.97, "learning_rate": 6.0171920733678165e-06, "loss": 2.7299, "step": 35950 }, { "epoch": 0.97, "learning_rate": 6.007661896601957e-06, "loss": 2.8949, "step": 35951 }, { "epoch": 0.97, "learning_rate": 5.998139250144363e-06, "loss": 2.6634, "step": 35952 }, { "epoch": 0.97, "learning_rate": 5.988624134067089e-06, "loss": 2.4224, "step": 35953 }, { "epoch": 0.97, "learning_rate": 5.979116548442409e-06, "loss": 2.4675, "step": 35954 }, { "epoch": 0.97, "learning_rate": 5.969616493342045e-06, "loss": 2.5312, "step": 35955 }, { "epoch": 0.97, "learning_rate": 5.960123968838272e-06, "loss": 2.1634, "step": 35956 }, { "epoch": 0.97, "learning_rate": 5.95063897500292e-06, "loss": 2.9602, "step": 35957 }, { "epoch": 0.97, "learning_rate": 5.941161511907711e-06, "loss": 1.9328, "step": 35958 }, { "epoch": 0.97, "learning_rate": 5.931691579624587e-06, "loss": 2.5257, "step": 35959 }, { "epoch": 0.97, "learning_rate": 5.922229178225269e-06, "loss": 2.7771, "step": 35960 }, { "epoch": 0.97, "learning_rate": 5.9127743077813655e-06, "loss": 2.751, "step": 35961 }, { "epoch": 0.97, "learning_rate": 5.903326968364597e-06, "loss": 2.4821, "step": 35962 }, { "epoch": 0.97, "learning_rate": 5.893887160046463e-06, "loss": 2.6415, "step": 35963 }, { "epoch": 0.97, "learning_rate": 5.884454882898571e-06, "loss": 2.4351, "step": 35964 }, { "epoch": 0.97, "learning_rate": 5.875030136992199e-06, "loss": 2.6291, "step": 35965 }, { "epoch": 0.97, "learning_rate": 5.865612922398955e-06, "loss": 2.1501, "step": 35966 }, { "epoch": 0.97, "learning_rate": 5.856203239190006e-06, "loss": 2.1, "step": 35967 }, { "epoch": 0.97, "learning_rate": 5.846801087436849e-06, "loss": 2.6017, "step": 35968 }, { "epoch": 0.97, "learning_rate": 5.837406467210538e-06, "loss": 2.4283, "step": 35969 }, { "epoch": 0.97, "learning_rate": 5.82801937858235e-06, "loss": 2.3532, "step": 35970 }, { "epoch": 0.97, "learning_rate": 5.818639821623228e-06, "loss": 2.4569, "step": 35971 }, { "epoch": 0.97, "learning_rate": 5.809267796404449e-06, "loss": 2.5049, "step": 35972 }, { "epoch": 0.97, "learning_rate": 5.799903302996845e-06, "loss": 2.4373, "step": 35973 }, { "epoch": 0.97, "learning_rate": 5.790546341471359e-06, "loss": 2.2785, "step": 35974 }, { "epoch": 0.97, "learning_rate": 5.781196911899156e-06, "loss": 2.5364, "step": 35975 }, { "epoch": 0.97, "learning_rate": 5.771855014350735e-06, "loss": 2.4985, "step": 35976 }, { "epoch": 0.97, "learning_rate": 5.76252064889693e-06, "loss": 2.5178, "step": 35977 }, { "epoch": 0.97, "learning_rate": 5.753193815608682e-06, "loss": 2.6083, "step": 35978 }, { "epoch": 0.97, "learning_rate": 5.743874514556268e-06, "loss": 2.0844, "step": 35979 }, { "epoch": 0.97, "learning_rate": 5.734562745810634e-06, "loss": 2.4931, "step": 35980 }, { "epoch": 0.97, "learning_rate": 5.725258509442166e-06, "loss": 2.6522, "step": 35981 }, { "epoch": 0.97, "learning_rate": 5.7159618055213634e-06, "loss": 2.4281, "step": 35982 }, { "epoch": 0.97, "learning_rate": 5.706672634118726e-06, "loss": 2.6694, "step": 35983 }, { "epoch": 0.97, "learning_rate": 5.697390995304641e-06, "loss": 2.4406, "step": 35984 }, { "epoch": 0.97, "learning_rate": 5.688116889149164e-06, "loss": 2.4886, "step": 35985 }, { "epoch": 0.97, "learning_rate": 5.678850315722906e-06, "loss": 2.6865, "step": 35986 }, { "epoch": 0.97, "learning_rate": 5.669591275095809e-06, "loss": 2.2182, "step": 35987 }, { "epoch": 0.97, "learning_rate": 5.660339767338151e-06, "loss": 2.6785, "step": 35988 }, { "epoch": 0.97, "learning_rate": 5.651095792519989e-06, "loss": 2.8324, "step": 35989 }, { "epoch": 0.97, "learning_rate": 5.641859350711376e-06, "loss": 2.3654, "step": 35990 }, { "epoch": 0.97, "learning_rate": 5.632630441982256e-06, "loss": 2.5222, "step": 35991 }, { "epoch": 0.97, "learning_rate": 5.6234090664025735e-06, "loss": 2.6309, "step": 35992 }, { "epoch": 0.97, "learning_rate": 5.614195224042162e-06, "loss": 2.4788, "step": 35993 }, { "epoch": 0.97, "learning_rate": 5.604988914970744e-06, "loss": 2.5387, "step": 35994 }, { "epoch": 0.97, "learning_rate": 5.595790139258261e-06, "loss": 2.7031, "step": 35995 }, { "epoch": 0.97, "learning_rate": 5.586598896974215e-06, "loss": 2.3023, "step": 35996 }, { "epoch": 0.97, "learning_rate": 5.577415188188328e-06, "loss": 2.3479, "step": 35997 }, { "epoch": 0.97, "learning_rate": 5.5682390129701e-06, "loss": 2.3893, "step": 35998 }, { "epoch": 0.97, "learning_rate": 5.559070371389252e-06, "loss": 2.56, "step": 35999 }, { "epoch": 0.97, "learning_rate": 5.549909263514951e-06, "loss": 2.3221, "step": 36000 }, { "epoch": 0.97, "learning_rate": 5.54075568941681e-06, "loss": 2.6197, "step": 36001 }, { "epoch": 0.97, "learning_rate": 5.5316096491641044e-06, "loss": 2.67, "step": 36002 }, { "epoch": 0.97, "learning_rate": 5.5224711428261136e-06, "loss": 2.4542, "step": 36003 }, { "epoch": 0.97, "learning_rate": 5.513340170472114e-06, "loss": 2.3904, "step": 36004 }, { "epoch": 0.97, "learning_rate": 5.504216732171274e-06, "loss": 1.8817, "step": 36005 }, { "epoch": 0.97, "learning_rate": 5.49510082799265e-06, "loss": 2.4553, "step": 36006 }, { "epoch": 0.97, "learning_rate": 5.485992458005407e-06, "loss": 2.3306, "step": 36007 }, { "epoch": 0.97, "learning_rate": 5.476891622278379e-06, "loss": 2.8045, "step": 36008 }, { "epoch": 0.97, "learning_rate": 5.467798320880624e-06, "loss": 2.8438, "step": 36009 }, { "epoch": 0.97, "learning_rate": 5.4587125538810846e-06, "loss": 2.5913, "step": 36010 }, { "epoch": 0.97, "learning_rate": 5.449634321348484e-06, "loss": 2.7284, "step": 36011 }, { "epoch": 0.97, "learning_rate": 5.4405636233516575e-06, "loss": 2.5729, "step": 36012 }, { "epoch": 0.97, "learning_rate": 5.431500459959326e-06, "loss": 2.4043, "step": 36013 }, { "epoch": 0.97, "learning_rate": 5.422444831240103e-06, "loss": 2.4413, "step": 36014 }, { "epoch": 0.97, "learning_rate": 5.41339673726271e-06, "loss": 2.5673, "step": 36015 }, { "epoch": 0.97, "learning_rate": 5.404356178095537e-06, "loss": 2.1341, "step": 36016 }, { "epoch": 0.97, "learning_rate": 5.395323153807196e-06, "loss": 2.5249, "step": 36017 }, { "epoch": 0.97, "learning_rate": 5.386297664466078e-06, "loss": 2.5099, "step": 36018 }, { "epoch": 0.97, "learning_rate": 5.377279710140459e-06, "loss": 2.315, "step": 36019 }, { "epoch": 0.97, "learning_rate": 5.368269290898731e-06, "loss": 2.6687, "step": 36020 }, { "epoch": 0.97, "learning_rate": 5.359266406809282e-06, "loss": 2.1943, "step": 36021 }, { "epoch": 0.97, "learning_rate": 5.35027105794017e-06, "loss": 2.3135, "step": 36022 }, { "epoch": 0.97, "learning_rate": 5.341283244359452e-06, "loss": 1.8359, "step": 36023 }, { "epoch": 0.97, "learning_rate": 5.332302966135516e-06, "loss": 2.4093, "step": 36024 }, { "epoch": 0.97, "learning_rate": 5.323330223336198e-06, "loss": 2.5464, "step": 36025 }, { "epoch": 0.97, "learning_rate": 5.314365016029443e-06, "loss": 3.2329, "step": 36026 }, { "epoch": 0.97, "learning_rate": 5.3054073442831974e-06, "loss": 2.3425, "step": 36027 }, { "epoch": 0.97, "learning_rate": 5.296457208165406e-06, "loss": 2.8485, "step": 36028 }, { "epoch": 0.97, "learning_rate": 5.287514607743793e-06, "loss": 2.3375, "step": 36029 }, { "epoch": 0.97, "learning_rate": 5.278579543086193e-06, "loss": 2.7442, "step": 36030 }, { "epoch": 0.97, "learning_rate": 5.269652014260106e-06, "loss": 2.1241, "step": 36031 }, { "epoch": 0.97, "learning_rate": 5.2607320213334806e-06, "loss": 2.4964, "step": 36032 }, { "epoch": 0.97, "learning_rate": 5.2518195643735946e-06, "loss": 2.5403, "step": 36033 }, { "epoch": 0.97, "learning_rate": 5.24291464344806e-06, "loss": 2.2318, "step": 36034 }, { "epoch": 0.97, "learning_rate": 5.234017258624379e-06, "loss": 2.6473, "step": 36035 }, { "epoch": 0.97, "learning_rate": 5.225127409969943e-06, "loss": 2.1979, "step": 36036 }, { "epoch": 0.97, "learning_rate": 5.2162450975521415e-06, "loss": 2.446, "step": 36037 }, { "epoch": 0.97, "learning_rate": 5.207370321438143e-06, "loss": 2.2322, "step": 36038 }, { "epoch": 0.97, "learning_rate": 5.198503081695228e-06, "loss": 2.1119, "step": 36039 }, { "epoch": 0.97, "learning_rate": 5.1896433783906735e-06, "loss": 2.8136, "step": 36040 }, { "epoch": 0.97, "learning_rate": 5.180791211591429e-06, "loss": 2.5518, "step": 36041 }, { "epoch": 0.97, "learning_rate": 5.171946581364773e-06, "loss": 2.8485, "step": 36042 }, { "epoch": 0.97, "learning_rate": 5.16310948777754e-06, "loss": 2.2978, "step": 36043 }, { "epoch": 0.97, "learning_rate": 5.154279930896788e-06, "loss": 2.2729, "step": 36044 }, { "epoch": 0.97, "learning_rate": 5.145457910789242e-06, "loss": 2.43, "step": 36045 }, { "epoch": 0.97, "learning_rate": 5.136643427521848e-06, "loss": 2.4354, "step": 36046 }, { "epoch": 0.97, "learning_rate": 5.127836481161441e-06, "loss": 2.287, "step": 36047 }, { "epoch": 0.97, "learning_rate": 5.119037071774746e-06, "loss": 2.3617, "step": 36048 }, { "epoch": 0.97, "learning_rate": 5.110245199428265e-06, "loss": 2.3168, "step": 36049 }, { "epoch": 0.97, "learning_rate": 5.101460864188723e-06, "loss": 2.3723, "step": 36050 }, { "epoch": 0.97, "learning_rate": 5.0926840661226215e-06, "loss": 2.0609, "step": 36051 }, { "epoch": 0.97, "learning_rate": 5.083914805296463e-06, "loss": 2.5933, "step": 36052 }, { "epoch": 0.97, "learning_rate": 5.07515308177664e-06, "loss": 3.0003, "step": 36053 }, { "epoch": 0.97, "learning_rate": 5.066398895629654e-06, "loss": 2.2378, "step": 36054 }, { "epoch": 0.97, "learning_rate": 5.057652246921784e-06, "loss": 2.4923, "step": 36055 }, { "epoch": 0.97, "learning_rate": 5.048913135719202e-06, "loss": 2.524, "step": 36056 }, { "epoch": 0.97, "learning_rate": 5.040181562088187e-06, "loss": 2.0807, "step": 36057 }, { "epoch": 0.97, "learning_rate": 5.031457526094907e-06, "loss": 2.7197, "step": 36058 }, { "epoch": 0.97, "learning_rate": 5.022741027805422e-06, "loss": 2.4693, "step": 36059 }, { "epoch": 0.97, "learning_rate": 5.014032067285679e-06, "loss": 2.8102, "step": 36060 }, { "epoch": 0.97, "learning_rate": 5.0053306446018465e-06, "loss": 2.6673, "step": 36061 }, { "epoch": 0.97, "learning_rate": 4.996636759819651e-06, "loss": 2.6431, "step": 36062 }, { "epoch": 0.97, "learning_rate": 4.987950413005149e-06, "loss": 2.8685, "step": 36063 }, { "epoch": 0.97, "learning_rate": 4.979271604223956e-06, "loss": 2.532, "step": 36064 }, { "epoch": 0.97, "learning_rate": 4.9706003335420195e-06, "loss": 2.4176, "step": 36065 }, { "epoch": 0.97, "learning_rate": 4.961936601024841e-06, "loss": 2.4875, "step": 36066 }, { "epoch": 0.97, "learning_rate": 4.953280406738037e-06, "loss": 2.6867, "step": 36067 }, { "epoch": 0.97, "learning_rate": 4.944631750747442e-06, "loss": 2.2889, "step": 36068 }, { "epoch": 0.97, "learning_rate": 4.9359906331183365e-06, "loss": 2.1886, "step": 36069 }, { "epoch": 0.97, "learning_rate": 4.927357053916337e-06, "loss": 2.7722, "step": 36070 }, { "epoch": 0.97, "learning_rate": 4.918731013206723e-06, "loss": 2.5379, "step": 36071 }, { "epoch": 0.97, "learning_rate": 4.910112511054887e-06, "loss": 2.5878, "step": 36072 }, { "epoch": 0.97, "learning_rate": 4.90150154752611e-06, "loss": 2.4946, "step": 36073 }, { "epoch": 0.97, "learning_rate": 4.892898122685674e-06, "loss": 2.4789, "step": 36074 }, { "epoch": 0.97, "learning_rate": 4.884302236598748e-06, "loss": 2.4309, "step": 36075 }, { "epoch": 0.97, "learning_rate": 4.875713889330502e-06, "loss": 2.9, "step": 36076 }, { "epoch": 0.97, "learning_rate": 4.867133080945884e-06, "loss": 2.3906, "step": 36077 }, { "epoch": 0.97, "learning_rate": 4.858559811509844e-06, "loss": 2.8742, "step": 36078 }, { "epoch": 0.97, "learning_rate": 4.8499940810875495e-06, "loss": 2.8633, "step": 36079 }, { "epoch": 0.97, "learning_rate": 4.841435889743839e-06, "loss": 2.5465, "step": 36080 }, { "epoch": 0.97, "learning_rate": 4.832885237543327e-06, "loss": 2.7256, "step": 36081 }, { "epoch": 0.97, "learning_rate": 4.824342124551073e-06, "loss": 2.7411, "step": 36082 }, { "epoch": 0.97, "learning_rate": 4.8158065508316914e-06, "loss": 2.6135, "step": 36083 }, { "epoch": 0.97, "learning_rate": 4.8072785164497975e-06, "loss": 2.562, "step": 36084 }, { "epoch": 0.97, "learning_rate": 4.7987580214700065e-06, "loss": 2.1621, "step": 36085 }, { "epoch": 0.97, "learning_rate": 4.790245065956933e-06, "loss": 2.086, "step": 36086 }, { "epoch": 0.97, "learning_rate": 4.781739649975081e-06, "loss": 2.4105, "step": 36087 }, { "epoch": 0.97, "learning_rate": 4.773241773588843e-06, "loss": 2.6113, "step": 36088 }, { "epoch": 0.97, "learning_rate": 4.7647514368625024e-06, "loss": 2.4383, "step": 36089 }, { "epoch": 0.97, "learning_rate": 4.756268639860562e-06, "loss": 2.3165, "step": 36090 }, { "epoch": 0.97, "learning_rate": 4.747793382647192e-06, "loss": 2.2587, "step": 36091 }, { "epoch": 0.97, "learning_rate": 4.739325665286565e-06, "loss": 2.975, "step": 36092 }, { "epoch": 0.97, "learning_rate": 4.73086548784285e-06, "loss": 2.5267, "step": 36093 }, { "epoch": 0.97, "learning_rate": 4.72241285038022e-06, "loss": 2.8883, "step": 36094 }, { "epoch": 0.97, "learning_rate": 4.7139677529626225e-06, "loss": 2.4989, "step": 36095 }, { "epoch": 0.97, "learning_rate": 4.7055301956541174e-06, "loss": 2.2694, "step": 36096 }, { "epoch": 0.97, "learning_rate": 4.697100178518543e-06, "loss": 2.7981, "step": 36097 }, { "epoch": 0.97, "learning_rate": 4.688677701619737e-06, "loss": 2.3027, "step": 36098 }, { "epoch": 0.97, "learning_rate": 4.680262765021537e-06, "loss": 2.9192, "step": 36099 }, { "epoch": 0.97, "learning_rate": 4.6718553687877804e-06, "loss": 2.7146, "step": 36100 }, { "epoch": 0.97, "learning_rate": 4.663455512982085e-06, "loss": 2.0162, "step": 36101 }, { "epoch": 0.97, "learning_rate": 4.655063197668174e-06, "loss": 2.7191, "step": 36102 }, { "epoch": 0.97, "learning_rate": 4.646678422909556e-06, "loss": 2.2599, "step": 36103 }, { "epoch": 0.97, "learning_rate": 4.638301188769622e-06, "loss": 2.4048, "step": 36104 }, { "epoch": 0.97, "learning_rate": 4.629931495312101e-06, "loss": 2.3366, "step": 36105 }, { "epoch": 0.97, "learning_rate": 4.6215693426001625e-06, "loss": 2.612, "step": 36106 }, { "epoch": 0.97, "learning_rate": 4.613214730697312e-06, "loss": 2.7238, "step": 36107 }, { "epoch": 0.97, "learning_rate": 4.604867659666723e-06, "loss": 2.821, "step": 36108 }, { "epoch": 0.97, "learning_rate": 4.596528129571787e-06, "loss": 2.2989, "step": 36109 }, { "epoch": 0.97, "learning_rate": 4.5881961404755645e-06, "loss": 2.6244, "step": 36110 }, { "epoch": 0.97, "learning_rate": 4.579871692441118e-06, "loss": 2.4371, "step": 36111 }, { "epoch": 0.97, "learning_rate": 4.5715547855317285e-06, "loss": 2.807, "step": 36112 }, { "epoch": 0.97, "learning_rate": 4.563245419810125e-06, "loss": 2.2914, "step": 36113 }, { "epoch": 0.97, "learning_rate": 4.554943595339478e-06, "loss": 2.1653, "step": 36114 }, { "epoch": 0.97, "learning_rate": 4.546649312182738e-06, "loss": 2.8443, "step": 36115 }, { "epoch": 0.97, "learning_rate": 4.538362570402521e-06, "loss": 2.5666, "step": 36116 }, { "epoch": 0.97, "learning_rate": 4.530083370061666e-06, "loss": 2.6608, "step": 36117 }, { "epoch": 0.97, "learning_rate": 4.5218117112229e-06, "loss": 2.7304, "step": 36118 }, { "epoch": 0.97, "learning_rate": 4.513547593948952e-06, "loss": 2.3317, "step": 36119 }, { "epoch": 0.97, "learning_rate": 4.5052910183024375e-06, "loss": 2.2397, "step": 36120 }, { "epoch": 0.97, "learning_rate": 4.497041984345751e-06, "loss": 2.6125, "step": 36121 }, { "epoch": 0.97, "learning_rate": 4.488800492141509e-06, "loss": 2.6412, "step": 36122 }, { "epoch": 0.97, "learning_rate": 4.480566541752218e-06, "loss": 2.4477, "step": 36123 }, { "epoch": 0.97, "learning_rate": 4.47234013324016e-06, "loss": 2.5744, "step": 36124 }, { "epoch": 0.97, "learning_rate": 4.46412126666762e-06, "loss": 2.6631, "step": 36125 }, { "epoch": 0.97, "learning_rate": 4.455909942096992e-06, "loss": 2.6615, "step": 36126 }, { "epoch": 0.97, "learning_rate": 4.447706159590337e-06, "loss": 2.2652, "step": 36127 }, { "epoch": 0.97, "learning_rate": 4.4395099192099385e-06, "loss": 2.6047, "step": 36128 }, { "epoch": 0.97, "learning_rate": 4.431321221017748e-06, "loss": 2.7615, "step": 36129 }, { "epoch": 0.97, "learning_rate": 4.4231400650758256e-06, "loss": 2.7157, "step": 36130 }, { "epoch": 0.97, "learning_rate": 4.414966451446345e-06, "loss": 2.2309, "step": 36131 }, { "epoch": 0.97, "learning_rate": 4.406800380190923e-06, "loss": 2.2019, "step": 36132 }, { "epoch": 0.97, "learning_rate": 4.398641851371732e-06, "loss": 2.6244, "step": 36133 }, { "epoch": 0.97, "learning_rate": 4.390490865050389e-06, "loss": 2.6144, "step": 36134 }, { "epoch": 0.97, "learning_rate": 4.382347421288735e-06, "loss": 2.7824, "step": 36135 }, { "epoch": 0.97, "learning_rate": 4.374211520148275e-06, "loss": 1.9831, "step": 36136 }, { "epoch": 0.97, "learning_rate": 4.366083161690959e-06, "loss": 2.4074, "step": 36137 }, { "epoch": 0.97, "learning_rate": 4.357962345978073e-06, "loss": 2.6191, "step": 36138 }, { "epoch": 0.97, "learning_rate": 4.349849073071344e-06, "loss": 2.3038, "step": 36139 }, { "epoch": 0.97, "learning_rate": 4.3417433430320565e-06, "loss": 2.4681, "step": 36140 }, { "epoch": 0.97, "learning_rate": 4.3336451559217174e-06, "loss": 2.3058, "step": 36141 }, { "epoch": 0.97, "learning_rate": 4.325554511801721e-06, "loss": 2.5498, "step": 36142 }, { "epoch": 0.97, "learning_rate": 4.3174714107333535e-06, "loss": 2.5851, "step": 36143 }, { "epoch": 0.97, "learning_rate": 4.309395852777787e-06, "loss": 2.7046, "step": 36144 }, { "epoch": 0.97, "learning_rate": 4.301327837996194e-06, "loss": 2.9709, "step": 36145 }, { "epoch": 0.97, "learning_rate": 4.293267366449749e-06, "loss": 2.5402, "step": 36146 }, { "epoch": 0.97, "learning_rate": 4.285214438199514e-06, "loss": 2.5044, "step": 36147 }, { "epoch": 0.97, "learning_rate": 4.27716905330644e-06, "loss": 2.9263, "step": 36148 }, { "epoch": 0.97, "learning_rate": 4.269131211831478e-06, "loss": 2.6049, "step": 36149 }, { "epoch": 0.97, "learning_rate": 4.261100913835691e-06, "loss": 2.722, "step": 36150 }, { "epoch": 0.97, "learning_rate": 4.253078159379698e-06, "loss": 2.4959, "step": 36151 }, { "epoch": 0.97, "learning_rate": 4.245062948524336e-06, "loss": 2.7987, "step": 36152 }, { "epoch": 0.97, "learning_rate": 4.237055281330337e-06, "loss": 2.6077, "step": 36153 }, { "epoch": 0.97, "learning_rate": 4.22905515785843e-06, "loss": 2.336, "step": 36154 }, { "epoch": 0.97, "learning_rate": 4.221062578169233e-06, "loss": 2.8469, "step": 36155 }, { "epoch": 0.97, "learning_rate": 4.21307754232314e-06, "loss": 2.5984, "step": 36156 }, { "epoch": 0.97, "learning_rate": 4.205100050380772e-06, "loss": 2.5594, "step": 36157 }, { "epoch": 0.97, "learning_rate": 4.197130102402525e-06, "loss": 2.397, "step": 36158 }, { "epoch": 0.97, "learning_rate": 4.189167698448793e-06, "loss": 2.5988, "step": 36159 }, { "epoch": 0.97, "learning_rate": 4.181212838579862e-06, "loss": 2.5375, "step": 36160 }, { "epoch": 0.97, "learning_rate": 4.173265522856018e-06, "loss": 2.4451, "step": 36161 }, { "epoch": 0.97, "learning_rate": 4.165325751337546e-06, "loss": 2.7897, "step": 36162 }, { "epoch": 0.97, "learning_rate": 4.157393524084508e-06, "loss": 2.4939, "step": 36163 }, { "epoch": 0.97, "learning_rate": 4.149468841157078e-06, "loss": 2.6326, "step": 36164 }, { "epoch": 0.97, "learning_rate": 4.141551702615098e-06, "loss": 2.7755, "step": 36165 }, { "epoch": 0.97, "learning_rate": 4.133642108518743e-06, "loss": 2.4456, "step": 36166 }, { "epoch": 0.97, "learning_rate": 4.125740058927851e-06, "loss": 2.8089, "step": 36167 }, { "epoch": 0.97, "learning_rate": 4.117845553902377e-06, "loss": 2.714, "step": 36168 }, { "epoch": 0.97, "learning_rate": 4.10995859350205e-06, "loss": 2.3334, "step": 36169 }, { "epoch": 0.97, "learning_rate": 4.102079177786488e-06, "loss": 2.6121, "step": 36170 }, { "epoch": 0.97, "learning_rate": 4.094207306815645e-06, "loss": 2.5326, "step": 36171 }, { "epoch": 0.97, "learning_rate": 4.086342980649027e-06, "loss": 2.3901, "step": 36172 }, { "epoch": 0.97, "learning_rate": 4.078486199346143e-06, "loss": 2.8732, "step": 36173 }, { "epoch": 0.97, "learning_rate": 4.070636962966723e-06, "loss": 2.7217, "step": 36174 }, { "epoch": 0.97, "learning_rate": 4.062795271570052e-06, "loss": 3.0199, "step": 36175 }, { "epoch": 0.97, "learning_rate": 4.054961125215528e-06, "loss": 2.3142, "step": 36176 }, { "epoch": 0.97, "learning_rate": 4.047134523962659e-06, "loss": 2.4658, "step": 36177 }, { "epoch": 0.97, "learning_rate": 4.039315467870619e-06, "loss": 2.1593, "step": 36178 }, { "epoch": 0.97, "learning_rate": 4.031503956998583e-06, "loss": 1.9862, "step": 36179 }, { "epoch": 0.97, "learning_rate": 4.023699991405838e-06, "loss": 2.6443, "step": 36180 }, { "epoch": 0.97, "learning_rate": 4.015903571151558e-06, "loss": 2.4656, "step": 36181 }, { "epoch": 0.97, "learning_rate": 4.008114696294696e-06, "loss": 2.2602, "step": 36182 }, { "epoch": 0.97, "learning_rate": 4.000333366894204e-06, "loss": 2.3664, "step": 36183 }, { "epoch": 0.97, "learning_rate": 3.992559583009148e-06, "loss": 3.0684, "step": 36184 }, { "epoch": 0.97, "learning_rate": 3.9847933446984786e-06, "loss": 2.0519, "step": 36185 }, { "epoch": 0.97, "learning_rate": 3.977034652020817e-06, "loss": 2.446, "step": 36186 }, { "epoch": 0.97, "learning_rate": 3.969283505035115e-06, "loss": 2.2667, "step": 36187 }, { "epoch": 0.97, "learning_rate": 3.9615399038001045e-06, "loss": 2.4313, "step": 36188 }, { "epoch": 0.97, "learning_rate": 3.953803848374404e-06, "loss": 2.5526, "step": 36189 }, { "epoch": 0.97, "learning_rate": 3.946075338816524e-06, "loss": 2.1035, "step": 36190 }, { "epoch": 0.97, "learning_rate": 3.938354375185193e-06, "loss": 2.3493, "step": 36191 }, { "epoch": 0.97, "learning_rate": 3.930640957538701e-06, "loss": 2.5036, "step": 36192 }, { "epoch": 0.97, "learning_rate": 3.922935085935664e-06, "loss": 2.3844, "step": 36193 }, { "epoch": 0.97, "learning_rate": 3.915236760434371e-06, "loss": 2.4463, "step": 36194 }, { "epoch": 0.97, "learning_rate": 3.907545981093108e-06, "loss": 2.4892, "step": 36195 }, { "epoch": 0.97, "learning_rate": 3.899862747970273e-06, "loss": 2.7253, "step": 36196 }, { "epoch": 0.97, "learning_rate": 3.892187061124041e-06, "loss": 2.4864, "step": 36197 }, { "epoch": 0.97, "learning_rate": 3.884518920612367e-06, "loss": 2.4833, "step": 36198 }, { "epoch": 0.97, "learning_rate": 3.876858326493537e-06, "loss": 2.5078, "step": 36199 }, { "epoch": 0.97, "learning_rate": 3.869205278825616e-06, "loss": 2.6784, "step": 36200 }, { "epoch": 0.97, "learning_rate": 3.861559777666446e-06, "loss": 2.4989, "step": 36201 }, { "epoch": 0.97, "learning_rate": 3.85392182307398e-06, "loss": 2.6544, "step": 36202 }, { "epoch": 0.97, "learning_rate": 3.846291415106174e-06, "loss": 2.3223, "step": 36203 }, { "epoch": 0.97, "learning_rate": 3.838668553820756e-06, "loss": 2.6812, "step": 36204 }, { "epoch": 0.97, "learning_rate": 3.831053239275351e-06, "loss": 2.4359, "step": 36205 }, { "epoch": 0.97, "learning_rate": 3.82344547152802e-06, "loss": 2.3445, "step": 36206 }, { "epoch": 0.97, "learning_rate": 3.815845250636052e-06, "loss": 2.8666, "step": 36207 }, { "epoch": 0.97, "learning_rate": 3.8082525766570675e-06, "loss": 2.2586, "step": 36208 }, { "epoch": 0.97, "learning_rate": 3.800667449648798e-06, "loss": 2.4781, "step": 36209 }, { "epoch": 0.97, "learning_rate": 3.79308986966842e-06, "loss": 2.7763, "step": 36210 }, { "epoch": 0.97, "learning_rate": 3.7855198367735545e-06, "loss": 2.0017, "step": 36211 }, { "epoch": 0.97, "learning_rate": 3.777957351021488e-06, "loss": 2.4445, "step": 36212 }, { "epoch": 0.97, "learning_rate": 3.7704024124695093e-06, "loss": 2.2873, "step": 36213 }, { "epoch": 0.97, "learning_rate": 3.7628550211749045e-06, "loss": 2.5332, "step": 36214 }, { "epoch": 0.97, "learning_rate": 3.7553151771947402e-06, "loss": 2.3671, "step": 36215 }, { "epoch": 0.97, "learning_rate": 3.7477828805861926e-06, "loss": 2.4249, "step": 36216 }, { "epoch": 0.97, "learning_rate": 3.7402581314063266e-06, "loss": 2.8093, "step": 36217 }, { "epoch": 0.97, "learning_rate": 3.732740929712208e-06, "loss": 2.2625, "step": 36218 }, { "epoch": 0.97, "learning_rate": 3.725231275560681e-06, "loss": 2.675, "step": 36219 }, { "epoch": 0.97, "learning_rate": 3.717729169008699e-06, "loss": 2.3481, "step": 36220 }, { "epoch": 0.97, "learning_rate": 3.7102346101131056e-06, "loss": 2.8174, "step": 36221 }, { "epoch": 0.97, "learning_rate": 3.7027475989306336e-06, "loss": 2.469, "step": 36222 }, { "epoch": 0.97, "learning_rate": 3.695268135518015e-06, "loss": 2.379, "step": 36223 }, { "epoch": 0.97, "learning_rate": 3.6877962199318714e-06, "loss": 2.4149, "step": 36224 }, { "epoch": 0.97, "learning_rate": 3.6803318522289353e-06, "loss": 2.4487, "step": 36225 }, { "epoch": 0.97, "learning_rate": 3.6728750324656056e-06, "loss": 2.5835, "step": 36226 }, { "epoch": 0.97, "learning_rate": 3.6654257606985044e-06, "loss": 2.5262, "step": 36227 }, { "epoch": 0.97, "learning_rate": 3.65798403698403e-06, "loss": 2.2505, "step": 36228 }, { "epoch": 0.97, "learning_rate": 3.6505498613785826e-06, "loss": 1.8875, "step": 36229 }, { "epoch": 0.97, "learning_rate": 3.643123233938339e-06, "loss": 2.4973, "step": 36230 }, { "epoch": 0.97, "learning_rate": 3.635704154719699e-06, "loss": 2.2641, "step": 36231 }, { "epoch": 0.97, "learning_rate": 3.6282926237787283e-06, "loss": 2.6916, "step": 36232 }, { "epoch": 0.97, "learning_rate": 3.6208886411718267e-06, "loss": 2.3964, "step": 36233 }, { "epoch": 0.97, "learning_rate": 3.6134922069549493e-06, "loss": 2.1348, "step": 36234 }, { "epoch": 0.97, "learning_rate": 3.60610332118394e-06, "loss": 2.393, "step": 36235 }, { "epoch": 0.97, "learning_rate": 3.5987219839151985e-06, "loss": 2.6732, "step": 36236 }, { "epoch": 0.97, "learning_rate": 3.591348195204236e-06, "loss": 2.7359, "step": 36237 }, { "epoch": 0.97, "learning_rate": 3.5839819551070076e-06, "loss": 2.0468, "step": 36238 }, { "epoch": 0.97, "learning_rate": 3.576623263679579e-06, "loss": 2.5279, "step": 36239 }, { "epoch": 0.97, "learning_rate": 3.5692721209773515e-06, "loss": 2.2782, "step": 36240 }, { "epoch": 0.97, "learning_rate": 3.5619285270562794e-06, "loss": 2.1648, "step": 36241 }, { "epoch": 0.97, "learning_rate": 3.5545924819718746e-06, "loss": 2.098, "step": 36242 }, { "epoch": 0.97, "learning_rate": 3.5472639857796473e-06, "loss": 2.1475, "step": 36243 }, { "epoch": 0.97, "learning_rate": 3.5399430385353314e-06, "loss": 2.4615, "step": 36244 }, { "epoch": 0.97, "learning_rate": 3.532629640294105e-06, "loss": 2.6106, "step": 36245 }, { "epoch": 0.97, "learning_rate": 3.5253237911115898e-06, "loss": 2.2415, "step": 36246 }, { "epoch": 0.97, "learning_rate": 3.5180254910431863e-06, "loss": 2.5877, "step": 36247 }, { "epoch": 0.97, "learning_rate": 3.5107347401439616e-06, "loss": 2.2278, "step": 36248 }, { "epoch": 0.97, "learning_rate": 3.5034515384692043e-06, "loss": 2.4128, "step": 36249 }, { "epoch": 0.97, "learning_rate": 3.4961758860742044e-06, "loss": 2.5136, "step": 36250 }, { "epoch": 0.97, "learning_rate": 3.4889077830140283e-06, "loss": 2.5324, "step": 36251 }, { "epoch": 0.97, "learning_rate": 3.481647229343743e-06, "loss": 2.3049, "step": 36252 }, { "epoch": 0.97, "learning_rate": 3.4743942251183045e-06, "loss": 2.4839, "step": 36253 }, { "epoch": 0.97, "learning_rate": 3.4671487703926696e-06, "loss": 2.164, "step": 36254 }, { "epoch": 0.97, "learning_rate": 3.4599108652217935e-06, "loss": 2.8118, "step": 36255 }, { "epoch": 0.97, "learning_rate": 3.4526805096604107e-06, "loss": 3.0411, "step": 36256 }, { "epoch": 0.97, "learning_rate": 3.4454577037633663e-06, "loss": 2.2742, "step": 36257 }, { "epoch": 0.97, "learning_rate": 3.4382424475853937e-06, "loss": 2.1709, "step": 36258 }, { "epoch": 0.97, "learning_rate": 3.431034741181116e-06, "loss": 2.1196, "step": 36259 }, { "epoch": 0.97, "learning_rate": 3.4238345846051566e-06, "loss": 2.426, "step": 36260 }, { "epoch": 0.97, "learning_rate": 3.416641977912138e-06, "loss": 2.6751, "step": 36261 }, { "epoch": 0.97, "learning_rate": 3.409456921156351e-06, "loss": 2.4263, "step": 36262 }, { "epoch": 0.97, "learning_rate": 3.4022794143924173e-06, "loss": 2.3108, "step": 36263 }, { "epoch": 0.97, "learning_rate": 3.3951094576745167e-06, "loss": 2.2591, "step": 36264 }, { "epoch": 0.97, "learning_rate": 3.3879470510571606e-06, "loss": 2.7715, "step": 36265 }, { "epoch": 0.97, "learning_rate": 3.3807921945946397e-06, "loss": 2.6465, "step": 36266 }, { "epoch": 0.97, "learning_rate": 3.37364488834091e-06, "loss": 2.8695, "step": 36267 }, { "epoch": 0.97, "learning_rate": 3.3665051323503725e-06, "loss": 2.7735, "step": 36268 }, { "epoch": 0.97, "learning_rate": 3.3593729266769845e-06, "loss": 2.4756, "step": 36269 }, { "epoch": 0.97, "learning_rate": 3.3522482713748135e-06, "loss": 2.0691, "step": 36270 }, { "epoch": 0.97, "learning_rate": 3.3451311664978167e-06, "loss": 2.9744, "step": 36271 }, { "epoch": 0.97, "learning_rate": 3.33802161209984e-06, "loss": 2.2375, "step": 36272 }, { "epoch": 0.97, "learning_rate": 3.33091960823495e-06, "loss": 2.304, "step": 36273 }, { "epoch": 0.97, "learning_rate": 3.3238251549567722e-06, "loss": 2.3426, "step": 36274 }, { "epoch": 0.97, "learning_rate": 3.3167382523190403e-06, "loss": 2.5576, "step": 36275 }, { "epoch": 0.97, "learning_rate": 3.3096589003756005e-06, "loss": 2.3368, "step": 36276 }, { "epoch": 0.97, "learning_rate": 3.3025870991799655e-06, "loss": 2.6067, "step": 36277 }, { "epoch": 0.97, "learning_rate": 3.2955228487857593e-06, "loss": 2.3108, "step": 36278 }, { "epoch": 0.97, "learning_rate": 3.288466149246383e-06, "loss": 3.0528, "step": 36279 }, { "epoch": 0.97, "learning_rate": 3.281417000615461e-06, "loss": 2.5454, "step": 36280 }, { "epoch": 0.98, "learning_rate": 3.2743754029463944e-06, "loss": 2.6217, "step": 36281 }, { "epoch": 0.98, "learning_rate": 3.2673413562923637e-06, "loss": 2.7647, "step": 36282 }, { "epoch": 0.98, "learning_rate": 3.2603148607067703e-06, "loss": 2.0342, "step": 36283 }, { "epoch": 0.98, "learning_rate": 3.2532959162429043e-06, "loss": 2.3798, "step": 36284 }, { "epoch": 0.98, "learning_rate": 3.246284522953835e-06, "loss": 2.665, "step": 36285 }, { "epoch": 0.98, "learning_rate": 3.239280680892631e-06, "loss": 2.2899, "step": 36286 }, { "epoch": 0.98, "learning_rate": 3.2322843901124723e-06, "loss": 2.5308, "step": 36287 }, { "epoch": 0.98, "learning_rate": 3.2252956506664264e-06, "loss": 2.2856, "step": 36288 }, { "epoch": 0.98, "learning_rate": 3.21831446260723e-06, "loss": 2.3147, "step": 36289 }, { "epoch": 0.98, "learning_rate": 3.2113408259878406e-06, "loss": 2.4509, "step": 36290 }, { "epoch": 0.98, "learning_rate": 3.2043747408612157e-06, "loss": 2.2207, "step": 36291 }, { "epoch": 0.98, "learning_rate": 3.1974162072799797e-06, "loss": 2.8402, "step": 36292 }, { "epoch": 0.98, "learning_rate": 3.190465225296868e-06, "loss": 2.0828, "step": 36293 }, { "epoch": 0.98, "learning_rate": 3.183521794964728e-06, "loss": 2.3133, "step": 36294 }, { "epoch": 0.98, "learning_rate": 3.17658591633585e-06, "loss": 2.3989, "step": 36295 }, { "epoch": 0.98, "learning_rate": 3.169657589463082e-06, "loss": 2.6922, "step": 36296 }, { "epoch": 0.98, "learning_rate": 3.1627368143987147e-06, "loss": 2.7483, "step": 36297 }, { "epoch": 0.98, "learning_rate": 3.1558235911951505e-06, "loss": 2.5673, "step": 36298 }, { "epoch": 0.98, "learning_rate": 3.1489179199049034e-06, "loss": 2.2892, "step": 36299 }, { "epoch": 0.98, "learning_rate": 3.1420198005802646e-06, "loss": 1.9758, "step": 36300 }, { "epoch": 0.98, "learning_rate": 3.135129233273526e-06, "loss": 2.3898, "step": 36301 }, { "epoch": 0.98, "learning_rate": 3.1282462180366457e-06, "loss": 2.6052, "step": 36302 }, { "epoch": 0.98, "learning_rate": 3.121370754922137e-06, "loss": 2.4247, "step": 36303 }, { "epoch": 0.98, "learning_rate": 3.114502843981737e-06, "loss": 2.515, "step": 36304 }, { "epoch": 0.98, "learning_rate": 3.1076424852677365e-06, "loss": 2.4022, "step": 36305 }, { "epoch": 0.98, "learning_rate": 3.1007896788319834e-06, "loss": 2.2736, "step": 36306 }, { "epoch": 0.98, "learning_rate": 3.0939444247264357e-06, "loss": 2.4052, "step": 36307 }, { "epoch": 0.98, "learning_rate": 3.0871067230029413e-06, "loss": 2.2883, "step": 36308 }, { "epoch": 0.98, "learning_rate": 3.0802765737132365e-06, "loss": 2.5308, "step": 36309 }, { "epoch": 0.98, "learning_rate": 3.0734539769091685e-06, "loss": 2.5141, "step": 36310 }, { "epoch": 0.98, "learning_rate": 3.066638932642363e-06, "loss": 1.9299, "step": 36311 }, { "epoch": 0.98, "learning_rate": 3.0598314409644445e-06, "loss": 2.1374, "step": 36312 }, { "epoch": 0.98, "learning_rate": 3.0530315019270395e-06, "loss": 2.4493, "step": 36313 }, { "epoch": 0.98, "learning_rate": 3.0462391155816616e-06, "loss": 2.4518, "step": 36314 }, { "epoch": 0.98, "learning_rate": 3.0394542819797142e-06, "loss": 1.9079, "step": 36315 }, { "epoch": 0.98, "learning_rate": 3.0326770011726013e-06, "loss": 2.7475, "step": 36316 }, { "epoch": 0.98, "learning_rate": 3.0259072732117253e-06, "loss": 2.0918, "step": 36317 }, { "epoch": 0.98, "learning_rate": 3.0191450981482684e-06, "loss": 2.2147, "step": 36318 }, { "epoch": 0.98, "learning_rate": 3.012390476033522e-06, "loss": 2.6728, "step": 36319 }, { "epoch": 0.98, "learning_rate": 3.005643406918779e-06, "loss": 2.5045, "step": 36320 }, { "epoch": 0.98, "learning_rate": 2.998903890854887e-06, "loss": 2.6015, "step": 36321 }, { "epoch": 0.98, "learning_rate": 2.9921719278931393e-06, "loss": 2.4282, "step": 36322 }, { "epoch": 0.98, "learning_rate": 2.985447518084383e-06, "loss": 2.7047, "step": 36323 }, { "epoch": 0.98, "learning_rate": 2.9787306614796893e-06, "loss": 2.3961, "step": 36324 }, { "epoch": 0.98, "learning_rate": 2.972021358129906e-06, "loss": 2.0909, "step": 36325 }, { "epoch": 0.98, "learning_rate": 2.9653196080857703e-06, "loss": 2.0347, "step": 36326 }, { "epoch": 0.98, "learning_rate": 2.9586254113981304e-06, "loss": 1.9605, "step": 36327 }, { "epoch": 0.98, "learning_rate": 2.9519387681177233e-06, "loss": 2.2306, "step": 36328 }, { "epoch": 0.98, "learning_rate": 2.9452596782951758e-06, "loss": 2.7831, "step": 36329 }, { "epoch": 0.98, "learning_rate": 2.9385881419810024e-06, "loss": 2.1035, "step": 36330 }, { "epoch": 0.98, "learning_rate": 2.9319241592259404e-06, "loss": 2.1181, "step": 36331 }, { "epoch": 0.98, "learning_rate": 2.9252677300802833e-06, "loss": 2.2103, "step": 36332 }, { "epoch": 0.98, "learning_rate": 2.918618854594546e-06, "loss": 2.3308, "step": 36333 }, { "epoch": 0.98, "learning_rate": 2.911977532819132e-06, "loss": 2.6354, "step": 36334 }, { "epoch": 0.98, "learning_rate": 2.9053437648043356e-06, "loss": 2.4401, "step": 36335 }, { "epoch": 0.98, "learning_rate": 2.8987175506003382e-06, "loss": 2.5076, "step": 36336 }, { "epoch": 0.98, "learning_rate": 2.892098890257322e-06, "loss": 2.2947, "step": 36337 }, { "epoch": 0.98, "learning_rate": 2.88548778382558e-06, "loss": 2.2053, "step": 36338 }, { "epoch": 0.98, "learning_rate": 2.878884231355183e-06, "loss": 2.1, "step": 36339 }, { "epoch": 0.98, "learning_rate": 2.872288232895981e-06, "loss": 2.4083, "step": 36340 }, { "epoch": 0.98, "learning_rate": 2.865699788498155e-06, "loss": 2.5037, "step": 36341 }, { "epoch": 0.98, "learning_rate": 2.8591188982114436e-06, "loss": 2.4701, "step": 36342 }, { "epoch": 0.98, "learning_rate": 2.8525455620856953e-06, "loss": 2.5402, "step": 36343 }, { "epoch": 0.98, "learning_rate": 2.845979780170871e-06, "loss": 2.5802, "step": 36344 }, { "epoch": 0.98, "learning_rate": 2.8394215525167076e-06, "loss": 2.4248, "step": 36345 }, { "epoch": 0.98, "learning_rate": 2.832870879172722e-06, "loss": 2.2338, "step": 36346 }, { "epoch": 0.98, "learning_rate": 2.826327760188652e-06, "loss": 2.3319, "step": 36347 }, { "epoch": 0.98, "learning_rate": 2.8197921956140127e-06, "loss": 2.3046, "step": 36348 }, { "epoch": 0.98, "learning_rate": 2.813264185498432e-06, "loss": 2.6027, "step": 36349 }, { "epoch": 0.98, "learning_rate": 2.8067437298912035e-06, "loss": 2.8538, "step": 36350 }, { "epoch": 0.98, "learning_rate": 2.800230828841843e-06, "loss": 2.2586, "step": 36351 }, { "epoch": 0.98, "learning_rate": 2.793725482399645e-06, "loss": 2.1935, "step": 36352 }, { "epoch": 0.98, "learning_rate": 2.7872276906137915e-06, "loss": 2.2819, "step": 36353 }, { "epoch": 0.98, "learning_rate": 2.7807374535337995e-06, "loss": 2.2154, "step": 36354 }, { "epoch": 0.98, "learning_rate": 2.7742547712085177e-06, "loss": 2.9595, "step": 36355 }, { "epoch": 0.98, "learning_rate": 2.7677796436872406e-06, "loss": 2.5343, "step": 36356 }, { "epoch": 0.98, "learning_rate": 2.7613120710190396e-06, "loss": 2.4795, "step": 36357 }, { "epoch": 0.98, "learning_rate": 2.7548520532527653e-06, "loss": 2.0792, "step": 36358 }, { "epoch": 0.98, "learning_rate": 2.7483995904373784e-06, "loss": 2.5252, "step": 36359 }, { "epoch": 0.98, "learning_rate": 2.74195468262195e-06, "loss": 2.6194, "step": 36360 }, { "epoch": 0.98, "learning_rate": 2.7355173298552195e-06, "loss": 2.5811, "step": 36361 }, { "epoch": 0.98, "learning_rate": 2.7290875321858144e-06, "loss": 2.3781, "step": 36362 }, { "epoch": 0.98, "learning_rate": 2.7226652896624738e-06, "loss": 2.3773, "step": 36363 }, { "epoch": 0.98, "learning_rate": 2.7162506023340472e-06, "loss": 2.5921, "step": 36364 }, { "epoch": 0.98, "learning_rate": 2.7098434702490516e-06, "loss": 2.3862, "step": 36365 }, { "epoch": 0.98, "learning_rate": 2.7034438934558923e-06, "loss": 2.9932, "step": 36366 }, { "epoch": 0.98, "learning_rate": 2.697051872003087e-06, "loss": 2.6945, "step": 36367 }, { "epoch": 0.98, "learning_rate": 2.6906674059392623e-06, "loss": 2.3765, "step": 36368 }, { "epoch": 0.98, "learning_rate": 2.6842904953126024e-06, "loss": 2.5269, "step": 36369 }, { "epoch": 0.98, "learning_rate": 2.677921140171402e-06, "loss": 2.6826, "step": 36370 }, { "epoch": 0.98, "learning_rate": 2.671559340563956e-06, "loss": 2.333, "step": 36371 }, { "epoch": 0.98, "learning_rate": 2.6652050965384476e-06, "loss": 2.6254, "step": 36372 }, { "epoch": 0.98, "learning_rate": 2.6588584081431723e-06, "loss": 2.4513, "step": 36373 }, { "epoch": 0.98, "learning_rate": 2.65251927542598e-06, "loss": 2.6362, "step": 36374 }, { "epoch": 0.98, "learning_rate": 2.646187698434943e-06, "loss": 2.0793, "step": 36375 }, { "epoch": 0.98, "learning_rate": 2.639863677218135e-06, "loss": 2.6019, "step": 36376 }, { "epoch": 0.98, "learning_rate": 2.633547211823406e-06, "loss": 2.4107, "step": 36377 }, { "epoch": 0.98, "learning_rate": 2.627238302298607e-06, "loss": 1.6682, "step": 36378 }, { "epoch": 0.98, "learning_rate": 2.620936948691588e-06, "loss": 2.2556, "step": 36379 }, { "epoch": 0.98, "learning_rate": 2.6146431510499778e-06, "loss": 2.6275, "step": 36380 }, { "epoch": 0.98, "learning_rate": 2.6083569094216273e-06, "loss": 2.5827, "step": 36381 }, { "epoch": 0.98, "learning_rate": 2.602078223853943e-06, "loss": 2.6744, "step": 36382 }, { "epoch": 0.98, "learning_rate": 2.5958070943945533e-06, "loss": 2.6854, "step": 36383 }, { "epoch": 0.98, "learning_rate": 2.5895435210910867e-06, "loss": 2.7443, "step": 36384 }, { "epoch": 0.98, "learning_rate": 2.5832875039909498e-06, "loss": 2.5696, "step": 36385 }, { "epoch": 0.98, "learning_rate": 2.577039043141438e-06, "loss": 2.8725, "step": 36386 }, { "epoch": 0.98, "learning_rate": 2.5707981385899583e-06, "loss": 2.4668, "step": 36387 }, { "epoch": 0.98, "learning_rate": 2.5645647903838054e-06, "loss": 2.617, "step": 36388 }, { "epoch": 0.98, "learning_rate": 2.5583389985701645e-06, "loss": 3.0213, "step": 36389 }, { "epoch": 0.98, "learning_rate": 2.5521207631962196e-06, "loss": 2.5881, "step": 36390 }, { "epoch": 0.98, "learning_rate": 2.5459100843091554e-06, "loss": 2.522, "step": 36391 }, { "epoch": 0.98, "learning_rate": 2.5397069619558235e-06, "loss": 3.1026, "step": 36392 }, { "epoch": 0.98, "learning_rate": 2.533511396183408e-06, "loss": 2.9181, "step": 36393 }, { "epoch": 0.98, "learning_rate": 2.5273233870388714e-06, "loss": 2.6806, "step": 36394 }, { "epoch": 0.98, "learning_rate": 2.521142934568843e-06, "loss": 2.462, "step": 36395 }, { "epoch": 0.98, "learning_rate": 2.5149700388203967e-06, "loss": 2.3394, "step": 36396 }, { "epoch": 0.98, "learning_rate": 2.5088046998401616e-06, "loss": 2.1535, "step": 36397 }, { "epoch": 0.98, "learning_rate": 2.502646917674878e-06, "loss": 2.5223, "step": 36398 }, { "epoch": 0.98, "learning_rate": 2.4964966923712863e-06, "loss": 2.5004, "step": 36399 }, { "epoch": 0.98, "learning_rate": 2.490354023975905e-06, "loss": 2.3515, "step": 36400 }, { "epoch": 0.98, "learning_rate": 2.4842189125351413e-06, "loss": 2.3621, "step": 36401 }, { "epoch": 0.98, "learning_rate": 2.4780913580956243e-06, "loss": 1.984, "step": 36402 }, { "epoch": 0.98, "learning_rate": 2.471971360703762e-06, "loss": 3.1573, "step": 36403 }, { "epoch": 0.98, "learning_rate": 2.4658589204059613e-06, "loss": 2.7062, "step": 36404 }, { "epoch": 0.98, "learning_rate": 2.4597540372484074e-06, "loss": 2.7265, "step": 36405 }, { "epoch": 0.98, "learning_rate": 2.4536567112775076e-06, "loss": 2.2699, "step": 36406 }, { "epoch": 0.98, "learning_rate": 2.4475669425392256e-06, "loss": 2.329, "step": 36407 }, { "epoch": 0.98, "learning_rate": 2.441484731079968e-06, "loss": 2.6354, "step": 36408 }, { "epoch": 0.98, "learning_rate": 2.435410076945588e-06, "loss": 2.6402, "step": 36409 }, { "epoch": 0.98, "learning_rate": 2.429342980182159e-06, "loss": 2.7479, "step": 36410 }, { "epoch": 0.98, "learning_rate": 2.423283440835755e-06, "loss": 2.0866, "step": 36411 }, { "epoch": 0.98, "learning_rate": 2.4172314589522292e-06, "loss": 2.2168, "step": 36412 }, { "epoch": 0.98, "learning_rate": 2.4111870345773225e-06, "loss": 2.6103, "step": 36413 }, { "epoch": 0.98, "learning_rate": 2.4051501677569976e-06, "loss": 2.9861, "step": 36414 }, { "epoch": 0.98, "learning_rate": 2.399120858536774e-06, "loss": 2.488, "step": 36415 }, { "epoch": 0.98, "learning_rate": 2.3930991069625042e-06, "loss": 2.1139, "step": 36416 }, { "epoch": 0.98, "learning_rate": 2.387084913079818e-06, "loss": 2.3743, "step": 36417 }, { "epoch": 0.98, "learning_rate": 2.3810782769342345e-06, "loss": 2.4772, "step": 36418 }, { "epoch": 0.98, "learning_rate": 2.3750791985711616e-06, "loss": 2.4147, "step": 36419 }, { "epoch": 0.98, "learning_rate": 2.3690876780362304e-06, "loss": 2.7936, "step": 36420 }, { "epoch": 0.98, "learning_rate": 2.363103715374626e-06, "loss": 2.3595, "step": 36421 }, { "epoch": 0.98, "learning_rate": 2.357127310631757e-06, "loss": 2.4402, "step": 36422 }, { "epoch": 0.98, "learning_rate": 2.3511584638530315e-06, "loss": 2.6504, "step": 36423 }, { "epoch": 0.98, "learning_rate": 2.3451971750836352e-06, "loss": 2.7155, "step": 36424 }, { "epoch": 0.98, "learning_rate": 2.339243444368533e-06, "loss": 2.3636, "step": 36425 }, { "epoch": 0.98, "learning_rate": 2.33329727175291e-06, "loss": 2.1456, "step": 36426 }, { "epoch": 0.98, "learning_rate": 2.327358657281953e-06, "loss": 2.3946, "step": 36427 }, { "epoch": 0.98, "learning_rate": 2.321427601000625e-06, "loss": 2.4824, "step": 36428 }, { "epoch": 0.98, "learning_rate": 2.3155041029536693e-06, "loss": 2.8935, "step": 36429 }, { "epoch": 0.98, "learning_rate": 2.3095881631861603e-06, "loss": 2.6006, "step": 36430 }, { "epoch": 0.98, "learning_rate": 2.303679781742729e-06, "loss": 2.3226, "step": 36431 }, { "epoch": 0.98, "learning_rate": 2.2977789586683394e-06, "loss": 2.8302, "step": 36432 }, { "epoch": 0.98, "learning_rate": 2.291885694007623e-06, "loss": 2.3465, "step": 36433 }, { "epoch": 0.98, "learning_rate": 2.2859999878052097e-06, "loss": 2.7281, "step": 36434 }, { "epoch": 0.98, "learning_rate": 2.28012184010562e-06, "loss": 2.9303, "step": 36435 }, { "epoch": 0.98, "learning_rate": 2.274251250953485e-06, "loss": 2.2127, "step": 36436 }, { "epoch": 0.98, "learning_rate": 2.2683882203932137e-06, "loss": 2.287, "step": 36437 }, { "epoch": 0.98, "learning_rate": 2.262532748469326e-06, "loss": 2.3303, "step": 36438 }, { "epoch": 0.98, "learning_rate": 2.2566848352261193e-06, "loss": 2.4811, "step": 36439 }, { "epoch": 0.98, "learning_rate": 2.250844480707781e-06, "loss": 2.8875, "step": 36440 }, { "epoch": 0.98, "learning_rate": 2.245011684958831e-06, "loss": 2.2351, "step": 36441 }, { "epoch": 0.98, "learning_rate": 2.239186448023123e-06, "loss": 2.5712, "step": 36442 }, { "epoch": 0.98, "learning_rate": 2.2333687699450653e-06, "loss": 2.3917, "step": 36443 }, { "epoch": 0.98, "learning_rate": 2.227558650768513e-06, "loss": 2.5789, "step": 36444 }, { "epoch": 0.98, "learning_rate": 2.2217560905376523e-06, "loss": 2.5604, "step": 36445 }, { "epoch": 0.98, "learning_rate": 2.215961089296448e-06, "loss": 2.474, "step": 36446 }, { "epoch": 0.98, "learning_rate": 2.2101736470886423e-06, "loss": 2.5351, "step": 36447 }, { "epoch": 0.98, "learning_rate": 2.2043937639582013e-06, "loss": 2.3019, "step": 36448 }, { "epoch": 0.98, "learning_rate": 2.198621439948867e-06, "loss": 2.4374, "step": 36449 }, { "epoch": 0.98, "learning_rate": 2.1928566751043823e-06, "loss": 2.5974, "step": 36450 }, { "epoch": 0.98, "learning_rate": 2.18709946946849e-06, "loss": 2.5597, "step": 36451 }, { "epoch": 0.98, "learning_rate": 2.1813498230847107e-06, "loss": 2.1701, "step": 36452 }, { "epoch": 0.98, "learning_rate": 2.1756077359965654e-06, "loss": 2.4203, "step": 36453 }, { "epoch": 0.98, "learning_rate": 2.1698732082476855e-06, "loss": 2.8702, "step": 36454 }, { "epoch": 0.98, "learning_rate": 2.1641462398814816e-06, "loss": 2.1722, "step": 36455 }, { "epoch": 0.98, "learning_rate": 2.1584268309411405e-06, "loss": 2.4779, "step": 36456 }, { "epoch": 0.98, "learning_rate": 2.152714981470405e-06, "loss": 2.5595, "step": 36457 }, { "epoch": 0.98, "learning_rate": 2.14701069151213e-06, "loss": 2.5848, "step": 36458 }, { "epoch": 0.98, "learning_rate": 2.1413139611098363e-06, "loss": 2.7325, "step": 36459 }, { "epoch": 0.98, "learning_rate": 2.1356247903063785e-06, "loss": 2.4383, "step": 36460 }, { "epoch": 0.98, "learning_rate": 2.1299431791451664e-06, "loss": 2.4682, "step": 36461 }, { "epoch": 0.98, "learning_rate": 2.124269127669054e-06, "loss": 2.4634, "step": 36462 }, { "epoch": 0.98, "learning_rate": 2.1186026359210076e-06, "loss": 2.9246, "step": 36463 }, { "epoch": 0.98, "learning_rate": 2.1129437039441037e-06, "loss": 2.7306, "step": 36464 }, { "epoch": 0.98, "learning_rate": 2.1072923317810855e-06, "loss": 2.5558, "step": 36465 }, { "epoch": 0.98, "learning_rate": 2.101648519474919e-06, "loss": 2.4859, "step": 36466 }, { "epoch": 0.98, "learning_rate": 2.096012267068126e-06, "loss": 2.3263, "step": 36467 }, { "epoch": 0.98, "learning_rate": 2.0903835746036713e-06, "loss": 2.0929, "step": 36468 }, { "epoch": 0.98, "learning_rate": 2.0847624421238555e-06, "loss": 2.2908, "step": 36469 }, { "epoch": 0.98, "learning_rate": 2.079148869671643e-06, "loss": 2.4853, "step": 36470 }, { "epoch": 0.98, "learning_rate": 2.0735428572893347e-06, "loss": 1.8922, "step": 36471 }, { "epoch": 0.98, "learning_rate": 2.0679444050194506e-06, "loss": 2.2695, "step": 36472 }, { "epoch": 0.98, "learning_rate": 2.0623535129045133e-06, "loss": 2.3749, "step": 36473 }, { "epoch": 0.98, "learning_rate": 2.0567701809866e-06, "loss": 2.2329, "step": 36474 }, { "epoch": 0.98, "learning_rate": 2.0511944093082326e-06, "loss": 2.8816, "step": 36475 }, { "epoch": 0.98, "learning_rate": 2.0456261979115985e-06, "loss": 2.6808, "step": 36476 }, { "epoch": 0.98, "learning_rate": 2.0400655468388874e-06, "loss": 2.0897, "step": 36477 }, { "epoch": 0.98, "learning_rate": 2.034512456132287e-06, "loss": 2.6192, "step": 36478 }, { "epoch": 0.98, "learning_rate": 2.028966925833764e-06, "loss": 2.4474, "step": 36479 }, { "epoch": 0.98, "learning_rate": 2.023428955985396e-06, "loss": 2.7284, "step": 36480 }, { "epoch": 0.98, "learning_rate": 2.017898546629038e-06, "loss": 2.4392, "step": 36481 }, { "epoch": 0.98, "learning_rate": 2.0123756978066564e-06, "loss": 2.4762, "step": 36482 }, { "epoch": 0.98, "learning_rate": 2.0068604095601074e-06, "loss": 2.412, "step": 36483 }, { "epoch": 0.98, "learning_rate": 2.0013526819312456e-06, "loss": 2.5379, "step": 36484 }, { "epoch": 0.98, "learning_rate": 1.9958525149615934e-06, "loss": 2.5454, "step": 36485 }, { "epoch": 0.98, "learning_rate": 1.990359908693007e-06, "loss": 2.5488, "step": 36486 }, { "epoch": 0.98, "learning_rate": 1.9848748631670076e-06, "loss": 2.6713, "step": 36487 }, { "epoch": 0.98, "learning_rate": 1.9793973784251183e-06, "loss": 2.4394, "step": 36488 }, { "epoch": 0.98, "learning_rate": 1.9739274545089725e-06, "loss": 2.0783, "step": 36489 }, { "epoch": 0.98, "learning_rate": 1.9684650914598703e-06, "loss": 2.3691, "step": 36490 }, { "epoch": 0.98, "learning_rate": 1.9630102893192226e-06, "loss": 2.8259, "step": 36491 }, { "epoch": 0.98, "learning_rate": 1.957563048128441e-06, "loss": 2.5342, "step": 36492 }, { "epoch": 0.98, "learning_rate": 1.9521233679287154e-06, "loss": 2.0764, "step": 36493 }, { "epoch": 0.98, "learning_rate": 1.9466912487612344e-06, "loss": 2.3059, "step": 36494 }, { "epoch": 0.98, "learning_rate": 1.941266690667187e-06, "loss": 2.3069, "step": 36495 }, { "epoch": 0.98, "learning_rate": 1.9358496936876526e-06, "loss": 2.6461, "step": 36496 }, { "epoch": 0.98, "learning_rate": 1.930440257863708e-06, "loss": 1.9598, "step": 36497 }, { "epoch": 0.98, "learning_rate": 1.9250383832363216e-06, "loss": 2.8509, "step": 36498 }, { "epoch": 0.98, "learning_rate": 1.9196440698463493e-06, "loss": 1.8612, "step": 36499 }, { "epoch": 0.98, "learning_rate": 1.9142573177347576e-06, "loss": 2.3768, "step": 36500 }, { "epoch": 0.98, "learning_rate": 1.908878126942404e-06, "loss": 2.7491, "step": 36501 }, { "epoch": 0.98, "learning_rate": 1.9035064975098105e-06, "loss": 2.1672, "step": 36502 }, { "epoch": 0.98, "learning_rate": 1.8981424294778337e-06, "loss": 2.2678, "step": 36503 }, { "epoch": 0.98, "learning_rate": 1.892785922887108e-06, "loss": 2.2391, "step": 36504 }, { "epoch": 0.98, "learning_rate": 1.8874369777782673e-06, "loss": 2.2935, "step": 36505 }, { "epoch": 0.98, "learning_rate": 1.8820955941916129e-06, "loss": 2.5614, "step": 36506 }, { "epoch": 0.98, "learning_rate": 1.8767617721678898e-06, "loss": 2.6399, "step": 36507 }, { "epoch": 0.98, "learning_rate": 1.8714355117472882e-06, "loss": 2.2867, "step": 36508 }, { "epoch": 0.98, "learning_rate": 1.86611681297022e-06, "loss": 2.6854, "step": 36509 }, { "epoch": 0.98, "learning_rate": 1.8608056758769866e-06, "loss": 2.3815, "step": 36510 }, { "epoch": 0.98, "learning_rate": 1.8555021005079998e-06, "loss": 2.5884, "step": 36511 }, { "epoch": 0.98, "learning_rate": 1.8502060869031168e-06, "loss": 2.1288, "step": 36512 }, { "epoch": 0.98, "learning_rate": 1.8449176351027498e-06, "loss": 2.658, "step": 36513 }, { "epoch": 0.98, "learning_rate": 1.8396367451467556e-06, "loss": 2.3526, "step": 36514 }, { "epoch": 0.98, "learning_rate": 1.8343634170752133e-06, "loss": 2.3016, "step": 36515 }, { "epoch": 0.98, "learning_rate": 1.829097650928091e-06, "loss": 2.6044, "step": 36516 }, { "epoch": 0.98, "learning_rate": 1.8238394467452458e-06, "loss": 2.5463, "step": 36517 }, { "epoch": 0.98, "learning_rate": 1.8185888045665345e-06, "loss": 2.359, "step": 36518 }, { "epoch": 0.98, "learning_rate": 1.8133457244317032e-06, "loss": 2.4187, "step": 36519 }, { "epoch": 0.98, "learning_rate": 1.8081102063806088e-06, "loss": 2.5781, "step": 36520 }, { "epoch": 0.98, "learning_rate": 1.8028822504527752e-06, "loss": 2.4053, "step": 36521 }, { "epoch": 0.98, "learning_rate": 1.7976618566878378e-06, "loss": 2.6256, "step": 36522 }, { "epoch": 0.98, "learning_rate": 1.79244902512532e-06, "loss": 2.7982, "step": 36523 }, { "epoch": 0.98, "learning_rate": 1.7872437558047461e-06, "loss": 2.4707, "step": 36524 }, { "epoch": 0.98, "learning_rate": 1.7820460487656399e-06, "loss": 2.2825, "step": 36525 }, { "epoch": 0.98, "learning_rate": 1.776855904047192e-06, "loss": 2.6051, "step": 36526 }, { "epoch": 0.98, "learning_rate": 1.7716733216888159e-06, "loss": 2.6762, "step": 36527 }, { "epoch": 0.98, "learning_rate": 1.7664983017298131e-06, "loss": 2.2146, "step": 36528 }, { "epoch": 0.98, "learning_rate": 1.7613308442093745e-06, "loss": 2.5472, "step": 36529 }, { "epoch": 0.98, "learning_rate": 1.75617094916658e-06, "loss": 2.4792, "step": 36530 }, { "epoch": 0.98, "learning_rate": 1.7510186166406206e-06, "loss": 2.465, "step": 36531 }, { "epoch": 0.98, "learning_rate": 1.745873846670465e-06, "loss": 2.8674, "step": 36532 }, { "epoch": 0.98, "learning_rate": 1.7407366392950819e-06, "loss": 2.4261, "step": 36533 }, { "epoch": 0.98, "learning_rate": 1.7356069945533293e-06, "loss": 2.6082, "step": 36534 }, { "epoch": 0.98, "learning_rate": 1.730484912484176e-06, "loss": 2.295, "step": 36535 }, { "epoch": 0.98, "learning_rate": 1.7253703931264797e-06, "loss": 2.7721, "step": 36536 }, { "epoch": 0.98, "learning_rate": 1.7202634365188763e-06, "loss": 2.6347, "step": 36537 }, { "epoch": 0.98, "learning_rate": 1.7151640427000015e-06, "loss": 2.947, "step": 36538 }, { "epoch": 0.98, "learning_rate": 1.7100722117087131e-06, "loss": 2.3252, "step": 36539 }, { "epoch": 0.98, "learning_rate": 1.7049879435833139e-06, "loss": 2.1269, "step": 36540 }, { "epoch": 0.98, "learning_rate": 1.6999112383624394e-06, "loss": 2.4198, "step": 36541 }, { "epoch": 0.98, "learning_rate": 1.6948420960846144e-06, "loss": 2.3237, "step": 36542 }, { "epoch": 0.98, "learning_rate": 1.6897805167881419e-06, "loss": 2.1799, "step": 36543 }, { "epoch": 0.98, "learning_rate": 1.6847265005115464e-06, "loss": 2.7922, "step": 36544 }, { "epoch": 0.98, "learning_rate": 1.6796800472927976e-06, "loss": 2.5772, "step": 36545 }, { "epoch": 0.98, "learning_rate": 1.67464115717042e-06, "loss": 2.1458, "step": 36546 }, { "epoch": 0.98, "learning_rate": 1.6696098301824947e-06, "loss": 2.5776, "step": 36547 }, { "epoch": 0.98, "learning_rate": 1.664586066366991e-06, "loss": 2.528, "step": 36548 }, { "epoch": 0.98, "learning_rate": 1.6595698657622115e-06, "loss": 2.2323, "step": 36549 }, { "epoch": 0.98, "learning_rate": 1.6545612284060153e-06, "loss": 2.3682, "step": 36550 }, { "epoch": 0.98, "learning_rate": 1.6495601543363713e-06, "loss": 2.5541, "step": 36551 }, { "epoch": 0.98, "learning_rate": 1.644566643591139e-06, "loss": 2.6053, "step": 36552 }, { "epoch": 0.98, "learning_rate": 1.639580696208287e-06, "loss": 2.5443, "step": 36553 }, { "epoch": 0.98, "learning_rate": 1.6346023122253418e-06, "loss": 2.7975, "step": 36554 }, { "epoch": 0.98, "learning_rate": 1.6296314916802723e-06, "loss": 2.5203, "step": 36555 }, { "epoch": 0.98, "learning_rate": 1.6246682346106045e-06, "loss": 2.6827, "step": 36556 }, { "epoch": 0.98, "learning_rate": 1.6197125410538639e-06, "loss": 2.1164, "step": 36557 }, { "epoch": 0.98, "learning_rate": 1.6147644110477976e-06, "loss": 2.7016, "step": 36558 }, { "epoch": 0.98, "learning_rate": 1.6098238446297098e-06, "loss": 2.6628, "step": 36559 }, { "epoch": 0.98, "learning_rate": 1.6048908418371256e-06, "loss": 2.7578, "step": 36560 }, { "epoch": 0.98, "learning_rate": 1.5999654027073485e-06, "loss": 2.6354, "step": 36561 }, { "epoch": 0.98, "learning_rate": 1.595047527277793e-06, "loss": 2.7858, "step": 36562 }, { "epoch": 0.98, "learning_rate": 1.590137215585652e-06, "loss": 2.4109, "step": 36563 }, { "epoch": 0.98, "learning_rate": 1.5852344676682284e-06, "loss": 2.2363, "step": 36564 }, { "epoch": 0.98, "learning_rate": 1.580339283562382e-06, "loss": 2.5899, "step": 36565 }, { "epoch": 0.98, "learning_rate": 1.5754516633055272e-06, "loss": 2.4406, "step": 36566 }, { "epoch": 0.98, "learning_rate": 1.5705716069344122e-06, "loss": 2.6534, "step": 36567 }, { "epoch": 0.98, "learning_rate": 1.5656991144862298e-06, "loss": 2.5909, "step": 36568 }, { "epoch": 0.98, "learning_rate": 1.5608341859978393e-06, "loss": 2.7345, "step": 36569 }, { "epoch": 0.98, "learning_rate": 1.5559768215059888e-06, "loss": 2.7414, "step": 36570 }, { "epoch": 0.98, "learning_rate": 1.5511270210476491e-06, "loss": 2.7421, "step": 36571 }, { "epoch": 0.98, "learning_rate": 1.5462847846594575e-06, "loss": 2.5134, "step": 36572 }, { "epoch": 0.98, "learning_rate": 1.5414501123780512e-06, "loss": 2.4619, "step": 36573 }, { "epoch": 0.98, "learning_rate": 1.5366230042400676e-06, "loss": 2.3503, "step": 36574 }, { "epoch": 0.98, "learning_rate": 1.531803460282144e-06, "loss": 2.52, "step": 36575 }, { "epoch": 0.98, "learning_rate": 1.526991480540807e-06, "loss": 2.1427, "step": 36576 }, { "epoch": 0.98, "learning_rate": 1.5221870650524716e-06, "loss": 1.9328, "step": 36577 }, { "epoch": 0.98, "learning_rate": 1.5173902138535534e-06, "loss": 2.4927, "step": 36578 }, { "epoch": 0.98, "learning_rate": 1.5126009269803565e-06, "loss": 2.6542, "step": 36579 }, { "epoch": 0.98, "learning_rate": 1.5078192044690741e-06, "loss": 2.8707, "step": 36580 }, { "epoch": 0.98, "learning_rate": 1.5030450463562328e-06, "loss": 2.6206, "step": 36581 }, { "epoch": 0.98, "learning_rate": 1.4982784526776927e-06, "loss": 2.2051, "step": 36582 }, { "epoch": 0.98, "learning_rate": 1.493519423469647e-06, "loss": 2.5094, "step": 36583 }, { "epoch": 0.98, "learning_rate": 1.488767958768289e-06, "loss": 2.1473, "step": 36584 }, { "epoch": 0.98, "learning_rate": 1.484024058609368e-06, "loss": 2.2558, "step": 36585 }, { "epoch": 0.98, "learning_rate": 1.479287723029077e-06, "loss": 2.5491, "step": 36586 }, { "epoch": 0.98, "learning_rate": 1.4745589520631654e-06, "loss": 2.2809, "step": 36587 }, { "epoch": 0.98, "learning_rate": 1.4698377457474931e-06, "loss": 2.8533, "step": 36588 }, { "epoch": 0.98, "learning_rate": 1.4651241041176988e-06, "loss": 2.5842, "step": 36589 }, { "epoch": 0.98, "learning_rate": 1.4604180272097534e-06, "loss": 2.5348, "step": 36590 }, { "epoch": 0.98, "learning_rate": 1.455719515059073e-06, "loss": 3.0114, "step": 36591 }, { "epoch": 0.98, "learning_rate": 1.4510285677014067e-06, "loss": 2.6679, "step": 36592 }, { "epoch": 0.98, "learning_rate": 1.446345185172171e-06, "loss": 2.6497, "step": 36593 }, { "epoch": 0.98, "learning_rate": 1.4416693675068925e-06, "loss": 2.9644, "step": 36594 }, { "epoch": 0.98, "learning_rate": 1.4370011147409878e-06, "loss": 2.793, "step": 36595 }, { "epoch": 0.98, "learning_rate": 1.4323404269098728e-06, "loss": 2.5949, "step": 36596 }, { "epoch": 0.98, "learning_rate": 1.4276873040487415e-06, "loss": 2.0193, "step": 36597 }, { "epoch": 0.98, "learning_rate": 1.42304174619301e-06, "loss": 2.1232, "step": 36598 }, { "epoch": 0.98, "learning_rate": 1.4184037533777617e-06, "loss": 2.8019, "step": 36599 }, { "epoch": 0.98, "learning_rate": 1.4137733256381902e-06, "loss": 2.341, "step": 36600 }, { "epoch": 0.98, "learning_rate": 1.4091504630092678e-06, "loss": 2.7697, "step": 36601 }, { "epoch": 0.98, "learning_rate": 1.4045351655261883e-06, "loss": 2.5932, "step": 36602 }, { "epoch": 0.98, "learning_rate": 1.3999274332237023e-06, "loss": 2.5047, "step": 36603 }, { "epoch": 0.98, "learning_rate": 1.3953272661368922e-06, "loss": 2.8425, "step": 36604 }, { "epoch": 0.98, "learning_rate": 1.390734664300508e-06, "loss": 2.7167, "step": 36605 }, { "epoch": 0.98, "learning_rate": 1.3861496277495222e-06, "loss": 2.3635, "step": 36606 }, { "epoch": 0.98, "learning_rate": 1.3815721565183514e-06, "loss": 2.7553, "step": 36607 }, { "epoch": 0.98, "learning_rate": 1.3770022506419678e-06, "loss": 2.3228, "step": 36608 }, { "epoch": 0.98, "learning_rate": 1.372439910154788e-06, "loss": 2.5162, "step": 36609 }, { "epoch": 0.98, "learning_rate": 1.3678851350915622e-06, "loss": 2.6896, "step": 36610 }, { "epoch": 0.98, "learning_rate": 1.3633379254867072e-06, "loss": 2.5289, "step": 36611 }, { "epoch": 0.98, "learning_rate": 1.3587982813745292e-06, "loss": 2.4433, "step": 36612 }, { "epoch": 0.98, "learning_rate": 1.354266202789667e-06, "loss": 2.2763, "step": 36613 }, { "epoch": 0.98, "learning_rate": 1.349741689766315e-06, "loss": 2.3177, "step": 36614 }, { "epoch": 0.98, "learning_rate": 1.3452247423387797e-06, "loss": 2.4483, "step": 36615 }, { "epoch": 0.98, "learning_rate": 1.3407153605413669e-06, "loss": 2.427, "step": 36616 }, { "epoch": 0.98, "learning_rate": 1.3362135444080492e-06, "loss": 2.8864, "step": 36617 }, { "epoch": 0.98, "learning_rate": 1.3317192939730216e-06, "loss": 2.6697, "step": 36618 }, { "epoch": 0.98, "learning_rate": 1.3272326092703678e-06, "loss": 2.6331, "step": 36619 }, { "epoch": 0.98, "learning_rate": 1.322753490334061e-06, "loss": 2.2714, "step": 36620 }, { "epoch": 0.98, "learning_rate": 1.3182819371979626e-06, "loss": 2.4629, "step": 36621 }, { "epoch": 0.98, "learning_rate": 1.3138179498961566e-06, "loss": 2.5014, "step": 36622 }, { "epoch": 0.98, "learning_rate": 1.3093615284621718e-06, "loss": 2.0854, "step": 36623 }, { "epoch": 0.98, "learning_rate": 1.304912672929981e-06, "loss": 2.6321, "step": 36624 }, { "epoch": 0.98, "learning_rate": 1.3004713833332238e-06, "loss": 2.4609, "step": 36625 }, { "epoch": 0.98, "learning_rate": 1.2960376597055402e-06, "loss": 2.3757, "step": 36626 }, { "epoch": 0.98, "learning_rate": 1.2916115020805696e-06, "loss": 2.3994, "step": 36627 }, { "epoch": 0.98, "learning_rate": 1.2871929104917302e-06, "loss": 2.8235, "step": 36628 }, { "epoch": 0.98, "learning_rate": 1.2827818849725503e-06, "loss": 2.0705, "step": 36629 }, { "epoch": 0.98, "learning_rate": 1.278378425556559e-06, "loss": 2.4214, "step": 36630 }, { "epoch": 0.98, "learning_rate": 1.2739825322769516e-06, "loss": 2.5736, "step": 36631 }, { "epoch": 0.98, "learning_rate": 1.269594205167035e-06, "loss": 2.532, "step": 36632 }, { "epoch": 0.98, "learning_rate": 1.265213444260227e-06, "loss": 2.6676, "step": 36633 }, { "epoch": 0.98, "learning_rate": 1.2608402495895011e-06, "loss": 2.5708, "step": 36634 }, { "epoch": 0.98, "learning_rate": 1.2564746211881638e-06, "loss": 2.5351, "step": 36635 }, { "epoch": 0.98, "learning_rate": 1.2521165590891893e-06, "loss": 2.4315, "step": 36636 }, { "epoch": 0.98, "learning_rate": 1.2477660633256615e-06, "loss": 2.6006, "step": 36637 }, { "epoch": 0.98, "learning_rate": 1.2434231339304437e-06, "loss": 2.6437, "step": 36638 }, { "epoch": 0.98, "learning_rate": 1.2390877709365089e-06, "loss": 2.956, "step": 36639 }, { "epoch": 0.98, "learning_rate": 1.2347599743767201e-06, "loss": 2.3816, "step": 36640 }, { "epoch": 0.98, "learning_rate": 1.230439744283829e-06, "loss": 2.0927, "step": 36641 }, { "epoch": 0.98, "learning_rate": 1.2261270806905866e-06, "loss": 2.8284, "step": 36642 }, { "epoch": 0.98, "learning_rate": 1.221821983629523e-06, "loss": 2.7187, "step": 36643 }, { "epoch": 0.98, "learning_rate": 1.2175244531333896e-06, "loss": 1.8817, "step": 36644 }, { "epoch": 0.98, "learning_rate": 1.213234489234827e-06, "loss": 2.4562, "step": 36645 }, { "epoch": 0.98, "learning_rate": 1.2089520919661422e-06, "loss": 2.2181, "step": 36646 }, { "epoch": 0.98, "learning_rate": 1.2046772613599766e-06, "loss": 2.2246, "step": 36647 }, { "epoch": 0.98, "learning_rate": 1.200409997448526e-06, "loss": 2.4569, "step": 36648 }, { "epoch": 0.98, "learning_rate": 1.1961503002642093e-06, "loss": 2.5437, "step": 36649 }, { "epoch": 0.98, "learning_rate": 1.1918981698393338e-06, "loss": 2.349, "step": 36650 }, { "epoch": 0.98, "learning_rate": 1.187653606205985e-06, "loss": 2.1956, "step": 36651 }, { "epoch": 0.98, "learning_rate": 1.1834166093964705e-06, "loss": 2.4212, "step": 36652 }, { "epoch": 0.99, "learning_rate": 1.1791871794427645e-06, "loss": 2.4452, "step": 36653 }, { "epoch": 0.99, "learning_rate": 1.1749653163769525e-06, "loss": 2.3482, "step": 36654 }, { "epoch": 0.99, "learning_rate": 1.17075102023112e-06, "loss": 2.1541, "step": 36655 }, { "epoch": 0.99, "learning_rate": 1.1665442910370194e-06, "loss": 2.5703, "step": 36656 }, { "epoch": 0.99, "learning_rate": 1.162345128826625e-06, "loss": 2.3567, "step": 36657 }, { "epoch": 0.99, "learning_rate": 1.1581535336316895e-06, "loss": 2.5844, "step": 36658 }, { "epoch": 0.99, "learning_rate": 1.153969505484076e-06, "loss": 2.0532, "step": 36659 }, { "epoch": 0.99, "learning_rate": 1.1497930444154258e-06, "loss": 2.3611, "step": 36660 }, { "epoch": 0.99, "learning_rate": 1.1456241504573805e-06, "loss": 2.4153, "step": 36661 }, { "epoch": 0.99, "learning_rate": 1.1414628236414703e-06, "loss": 2.62, "step": 36662 }, { "epoch": 0.99, "learning_rate": 1.1373090639992256e-06, "loss": 2.3566, "step": 36663 }, { "epoch": 0.99, "learning_rate": 1.1331628715621767e-06, "loss": 2.4891, "step": 36664 }, { "epoch": 0.99, "learning_rate": 1.1290242463616318e-06, "loss": 2.0729, "step": 36665 }, { "epoch": 0.99, "learning_rate": 1.1248931884291214e-06, "loss": 2.1967, "step": 36666 }, { "epoch": 0.99, "learning_rate": 1.1207696977958425e-06, "loss": 2.9637, "step": 36667 }, { "epoch": 0.99, "learning_rate": 1.1166537744929927e-06, "loss": 2.1286, "step": 36668 }, { "epoch": 0.99, "learning_rate": 1.112545418551769e-06, "loss": 2.9365, "step": 36669 }, { "epoch": 0.99, "learning_rate": 1.108444630003369e-06, "loss": 2.4651, "step": 36670 }, { "epoch": 0.99, "learning_rate": 1.1043514088787676e-06, "loss": 2.4276, "step": 36671 }, { "epoch": 0.99, "learning_rate": 1.1002657552090512e-06, "loss": 2.5283, "step": 36672 }, { "epoch": 0.99, "learning_rate": 1.0961876690250839e-06, "loss": 2.2827, "step": 36673 }, { "epoch": 0.99, "learning_rate": 1.0921171503577298e-06, "loss": 2.1486, "step": 36674 }, { "epoch": 0.99, "learning_rate": 1.0880541992380755e-06, "loss": 2.4448, "step": 36675 }, { "epoch": 0.99, "learning_rate": 1.0839988156966517e-06, "loss": 1.9311, "step": 36676 }, { "epoch": 0.99, "learning_rate": 1.079950999764323e-06, "loss": 2.7211, "step": 36677 }, { "epoch": 0.99, "learning_rate": 1.0759107514716204e-06, "loss": 2.1992, "step": 36678 }, { "epoch": 0.99, "learning_rate": 1.071878070849297e-06, "loss": 2.2769, "step": 36679 }, { "epoch": 0.99, "learning_rate": 1.0678529579277729e-06, "loss": 2.3991, "step": 36680 }, { "epoch": 0.99, "learning_rate": 1.0638354127375794e-06, "loss": 2.5934, "step": 36681 }, { "epoch": 0.99, "learning_rate": 1.0598254353092473e-06, "loss": 2.4106, "step": 36682 }, { "epoch": 0.99, "learning_rate": 1.0558230256730862e-06, "loss": 2.3151, "step": 36683 }, { "epoch": 0.99, "learning_rate": 1.0518281838594046e-06, "loss": 2.5143, "step": 36684 }, { "epoch": 0.99, "learning_rate": 1.047840909898401e-06, "loss": 2.5949, "step": 36685 }, { "epoch": 0.99, "learning_rate": 1.0438612038204952e-06, "loss": 1.9595, "step": 36686 }, { "epoch": 0.99, "learning_rate": 1.0398890656555527e-06, "loss": 1.848, "step": 36687 }, { "epoch": 0.99, "learning_rate": 1.035924495433882e-06, "loss": 2.5899, "step": 36688 }, { "epoch": 0.99, "learning_rate": 1.0319674931854595e-06, "loss": 2.5185, "step": 36689 }, { "epoch": 0.99, "learning_rate": 1.028018058940261e-06, "loss": 2.4518, "step": 36690 }, { "epoch": 0.99, "learning_rate": 1.0240761927281518e-06, "loss": 2.4718, "step": 36691 }, { "epoch": 0.99, "learning_rate": 1.0201418945791074e-06, "loss": 2.5572, "step": 36692 }, { "epoch": 0.99, "learning_rate": 1.0162151645227712e-06, "loss": 2.5894, "step": 36693 }, { "epoch": 0.99, "learning_rate": 1.0122960025891192e-06, "loss": 2.7843, "step": 36694 }, { "epoch": 0.99, "learning_rate": 1.0083844088075722e-06, "loss": 2.3348, "step": 36695 }, { "epoch": 0.99, "learning_rate": 1.0044803832079953e-06, "loss": 2.3814, "step": 36696 }, { "epoch": 0.99, "learning_rate": 1.0005839258198091e-06, "loss": 2.6464, "step": 36697 }, { "epoch": 0.99, "learning_rate": 9.966950366726567e-07, "loss": 2.6964, "step": 36698 }, { "epoch": 0.99, "learning_rate": 9.928137157959593e-07, "loss": 2.1712, "step": 36699 }, { "epoch": 0.99, "learning_rate": 9.889399632190266e-07, "loss": 2.1688, "step": 36700 }, { "epoch": 0.99, "learning_rate": 9.850737789712794e-07, "loss": 2.1313, "step": 36701 }, { "epoch": 0.99, "learning_rate": 9.812151630820276e-07, "loss": 2.2309, "step": 36702 }, { "epoch": 0.99, "learning_rate": 9.773641155804703e-07, "loss": 2.7119, "step": 36703 }, { "epoch": 0.99, "learning_rate": 9.73520636495806e-07, "loss": 2.1468, "step": 36704 }, { "epoch": 0.99, "learning_rate": 9.69684725857234e-07, "loss": 2.2269, "step": 36705 }, { "epoch": 0.99, "learning_rate": 9.658563836936196e-07, "loss": 2.275, "step": 36706 }, { "epoch": 0.99, "learning_rate": 9.62035610034051e-07, "loss": 2.5195, "step": 36707 }, { "epoch": 0.99, "learning_rate": 9.58222404907505e-07, "loss": 2.6252, "step": 36708 }, { "epoch": 0.99, "learning_rate": 9.544167683428474e-07, "loss": 2.8163, "step": 36709 }, { "epoch": 0.99, "learning_rate": 9.506187003689437e-07, "loss": 2.1933, "step": 36710 }, { "epoch": 0.99, "learning_rate": 9.468282010145491e-07, "loss": 2.5866, "step": 36711 }, { "epoch": 0.99, "learning_rate": 9.43045270308307e-07, "loss": 2.6607, "step": 36712 }, { "epoch": 0.99, "learning_rate": 9.392699082789724e-07, "loss": 2.4948, "step": 36713 }, { "epoch": 0.99, "learning_rate": 9.35502114955078e-07, "loss": 2.3671, "step": 36714 }, { "epoch": 0.99, "learning_rate": 9.317418903652674e-07, "loss": 2.5444, "step": 36715 }, { "epoch": 0.99, "learning_rate": 9.279892345379626e-07, "loss": 3.1815, "step": 36716 }, { "epoch": 0.99, "learning_rate": 9.24244147501585e-07, "loss": 2.3535, "step": 36717 }, { "epoch": 0.99, "learning_rate": 9.205066292845565e-07, "loss": 3.0076, "step": 36718 }, { "epoch": 0.99, "learning_rate": 9.167766799150767e-07, "loss": 2.124, "step": 36719 }, { "epoch": 0.99, "learning_rate": 9.130542994214563e-07, "loss": 2.6953, "step": 36720 }, { "epoch": 0.99, "learning_rate": 9.093394878320061e-07, "loss": 2.4398, "step": 36721 }, { "epoch": 0.99, "learning_rate": 9.056322451747034e-07, "loss": 2.6048, "step": 36722 }, { "epoch": 0.99, "learning_rate": 9.019325714777482e-07, "loss": 2.7045, "step": 36723 }, { "epoch": 0.99, "learning_rate": 8.98240466769118e-07, "loss": 2.117, "step": 36724 }, { "epoch": 0.99, "learning_rate": 8.945559310767903e-07, "loss": 2.4907, "step": 36725 }, { "epoch": 0.99, "learning_rate": 8.908789644287429e-07, "loss": 2.7489, "step": 36726 }, { "epoch": 0.99, "learning_rate": 8.872095668526203e-07, "loss": 2.6649, "step": 36727 }, { "epoch": 0.99, "learning_rate": 8.835477383765112e-07, "loss": 2.5257, "step": 36728 }, { "epoch": 0.99, "learning_rate": 8.7989347902806e-07, "loss": 2.7515, "step": 36729 }, { "epoch": 0.99, "learning_rate": 8.762467888348003e-07, "loss": 2.3608, "step": 36730 }, { "epoch": 0.99, "learning_rate": 8.726076678244877e-07, "loss": 2.2351, "step": 36731 }, { "epoch": 0.99, "learning_rate": 8.689761160246557e-07, "loss": 2.4555, "step": 36732 }, { "epoch": 0.99, "learning_rate": 8.653521334628378e-07, "loss": 1.9221, "step": 36733 }, { "epoch": 0.99, "learning_rate": 8.617357201665677e-07, "loss": 2.398, "step": 36734 }, { "epoch": 0.99, "learning_rate": 8.581268761630457e-07, "loss": 2.3175, "step": 36735 }, { "epoch": 0.99, "learning_rate": 8.545256014798052e-07, "loss": 2.5256, "step": 36736 }, { "epoch": 0.99, "learning_rate": 8.509318961440471e-07, "loss": 2.7095, "step": 36737 }, { "epoch": 0.99, "learning_rate": 8.473457601829715e-07, "loss": 2.1169, "step": 36738 }, { "epoch": 0.99, "learning_rate": 8.43767193623779e-07, "loss": 2.4087, "step": 36739 }, { "epoch": 0.99, "learning_rate": 8.40196196493559e-07, "loss": 2.6552, "step": 36740 }, { "epoch": 0.99, "learning_rate": 8.366327688194009e-07, "loss": 2.5313, "step": 36741 }, { "epoch": 0.99, "learning_rate": 8.330769106282832e-07, "loss": 2.2323, "step": 36742 }, { "epoch": 0.99, "learning_rate": 8.295286219470733e-07, "loss": 2.5688, "step": 36743 }, { "epoch": 0.99, "learning_rate": 8.259879028027495e-07, "loss": 2.1584, "step": 36744 }, { "epoch": 0.99, "learning_rate": 8.224547532221793e-07, "loss": 2.1417, "step": 36745 }, { "epoch": 0.99, "learning_rate": 8.189291732320081e-07, "loss": 2.5924, "step": 36746 }, { "epoch": 0.99, "learning_rate": 8.154111628589922e-07, "loss": 2.7974, "step": 36747 }, { "epoch": 0.99, "learning_rate": 8.11900722129777e-07, "loss": 2.8499, "step": 36748 }, { "epoch": 0.99, "learning_rate": 8.083978510708967e-07, "loss": 2.3817, "step": 36749 }, { "epoch": 0.99, "learning_rate": 8.049025497091078e-07, "loss": 2.8536, "step": 36750 }, { "epoch": 0.99, "learning_rate": 8.014148180706116e-07, "loss": 2.8364, "step": 36751 }, { "epoch": 0.99, "learning_rate": 7.979346561820533e-07, "loss": 2.7873, "step": 36752 }, { "epoch": 0.99, "learning_rate": 7.944620640696343e-07, "loss": 2.7539, "step": 36753 }, { "epoch": 0.99, "learning_rate": 7.909970417596668e-07, "loss": 2.3183, "step": 36754 }, { "epoch": 0.99, "learning_rate": 7.875395892785741e-07, "loss": 2.5888, "step": 36755 }, { "epoch": 0.99, "learning_rate": 7.840897066524466e-07, "loss": 2.1036, "step": 36756 }, { "epoch": 0.99, "learning_rate": 7.806473939073744e-07, "loss": 2.738, "step": 36757 }, { "epoch": 0.99, "learning_rate": 7.772126510694477e-07, "loss": 2.1716, "step": 36758 }, { "epoch": 0.99, "learning_rate": 7.737854781647569e-07, "loss": 2.8031, "step": 36759 }, { "epoch": 0.99, "learning_rate": 7.7036587521917e-07, "loss": 2.6764, "step": 36760 }, { "epoch": 0.99, "learning_rate": 7.669538422586664e-07, "loss": 2.3939, "step": 36761 }, { "epoch": 0.99, "learning_rate": 7.635493793091141e-07, "loss": 2.3481, "step": 36762 }, { "epoch": 0.99, "learning_rate": 7.601524863962706e-07, "loss": 2.1918, "step": 36763 }, { "epoch": 0.99, "learning_rate": 7.567631635457817e-07, "loss": 2.5853, "step": 36764 }, { "epoch": 0.99, "learning_rate": 7.533814107834048e-07, "loss": 2.0446, "step": 36765 }, { "epoch": 0.99, "learning_rate": 7.500072281348969e-07, "loss": 2.3184, "step": 36766 }, { "epoch": 0.99, "learning_rate": 7.466406156255711e-07, "loss": 2.416, "step": 36767 }, { "epoch": 0.99, "learning_rate": 7.432815732810738e-07, "loss": 2.5814, "step": 36768 }, { "epoch": 0.99, "learning_rate": 7.399301011268289e-07, "loss": 2.2375, "step": 36769 }, { "epoch": 0.99, "learning_rate": 7.365861991882606e-07, "loss": 2.6445, "step": 36770 }, { "epoch": 0.99, "learning_rate": 7.332498674905708e-07, "loss": 2.7518, "step": 36771 }, { "epoch": 0.99, "learning_rate": 7.299211060591837e-07, "loss": 2.214, "step": 36772 }, { "epoch": 0.99, "learning_rate": 7.265999149193014e-07, "loss": 2.3836, "step": 36773 }, { "epoch": 0.99, "learning_rate": 7.23286294096015e-07, "loss": 2.609, "step": 36774 }, { "epoch": 0.99, "learning_rate": 7.199802436144154e-07, "loss": 2.1521, "step": 36775 }, { "epoch": 0.99, "learning_rate": 7.166817634995937e-07, "loss": 2.1907, "step": 36776 }, { "epoch": 0.99, "learning_rate": 7.133908537765299e-07, "loss": 1.8963, "step": 36777 }, { "epoch": 0.99, "learning_rate": 7.10107514470204e-07, "loss": 2.6892, "step": 36778 }, { "epoch": 0.99, "learning_rate": 7.068317456054851e-07, "loss": 2.0912, "step": 36779 }, { "epoch": 0.99, "learning_rate": 7.035635472071311e-07, "loss": 2.655, "step": 36780 }, { "epoch": 0.99, "learning_rate": 7.00302919299789e-07, "loss": 2.4136, "step": 36781 }, { "epoch": 0.99, "learning_rate": 6.970498619084387e-07, "loss": 2.3951, "step": 36782 }, { "epoch": 0.99, "learning_rate": 6.938043750576162e-07, "loss": 2.4836, "step": 36783 }, { "epoch": 0.99, "learning_rate": 6.905664587717464e-07, "loss": 2.316, "step": 36784 }, { "epoch": 0.99, "learning_rate": 6.873361130754762e-07, "loss": 2.7365, "step": 36785 }, { "epoch": 0.99, "learning_rate": 6.841133379933417e-07, "loss": 2.1771, "step": 36786 }, { "epoch": 0.99, "learning_rate": 6.808981335497677e-07, "loss": 2.5182, "step": 36787 }, { "epoch": 0.99, "learning_rate": 6.77690499768957e-07, "loss": 2.4988, "step": 36788 }, { "epoch": 0.99, "learning_rate": 6.744904366753346e-07, "loss": 2.3347, "step": 36789 }, { "epoch": 0.99, "learning_rate": 6.712979442931034e-07, "loss": 2.2155, "step": 36790 }, { "epoch": 0.99, "learning_rate": 6.68113022646466e-07, "loss": 2.7375, "step": 36791 }, { "epoch": 0.99, "learning_rate": 6.649356717596256e-07, "loss": 2.6446, "step": 36792 }, { "epoch": 0.99, "learning_rate": 6.617658916564517e-07, "loss": 2.8227, "step": 36793 }, { "epoch": 0.99, "learning_rate": 6.586036823610364e-07, "loss": 2.0568, "step": 36794 }, { "epoch": 0.99, "learning_rate": 6.554490438974714e-07, "loss": 2.3068, "step": 36795 }, { "epoch": 0.99, "learning_rate": 6.523019762895155e-07, "loss": 2.4721, "step": 36796 }, { "epoch": 0.99, "learning_rate": 6.491624795610384e-07, "loss": 2.3732, "step": 36797 }, { "epoch": 0.99, "learning_rate": 6.460305537359102e-07, "loss": 2.677, "step": 36798 }, { "epoch": 0.99, "learning_rate": 6.429061988377782e-07, "loss": 2.802, "step": 36799 }, { "epoch": 0.99, "learning_rate": 6.397894148902905e-07, "loss": 2.5534, "step": 36800 }, { "epoch": 0.99, "learning_rate": 6.366802019170948e-07, "loss": 2.5759, "step": 36801 }, { "epoch": 0.99, "learning_rate": 6.335785599417276e-07, "loss": 2.4121, "step": 36802 }, { "epoch": 0.99, "learning_rate": 6.304844889876149e-07, "loss": 2.3991, "step": 36803 }, { "epoch": 0.99, "learning_rate": 6.273979890784043e-07, "loss": 2.0445, "step": 36804 }, { "epoch": 0.99, "learning_rate": 6.243190602372995e-07, "loss": 3.1291, "step": 36805 }, { "epoch": 0.99, "learning_rate": 6.212477024877261e-07, "loss": 2.6837, "step": 36806 }, { "epoch": 0.99, "learning_rate": 6.181839158528879e-07, "loss": 2.512, "step": 36807 }, { "epoch": 0.99, "learning_rate": 6.151277003559885e-07, "loss": 2.3943, "step": 36808 }, { "epoch": 0.99, "learning_rate": 6.120790560202316e-07, "loss": 2.5622, "step": 36809 }, { "epoch": 0.99, "learning_rate": 6.090379828687098e-07, "loss": 2.8858, "step": 36810 }, { "epoch": 0.99, "learning_rate": 6.060044809244047e-07, "loss": 2.5457, "step": 36811 }, { "epoch": 0.99, "learning_rate": 6.029785502102981e-07, "loss": 2.6156, "step": 36812 }, { "epoch": 0.99, "learning_rate": 5.999601907494823e-07, "loss": 2.1278, "step": 36813 }, { "epoch": 0.99, "learning_rate": 5.96949402564606e-07, "loss": 2.0571, "step": 36814 }, { "epoch": 0.99, "learning_rate": 5.9394618567854e-07, "loss": 2.4654, "step": 36815 }, { "epoch": 0.99, "learning_rate": 5.909505401140435e-07, "loss": 2.3352, "step": 36816 }, { "epoch": 0.99, "learning_rate": 5.879624658938764e-07, "loss": 2.3463, "step": 36817 }, { "epoch": 0.99, "learning_rate": 5.849819630406871e-07, "loss": 2.7498, "step": 36818 }, { "epoch": 0.99, "learning_rate": 5.820090315769022e-07, "loss": 2.2788, "step": 36819 }, { "epoch": 0.99, "learning_rate": 5.790436715251702e-07, "loss": 2.6105, "step": 36820 }, { "epoch": 0.99, "learning_rate": 5.760858829079174e-07, "loss": 2.2462, "step": 36821 }, { "epoch": 0.99, "learning_rate": 5.731356657475706e-07, "loss": 2.4246, "step": 36822 }, { "epoch": 0.99, "learning_rate": 5.701930200664451e-07, "loss": 2.2623, "step": 36823 }, { "epoch": 0.99, "learning_rate": 5.672579458868565e-07, "loss": 2.1498, "step": 36824 }, { "epoch": 0.99, "learning_rate": 5.643304432311203e-07, "loss": 2.479, "step": 36825 }, { "epoch": 0.99, "learning_rate": 5.614105121212187e-07, "loss": 1.896, "step": 36826 }, { "epoch": 0.99, "learning_rate": 5.584981525794674e-07, "loss": 2.7722, "step": 36827 }, { "epoch": 0.99, "learning_rate": 5.555933646278489e-07, "loss": 2.756, "step": 36828 }, { "epoch": 0.99, "learning_rate": 5.526961482883453e-07, "loss": 2.3887, "step": 36829 }, { "epoch": 0.99, "learning_rate": 5.498065035829392e-07, "loss": 2.5913, "step": 36830 }, { "epoch": 0.99, "learning_rate": 5.469244305335019e-07, "loss": 2.1944, "step": 36831 }, { "epoch": 0.99, "learning_rate": 5.440499291617939e-07, "loss": 3.0577, "step": 36832 }, { "epoch": 0.99, "learning_rate": 5.411829994897977e-07, "loss": 2.4598, "step": 36833 }, { "epoch": 0.99, "learning_rate": 5.383236415391624e-07, "loss": 2.1802, "step": 36834 }, { "epoch": 0.99, "learning_rate": 5.354718553313154e-07, "loss": 2.4392, "step": 36835 }, { "epoch": 0.99, "learning_rate": 5.326276408882391e-07, "loss": 2.577, "step": 36836 }, { "epoch": 0.99, "learning_rate": 5.297909982311388e-07, "loss": 2.4817, "step": 36837 }, { "epoch": 0.99, "learning_rate": 5.26961927381775e-07, "loss": 2.7682, "step": 36838 }, { "epoch": 0.99, "learning_rate": 5.241404283613527e-07, "loss": 2.3465, "step": 36839 }, { "epoch": 0.99, "learning_rate": 5.213265011914104e-07, "loss": 1.8795, "step": 36840 }, { "epoch": 0.99, "learning_rate": 5.185201458931533e-07, "loss": 2.9315, "step": 36841 }, { "epoch": 0.99, "learning_rate": 5.157213624880086e-07, "loss": 2.7532, "step": 36842 }, { "epoch": 0.99, "learning_rate": 5.129301509969597e-07, "loss": 2.6214, "step": 36843 }, { "epoch": 0.99, "learning_rate": 5.101465114413228e-07, "loss": 2.9271, "step": 36844 }, { "epoch": 0.99, "learning_rate": 5.073704438420812e-07, "loss": 2.4449, "step": 36845 }, { "epoch": 0.99, "learning_rate": 5.04601948220329e-07, "loss": 2.7322, "step": 36846 }, { "epoch": 0.99, "learning_rate": 5.018410245970496e-07, "loss": 2.0124, "step": 36847 }, { "epoch": 0.99, "learning_rate": 4.990876729931149e-07, "loss": 2.8647, "step": 36848 }, { "epoch": 0.99, "learning_rate": 4.963418934292863e-07, "loss": 2.3775, "step": 36849 }, { "epoch": 0.99, "learning_rate": 4.936036859266579e-07, "loss": 2.2624, "step": 36850 }, { "epoch": 0.99, "learning_rate": 4.90873050505658e-07, "loss": 2.6223, "step": 36851 }, { "epoch": 0.99, "learning_rate": 4.881499871871586e-07, "loss": 2.3604, "step": 36852 }, { "epoch": 0.99, "learning_rate": 4.85434495991699e-07, "loss": 2.2109, "step": 36853 }, { "epoch": 0.99, "learning_rate": 4.827265769399292e-07, "loss": 2.4425, "step": 36854 }, { "epoch": 0.99, "learning_rate": 4.800262300523883e-07, "loss": 2.1508, "step": 36855 }, { "epoch": 0.99, "learning_rate": 4.773334553493936e-07, "loss": 2.4312, "step": 36856 }, { "epoch": 0.99, "learning_rate": 4.7464825285148394e-07, "loss": 2.4777, "step": 36857 }, { "epoch": 0.99, "learning_rate": 4.719706225788656e-07, "loss": 2.1944, "step": 36858 }, { "epoch": 0.99, "learning_rate": 4.6930056455185555e-07, "loss": 2.195, "step": 36859 }, { "epoch": 0.99, "learning_rate": 4.6663807879088193e-07, "loss": 2.6255, "step": 36860 }, { "epoch": 0.99, "learning_rate": 4.6398316531581777e-07, "loss": 2.2821, "step": 36861 }, { "epoch": 0.99, "learning_rate": 4.6133582414698003e-07, "loss": 2.2124, "step": 36862 }, { "epoch": 0.99, "learning_rate": 4.586960553043529e-07, "loss": 2.0819, "step": 36863 }, { "epoch": 0.99, "learning_rate": 4.5606385880792024e-07, "loss": 2.4751, "step": 36864 }, { "epoch": 0.99, "learning_rate": 4.534392346776661e-07, "loss": 2.3431, "step": 36865 }, { "epoch": 0.99, "learning_rate": 4.5082218293346354e-07, "loss": 2.4645, "step": 36866 }, { "epoch": 0.99, "learning_rate": 4.482127035951855e-07, "loss": 2.5618, "step": 36867 }, { "epoch": 0.99, "learning_rate": 4.4561079668248293e-07, "loss": 2.0682, "step": 36868 }, { "epoch": 0.99, "learning_rate": 4.430164622151178e-07, "loss": 2.6556, "step": 36869 }, { "epoch": 0.99, "learning_rate": 4.404297002127411e-07, "loss": 1.8587, "step": 36870 }, { "epoch": 0.99, "learning_rate": 4.378505106950037e-07, "loss": 2.5298, "step": 36871 }, { "epoch": 0.99, "learning_rate": 4.352788936814456e-07, "loss": 2.3951, "step": 36872 }, { "epoch": 0.99, "learning_rate": 4.327148491913846e-07, "loss": 2.4357, "step": 36873 }, { "epoch": 0.99, "learning_rate": 4.3015837724447173e-07, "loss": 2.3767, "step": 36874 }, { "epoch": 0.99, "learning_rate": 4.276094778599138e-07, "loss": 2.591, "step": 36875 }, { "epoch": 0.99, "learning_rate": 4.250681510571397e-07, "loss": 2.8438, "step": 36876 }, { "epoch": 0.99, "learning_rate": 4.2253439685535634e-07, "loss": 2.2274, "step": 36877 }, { "epoch": 0.99, "learning_rate": 4.200082152736595e-07, "loss": 2.68, "step": 36878 }, { "epoch": 0.99, "learning_rate": 4.1748960633136714e-07, "loss": 2.5808, "step": 36879 }, { "epoch": 0.99, "learning_rate": 4.1497857004735293e-07, "loss": 2.5348, "step": 36880 }, { "epoch": 0.99, "learning_rate": 4.124751064408239e-07, "loss": 2.4149, "step": 36881 }, { "epoch": 0.99, "learning_rate": 4.0997921553065363e-07, "loss": 2.6018, "step": 36882 }, { "epoch": 0.99, "learning_rate": 4.074908973358271e-07, "loss": 2.8109, "step": 36883 }, { "epoch": 0.99, "learning_rate": 4.05010151874996e-07, "loss": 1.811, "step": 36884 }, { "epoch": 0.99, "learning_rate": 4.025369791672562e-07, "loss": 2.9335, "step": 36885 }, { "epoch": 0.99, "learning_rate": 4.000713792310373e-07, "loss": 2.4566, "step": 36886 }, { "epoch": 0.99, "learning_rate": 3.9761335208532423e-07, "loss": 2.2724, "step": 36887 }, { "epoch": 0.99, "learning_rate": 3.9516289774843564e-07, "loss": 1.8499, "step": 36888 }, { "epoch": 0.99, "learning_rate": 3.9272001623924524e-07, "loss": 2.5779, "step": 36889 }, { "epoch": 0.99, "learning_rate": 3.902847075759608e-07, "loss": 2.6826, "step": 36890 }, { "epoch": 0.99, "learning_rate": 3.87856971777234e-07, "loss": 2.1904, "step": 36891 }, { "epoch": 0.99, "learning_rate": 3.8543680886127253e-07, "loss": 2.4457, "step": 36892 }, { "epoch": 0.99, "learning_rate": 3.830242188466171e-07, "loss": 2.3114, "step": 36893 }, { "epoch": 0.99, "learning_rate": 3.8061920175147534e-07, "loss": 2.6519, "step": 36894 }, { "epoch": 0.99, "learning_rate": 3.78221757594055e-07, "loss": 2.4709, "step": 36895 }, { "epoch": 0.99, "learning_rate": 3.7583188639245256e-07, "loss": 1.7848, "step": 36896 }, { "epoch": 0.99, "learning_rate": 3.7344958816487585e-07, "loss": 2.637, "step": 36897 }, { "epoch": 0.99, "learning_rate": 3.7107486292931035e-07, "loss": 2.3125, "step": 36898 }, { "epoch": 0.99, "learning_rate": 3.6870771070374174e-07, "loss": 2.422, "step": 36899 }, { "epoch": 0.99, "learning_rate": 3.6634813150615565e-07, "loss": 2.0825, "step": 36900 }, { "epoch": 0.99, "learning_rate": 3.639961253544266e-07, "loss": 2.3516, "step": 36901 }, { "epoch": 0.99, "learning_rate": 3.6165169226631823e-07, "loss": 2.0849, "step": 36902 }, { "epoch": 0.99, "learning_rate": 3.5931483225959406e-07, "loss": 2.9638, "step": 36903 }, { "epoch": 0.99, "learning_rate": 3.5698554535201764e-07, "loss": 2.4962, "step": 36904 }, { "epoch": 0.99, "learning_rate": 3.546638315611306e-07, "loss": 2.9405, "step": 36905 }, { "epoch": 0.99, "learning_rate": 3.523496909046964e-07, "loss": 2.1287, "step": 36906 }, { "epoch": 0.99, "learning_rate": 3.500431234000345e-07, "loss": 2.3064, "step": 36907 }, { "epoch": 0.99, "learning_rate": 3.4774412906479756e-07, "loss": 2.6232, "step": 36908 }, { "epoch": 0.99, "learning_rate": 3.4545270791630503e-07, "loss": 2.8559, "step": 36909 }, { "epoch": 0.99, "learning_rate": 3.431688599719873e-07, "loss": 2.6066, "step": 36910 }, { "epoch": 0.99, "learning_rate": 3.40892585249053e-07, "loss": 2.5339, "step": 36911 }, { "epoch": 0.99, "learning_rate": 3.3862388376471045e-07, "loss": 2.5936, "step": 36912 }, { "epoch": 0.99, "learning_rate": 3.363627555363902e-07, "loss": 2.5115, "step": 36913 }, { "epoch": 0.99, "learning_rate": 3.341092005809676e-07, "loss": 2.5701, "step": 36914 }, { "epoch": 0.99, "learning_rate": 3.318632189156512e-07, "loss": 2.7791, "step": 36915 }, { "epoch": 0.99, "learning_rate": 3.2962481055742734e-07, "loss": 2.4757, "step": 36916 }, { "epoch": 0.99, "learning_rate": 3.273939755231714e-07, "loss": 2.0831, "step": 36917 }, { "epoch": 0.99, "learning_rate": 3.251707138298698e-07, "loss": 2.4274, "step": 36918 }, { "epoch": 0.99, "learning_rate": 3.22955025494398e-07, "loss": 2.3729, "step": 36919 }, { "epoch": 0.99, "learning_rate": 3.2074691053340933e-07, "loss": 2.1444, "step": 36920 }, { "epoch": 0.99, "learning_rate": 3.185463689637791e-07, "loss": 2.3504, "step": 36921 }, { "epoch": 0.99, "learning_rate": 3.163534008021607e-07, "loss": 2.4749, "step": 36922 }, { "epoch": 0.99, "learning_rate": 3.141680060650964e-07, "loss": 2.877, "step": 36923 }, { "epoch": 0.99, "learning_rate": 3.1199018476912864e-07, "loss": 2.5721, "step": 36924 }, { "epoch": 0.99, "learning_rate": 3.0981993693079967e-07, "loss": 2.5057, "step": 36925 }, { "epoch": 0.99, "learning_rate": 3.076572625665408e-07, "loss": 2.4512, "step": 36926 }, { "epoch": 0.99, "learning_rate": 3.0550216169278336e-07, "loss": 2.2913, "step": 36927 }, { "epoch": 0.99, "learning_rate": 3.0335463432584754e-07, "loss": 2.0109, "step": 36928 }, { "epoch": 0.99, "learning_rate": 3.0121468048183164e-07, "loss": 2.2827, "step": 36929 }, { "epoch": 0.99, "learning_rate": 2.99082300177167e-07, "loss": 3.1443, "step": 36930 }, { "epoch": 0.99, "learning_rate": 2.9695749342795174e-07, "loss": 2.1497, "step": 36931 }, { "epoch": 0.99, "learning_rate": 2.948402602501732e-07, "loss": 2.2981, "step": 36932 }, { "epoch": 0.99, "learning_rate": 2.9273060066004053e-07, "loss": 2.6015, "step": 36933 }, { "epoch": 0.99, "learning_rate": 2.9062851467343e-07, "loss": 2.2871, "step": 36934 }, { "epoch": 0.99, "learning_rate": 2.885340023062177e-07, "loss": 2.7884, "step": 36935 }, { "epoch": 0.99, "learning_rate": 2.86447063574502e-07, "loss": 2.4832, "step": 36936 }, { "epoch": 0.99, "learning_rate": 2.8436769849382594e-07, "loss": 2.7261, "step": 36937 }, { "epoch": 0.99, "learning_rate": 2.822959070799547e-07, "loss": 2.4798, "step": 36938 }, { "epoch": 0.99, "learning_rate": 2.8023168934876444e-07, "loss": 2.472, "step": 36939 }, { "epoch": 0.99, "learning_rate": 2.781750453159093e-07, "loss": 2.4484, "step": 36940 }, { "epoch": 0.99, "learning_rate": 2.761259749967104e-07, "loss": 2.5366, "step": 36941 }, { "epoch": 0.99, "learning_rate": 2.7408447840693297e-07, "loss": 2.5816, "step": 36942 }, { "epoch": 0.99, "learning_rate": 2.7205055556189795e-07, "loss": 2.4243, "step": 36943 }, { "epoch": 0.99, "learning_rate": 2.700242064771485e-07, "loss": 2.0116, "step": 36944 }, { "epoch": 0.99, "learning_rate": 2.6800543116789477e-07, "loss": 2.2017, "step": 36945 }, { "epoch": 0.99, "learning_rate": 2.6599422964945775e-07, "loss": 2.5093, "step": 36946 }, { "epoch": 0.99, "learning_rate": 2.639906019372695e-07, "loss": 2.1615, "step": 36947 }, { "epoch": 0.99, "learning_rate": 2.6199454804620714e-07, "loss": 3.1535, "step": 36948 }, { "epoch": 0.99, "learning_rate": 2.6000606799159165e-07, "loss": 2.3168, "step": 36949 }, { "epoch": 0.99, "learning_rate": 2.580251617884111e-07, "loss": 2.189, "step": 36950 }, { "epoch": 0.99, "learning_rate": 2.560518294517644e-07, "loss": 2.6238, "step": 36951 }, { "epoch": 0.99, "learning_rate": 2.540860709964177e-07, "loss": 2.4966, "step": 36952 }, { "epoch": 0.99, "learning_rate": 2.521278864374699e-07, "loss": 1.924, "step": 36953 }, { "epoch": 0.99, "learning_rate": 2.5017727578957595e-07, "loss": 2.3473, "step": 36954 }, { "epoch": 0.99, "learning_rate": 2.482342390677239e-07, "loss": 2.5025, "step": 36955 }, { "epoch": 0.99, "learning_rate": 2.462987762864577e-07, "loss": 2.8756, "step": 36956 }, { "epoch": 0.99, "learning_rate": 2.4437088746043223e-07, "loss": 2.2696, "step": 36957 }, { "epoch": 0.99, "learning_rate": 2.424505726044135e-07, "loss": 2.1111, "step": 36958 }, { "epoch": 0.99, "learning_rate": 2.405378317327234e-07, "loss": 1.8168, "step": 36959 }, { "epoch": 0.99, "learning_rate": 2.386326648601278e-07, "loss": 2.2422, "step": 36960 }, { "epoch": 0.99, "learning_rate": 2.3673507200083767e-07, "loss": 2.3573, "step": 36961 }, { "epoch": 0.99, "learning_rate": 2.3484505316928585e-07, "loss": 2.6811, "step": 36962 }, { "epoch": 0.99, "learning_rate": 2.3296260837979422e-07, "loss": 2.3732, "step": 36963 }, { "epoch": 0.99, "learning_rate": 2.3108773764668468e-07, "loss": 2.5891, "step": 36964 }, { "epoch": 0.99, "learning_rate": 2.2922044098405704e-07, "loss": 2.6989, "step": 36965 }, { "epoch": 0.99, "learning_rate": 2.2736071840612215e-07, "loss": 2.1821, "step": 36966 }, { "epoch": 0.99, "learning_rate": 2.2550856992697987e-07, "loss": 2.5563, "step": 36967 }, { "epoch": 0.99, "learning_rate": 2.23663995560619e-07, "loss": 2.7165, "step": 36968 }, { "epoch": 0.99, "learning_rate": 2.2182699532113936e-07, "loss": 2.4086, "step": 36969 }, { "epoch": 0.99, "learning_rate": 2.199975692221967e-07, "loss": 2.545, "step": 36970 }, { "epoch": 0.99, "learning_rate": 2.1817571727789088e-07, "loss": 2.3861, "step": 36971 }, { "epoch": 0.99, "learning_rate": 2.1636143950198862e-07, "loss": 2.3271, "step": 36972 }, { "epoch": 0.99, "learning_rate": 2.1455473590814568e-07, "loss": 2.564, "step": 36973 }, { "epoch": 0.99, "learning_rate": 2.1275560651001778e-07, "loss": 2.2623, "step": 36974 }, { "epoch": 0.99, "learning_rate": 2.1096405132137175e-07, "loss": 2.1182, "step": 36975 }, { "epoch": 0.99, "learning_rate": 2.0918007035575226e-07, "loss": 2.384, "step": 36976 }, { "epoch": 0.99, "learning_rate": 2.07403663626593e-07, "loss": 2.8609, "step": 36977 }, { "epoch": 0.99, "learning_rate": 2.0563483114743876e-07, "loss": 2.5126, "step": 36978 }, { "epoch": 0.99, "learning_rate": 2.0387357293161212e-07, "loss": 2.2658, "step": 36979 }, { "epoch": 0.99, "learning_rate": 2.0211988899254686e-07, "loss": 1.7043, "step": 36980 }, { "epoch": 0.99, "learning_rate": 2.0037377934334355e-07, "loss": 2.5784, "step": 36981 }, { "epoch": 0.99, "learning_rate": 1.9863524399743594e-07, "loss": 2.6347, "step": 36982 }, { "epoch": 0.99, "learning_rate": 1.9690428296792463e-07, "loss": 2.3175, "step": 36983 }, { "epoch": 0.99, "learning_rate": 1.9518089626802126e-07, "loss": 2.3829, "step": 36984 }, { "epoch": 0.99, "learning_rate": 1.9346508391049345e-07, "loss": 2.6256, "step": 36985 }, { "epoch": 0.99, "learning_rate": 1.9175684590866381e-07, "loss": 2.5275, "step": 36986 }, { "epoch": 0.99, "learning_rate": 1.9005618227529996e-07, "loss": 3.084, "step": 36987 }, { "epoch": 0.99, "learning_rate": 1.8836309302328049e-07, "loss": 2.4432, "step": 36988 }, { "epoch": 0.99, "learning_rate": 1.8667757816548393e-07, "loss": 2.4894, "step": 36989 }, { "epoch": 0.99, "learning_rate": 1.8499963771467786e-07, "loss": 2.3987, "step": 36990 }, { "epoch": 0.99, "learning_rate": 1.8332927168351887e-07, "loss": 2.4233, "step": 36991 }, { "epoch": 0.99, "learning_rate": 1.816664800847745e-07, "loss": 2.8908, "step": 36992 }, { "epoch": 0.99, "learning_rate": 1.8001126293099025e-07, "loss": 2.4174, "step": 36993 }, { "epoch": 0.99, "learning_rate": 1.7836362023460062e-07, "loss": 2.1391, "step": 36994 }, { "epoch": 0.99, "learning_rate": 1.7672355200826218e-07, "loss": 2.3235, "step": 36995 }, { "epoch": 0.99, "learning_rate": 1.7509105826429838e-07, "loss": 2.2739, "step": 36996 }, { "epoch": 0.99, "learning_rate": 1.7346613901503272e-07, "loss": 2.19, "step": 36997 }, { "epoch": 0.99, "learning_rate": 1.7184879427289968e-07, "loss": 2.4993, "step": 36998 }, { "epoch": 0.99, "learning_rate": 1.7023902405011171e-07, "loss": 2.1127, "step": 36999 }, { "epoch": 0.99, "learning_rate": 1.6863682835877024e-07, "loss": 2.6524, "step": 37000 }, { "epoch": 0.99, "learning_rate": 1.6704220721108776e-07, "loss": 2.4603, "step": 37001 }, { "epoch": 0.99, "learning_rate": 1.6545516061916565e-07, "loss": 2.4805, "step": 37002 }, { "epoch": 0.99, "learning_rate": 1.6387568859499436e-07, "loss": 2.0693, "step": 37003 }, { "epoch": 0.99, "learning_rate": 1.6230379115056427e-07, "loss": 2.3548, "step": 37004 }, { "epoch": 0.99, "learning_rate": 1.6073946829775476e-07, "loss": 2.1568, "step": 37005 }, { "epoch": 0.99, "learning_rate": 1.5918272004844525e-07, "loss": 2.625, "step": 37006 }, { "epoch": 0.99, "learning_rate": 1.5763354641440408e-07, "loss": 2.5742, "step": 37007 }, { "epoch": 0.99, "learning_rate": 1.5609194740739962e-07, "loss": 2.5508, "step": 37008 }, { "epoch": 0.99, "learning_rate": 1.545579230389782e-07, "loss": 2.2201, "step": 37009 }, { "epoch": 0.99, "learning_rate": 1.530314733210192e-07, "loss": 2.4907, "step": 37010 }, { "epoch": 0.99, "learning_rate": 1.5151259826484686e-07, "loss": 2.577, "step": 37011 }, { "epoch": 0.99, "learning_rate": 1.5000129788200756e-07, "loss": 2.0641, "step": 37012 }, { "epoch": 0.99, "learning_rate": 1.4849757218415861e-07, "loss": 2.8046, "step": 37013 }, { "epoch": 0.99, "learning_rate": 1.4700142118240222e-07, "loss": 2.5379, "step": 37014 }, { "epoch": 0.99, "learning_rate": 1.4551284488828475e-07, "loss": 2.5751, "step": 37015 }, { "epoch": 0.99, "learning_rate": 1.440318433129084e-07, "loss": 2.9206, "step": 37016 }, { "epoch": 0.99, "learning_rate": 1.425584164677085e-07, "loss": 2.443, "step": 37017 }, { "epoch": 0.99, "learning_rate": 1.4109256436367623e-07, "loss": 2.5168, "step": 37018 }, { "epoch": 0.99, "learning_rate": 1.3963428701191384e-07, "loss": 2.2967, "step": 37019 }, { "epoch": 0.99, "learning_rate": 1.3818358442363454e-07, "loss": 2.2856, "step": 37020 }, { "epoch": 0.99, "learning_rate": 1.3674045660960755e-07, "loss": 2.5939, "step": 37021 }, { "epoch": 0.99, "learning_rate": 1.3530490358093506e-07, "loss": 2.6487, "step": 37022 }, { "epoch": 0.99, "learning_rate": 1.3387692534838626e-07, "loss": 2.5039, "step": 37023 }, { "epoch": 0.99, "learning_rate": 1.324565219228413e-07, "loss": 2.6614, "step": 37024 }, { "epoch": 1.0, "learning_rate": 1.3104369331506938e-07, "loss": 2.4848, "step": 37025 }, { "epoch": 1.0, "learning_rate": 1.2963843953583965e-07, "loss": 2.3426, "step": 37026 }, { "epoch": 1.0, "learning_rate": 1.282407605955882e-07, "loss": 2.6443, "step": 37027 }, { "epoch": 1.0, "learning_rate": 1.268506565050842e-07, "loss": 2.4048, "step": 37028 }, { "epoch": 1.0, "learning_rate": 1.2546812727476376e-07, "loss": 2.1906, "step": 37029 }, { "epoch": 1.0, "learning_rate": 1.2409317291506294e-07, "loss": 2.98, "step": 37030 }, { "epoch": 1.0, "learning_rate": 1.2272579343663993e-07, "loss": 2.1835, "step": 37031 }, { "epoch": 1.0, "learning_rate": 1.213659888495977e-07, "loss": 2.5461, "step": 37032 }, { "epoch": 1.0, "learning_rate": 1.2001375916426137e-07, "loss": 2.4356, "step": 37033 }, { "epoch": 1.0, "learning_rate": 1.1866910439106703e-07, "loss": 2.8244, "step": 37034 }, { "epoch": 1.0, "learning_rate": 1.173320245400067e-07, "loss": 2.1932, "step": 37035 }, { "epoch": 1.0, "learning_rate": 1.1600251962129438e-07, "loss": 2.7171, "step": 37036 }, { "epoch": 1.0, "learning_rate": 1.1468058964492212e-07, "loss": 2.646, "step": 37037 }, { "epoch": 1.0, "learning_rate": 1.1336623462099294e-07, "loss": 2.5447, "step": 37038 }, { "epoch": 1.0, "learning_rate": 1.1205945455949884e-07, "loss": 2.2974, "step": 37039 }, { "epoch": 1.0, "learning_rate": 1.107602494702098e-07, "loss": 2.1108, "step": 37040 }, { "epoch": 1.0, "learning_rate": 1.094686193631178e-07, "loss": 2.01, "step": 37041 }, { "epoch": 1.0, "learning_rate": 1.0818456424788182e-07, "loss": 2.2877, "step": 37042 }, { "epoch": 1.0, "learning_rate": 1.0690808413416075e-07, "loss": 2.4632, "step": 37043 }, { "epoch": 1.0, "learning_rate": 1.0563917903194664e-07, "loss": 2.1764, "step": 37044 }, { "epoch": 1.0, "learning_rate": 1.0437784895045432e-07, "loss": 2.6279, "step": 37045 }, { "epoch": 1.0, "learning_rate": 1.0312409389956479e-07, "loss": 2.8216, "step": 37046 }, { "epoch": 1.0, "learning_rate": 1.018779138886039e-07, "loss": 2.5457, "step": 37047 }, { "epoch": 1.0, "learning_rate": 1.0063930892700856e-07, "loss": 2.4794, "step": 37048 }, { "epoch": 1.0, "learning_rate": 9.94082790243267e-08, "loss": 2.7119, "step": 37049 }, { "epoch": 1.0, "learning_rate": 9.818482418966212e-08, "loss": 2.4601, "step": 37050 }, { "epoch": 1.0, "learning_rate": 9.696894443234073e-08, "loss": 2.4898, "step": 37051 }, { "epoch": 1.0, "learning_rate": 9.576063976168836e-08, "loss": 2.7251, "step": 37052 }, { "epoch": 1.0, "learning_rate": 9.455991018680887e-08, "loss": 2.3713, "step": 37053 }, { "epoch": 1.0, "learning_rate": 9.336675571680608e-08, "loss": 2.3565, "step": 37054 }, { "epoch": 1.0, "learning_rate": 9.218117636056178e-08, "loss": 2.7877, "step": 37055 }, { "epoch": 1.0, "learning_rate": 9.100317212729081e-08, "loss": 2.6136, "step": 37056 }, { "epoch": 1.0, "learning_rate": 8.983274302576394e-08, "loss": 2.8852, "step": 37057 }, { "epoch": 1.0, "learning_rate": 8.866988906486296e-08, "loss": 2.5925, "step": 37058 }, { "epoch": 1.0, "learning_rate": 8.751461025346963e-08, "loss": 2.4605, "step": 37059 }, { "epoch": 1.0, "learning_rate": 8.636690660035473e-08, "loss": 2.1083, "step": 37060 }, { "epoch": 1.0, "learning_rate": 8.522677811406698e-08, "loss": 2.6013, "step": 37061 }, { "epoch": 1.0, "learning_rate": 8.409422480337714e-08, "loss": 2.1299, "step": 37062 }, { "epoch": 1.0, "learning_rate": 8.296924667683392e-08, "loss": 2.4367, "step": 37063 }, { "epoch": 1.0, "learning_rate": 8.185184374298604e-08, "loss": 2.187, "step": 37064 }, { "epoch": 1.0, "learning_rate": 8.074201601016017e-08, "loss": 2.8224, "step": 37065 }, { "epoch": 1.0, "learning_rate": 7.963976348690505e-08, "loss": 2.411, "step": 37066 }, { "epoch": 1.0, "learning_rate": 7.854508618154732e-08, "loss": 2.3798, "step": 37067 }, { "epoch": 1.0, "learning_rate": 7.745798410230265e-08, "loss": 2.2335, "step": 37068 }, { "epoch": 1.0, "learning_rate": 7.637845725760873e-08, "loss": 2.6781, "step": 37069 }, { "epoch": 1.0, "learning_rate": 7.530650565534814e-08, "loss": 2.128, "step": 37070 }, { "epoch": 1.0, "learning_rate": 7.424212930384756e-08, "loss": 2.4052, "step": 37071 }, { "epoch": 1.0, "learning_rate": 7.318532821110057e-08, "loss": 2.2706, "step": 37072 }, { "epoch": 1.0, "learning_rate": 7.213610238521185e-08, "loss": 2.1331, "step": 37073 }, { "epoch": 1.0, "learning_rate": 7.109445183395291e-08, "loss": 2.566, "step": 37074 }, { "epoch": 1.0, "learning_rate": 7.006037656542841e-08, "loss": 2.6822, "step": 37075 }, { "epoch": 1.0, "learning_rate": 6.903387658718785e-08, "loss": 2.4226, "step": 37076 }, { "epoch": 1.0, "learning_rate": 6.801495190733587e-08, "loss": 2.344, "step": 37077 }, { "epoch": 1.0, "learning_rate": 6.700360253331094e-08, "loss": 2.2748, "step": 37078 }, { "epoch": 1.0, "learning_rate": 6.599982847299569e-08, "loss": 2.5948, "step": 37079 }, { "epoch": 1.0, "learning_rate": 6.500362973382856e-08, "loss": 2.5726, "step": 37080 }, { "epoch": 1.0, "learning_rate": 6.401500632347012e-08, "loss": 2.2638, "step": 37081 }, { "epoch": 1.0, "learning_rate": 6.303395824935886e-08, "loss": 2.344, "step": 37082 }, { "epoch": 1.0, "learning_rate": 6.206048551882227e-08, "loss": 2.1642, "step": 37083 }, { "epoch": 1.0, "learning_rate": 6.109458813940982e-08, "loss": 2.5374, "step": 37084 }, { "epoch": 1.0, "learning_rate": 6.013626611844902e-08, "loss": 2.3272, "step": 37085 }, { "epoch": 1.0, "learning_rate": 5.918551946304529e-08, "loss": 2.0878, "step": 37086 }, { "epoch": 1.0, "learning_rate": 5.824234818052609e-08, "loss": 2.5191, "step": 37087 }, { "epoch": 1.0, "learning_rate": 5.7306752277885846e-08, "loss": 2.3983, "step": 37088 }, { "epoch": 1.0, "learning_rate": 5.6378731762452004e-08, "loss": 2.6697, "step": 37089 }, { "epoch": 1.0, "learning_rate": 5.5458286640996945e-08, "loss": 2.3511, "step": 37090 }, { "epoch": 1.0, "learning_rate": 5.454541692073711e-08, "loss": 2.162, "step": 37091 }, { "epoch": 1.0, "learning_rate": 5.3640122608444864e-08, "loss": 2.3167, "step": 37092 }, { "epoch": 1.0, "learning_rate": 5.274240371089256e-08, "loss": 2.2304, "step": 37093 }, { "epoch": 1.0, "learning_rate": 5.185226023507461e-08, "loss": 2.6707, "step": 37094 }, { "epoch": 1.0, "learning_rate": 5.096969218765235e-08, "loss": 2.0767, "step": 37095 }, { "epoch": 1.0, "learning_rate": 5.0094699575287115e-08, "loss": 2.6107, "step": 37096 }, { "epoch": 1.0, "learning_rate": 4.922728240464025e-08, "loss": 2.8319, "step": 37097 }, { "epoch": 1.0, "learning_rate": 4.8367440682262063e-08, "loss": 2.4898, "step": 37098 }, { "epoch": 1.0, "learning_rate": 4.751517441470288e-08, "loss": 2.579, "step": 37099 }, { "epoch": 1.0, "learning_rate": 4.667048360840198e-08, "loss": 2.4281, "step": 37100 }, { "epoch": 1.0, "learning_rate": 4.583336826968765e-08, "loss": 2.2902, "step": 37101 }, { "epoch": 1.0, "learning_rate": 4.500382840499917e-08, "loss": 2.357, "step": 37102 }, { "epoch": 1.0, "learning_rate": 4.418186402066482e-08, "loss": 2.2052, "step": 37103 }, { "epoch": 1.0, "learning_rate": 4.33674751226798e-08, "loss": 2.5887, "step": 37104 }, { "epoch": 1.0, "learning_rate": 4.256066171748341e-08, "loss": 2.4645, "step": 37105 }, { "epoch": 1.0, "learning_rate": 4.1761423811070845e-08, "loss": 2.5081, "step": 37106 }, { "epoch": 1.0, "learning_rate": 4.096976140943731e-08, "loss": 2.2393, "step": 37107 }, { "epoch": 1.0, "learning_rate": 4.0185674518689045e-08, "loss": 2.6897, "step": 37108 }, { "epoch": 1.0, "learning_rate": 3.9409163144710214e-08, "loss": 2.5786, "step": 37109 }, { "epoch": 1.0, "learning_rate": 3.864022729338501e-08, "loss": 2.8165, "step": 37110 }, { "epoch": 1.0, "learning_rate": 3.787886697048659e-08, "loss": 2.3495, "step": 37111 }, { "epoch": 1.0, "learning_rate": 3.712508218189914e-08, "loss": 2.4635, "step": 37112 }, { "epoch": 1.0, "learning_rate": 3.637887293328479e-08, "loss": 2.5774, "step": 37113 }, { "epoch": 1.0, "learning_rate": 3.564023923019466e-08, "loss": 2.3412, "step": 37114 }, { "epoch": 1.0, "learning_rate": 3.4909181078401906e-08, "loss": 2.7464, "step": 37115 }, { "epoch": 1.0, "learning_rate": 3.418569848334663e-08, "loss": 2.4727, "step": 37116 }, { "epoch": 1.0, "learning_rate": 3.3469791450579935e-08, "loss": 2.1161, "step": 37117 }, { "epoch": 1.0, "learning_rate": 3.27614599854309e-08, "loss": 2.6614, "step": 37118 }, { "epoch": 1.0, "learning_rate": 3.2060704093228585e-08, "loss": 2.5914, "step": 37119 }, { "epoch": 1.0, "learning_rate": 3.13675237794131e-08, "loss": 2.1892, "step": 37120 }, { "epoch": 1.0, "learning_rate": 3.0681919049202477e-08, "loss": 1.9824, "step": 37121 }, { "epoch": 1.0, "learning_rate": 3.000388990781478e-08, "loss": 2.5788, "step": 37122 }, { "epoch": 1.0, "learning_rate": 2.933343636024599e-08, "loss": 2.3256, "step": 37123 }, { "epoch": 1.0, "learning_rate": 2.8670558411714175e-08, "loss": 2.7804, "step": 37124 }, { "epoch": 1.0, "learning_rate": 2.801525606710431e-08, "loss": 2.771, "step": 37125 }, { "epoch": 1.0, "learning_rate": 2.7367529331634445e-08, "loss": 2.7562, "step": 37126 }, { "epoch": 1.0, "learning_rate": 2.6727378209967513e-08, "loss": 2.2395, "step": 37127 }, { "epoch": 1.0, "learning_rate": 2.6094802706988496e-08, "loss": 2.5125, "step": 37128 }, { "epoch": 1.0, "learning_rate": 2.5469802827582376e-08, "loss": 2.3487, "step": 37129 }, { "epoch": 1.0, "learning_rate": 2.4852378576412093e-08, "loss": 2.4284, "step": 37130 }, { "epoch": 1.0, "learning_rate": 2.4242529958251602e-08, "loss": 2.355, "step": 37131 }, { "epoch": 1.0, "learning_rate": 2.3640256977541796e-08, "loss": 2.6688, "step": 37132 }, { "epoch": 1.0, "learning_rate": 2.3045559639056635e-08, "loss": 2.7189, "step": 37133 }, { "epoch": 1.0, "learning_rate": 2.2458437947125986e-08, "loss": 2.5532, "step": 37134 }, { "epoch": 1.0, "learning_rate": 2.1878891906301767e-08, "loss": 2.3897, "step": 37135 }, { "epoch": 1.0, "learning_rate": 2.130692152102487e-08, "loss": 2.7721, "step": 37136 }, { "epoch": 1.0, "learning_rate": 2.0742526795403116e-08, "loss": 2.7943, "step": 37137 }, { "epoch": 1.0, "learning_rate": 2.0185707733988422e-08, "loss": 2.5152, "step": 37138 }, { "epoch": 1.0, "learning_rate": 1.9636464340777594e-08, "loss": 2.3341, "step": 37139 }, { "epoch": 1.0, "learning_rate": 1.9094796619989473e-08, "loss": 2.6374, "step": 37140 }, { "epoch": 1.0, "learning_rate": 1.8560704575842913e-08, "loss": 2.6808, "step": 37141 }, { "epoch": 1.0, "learning_rate": 1.803418821222369e-08, "loss": 2.3525, "step": 37142 }, { "epoch": 1.0, "learning_rate": 1.751524753323963e-08, "loss": 2.4169, "step": 37143 }, { "epoch": 1.0, "learning_rate": 1.700388254288754e-08, "loss": 2.3288, "step": 37144 }, { "epoch": 1.0, "learning_rate": 1.650009324483115e-08, "loss": 2.1963, "step": 37145 }, { "epoch": 1.0, "learning_rate": 1.6003879642956244e-08, "loss": 2.1998, "step": 37146 }, { "epoch": 1.0, "learning_rate": 1.5515241741037578e-08, "loss": 2.4786, "step": 37147 }, { "epoch": 1.0, "learning_rate": 1.503417954284991e-08, "loss": 2.5877, "step": 37148 }, { "epoch": 1.0, "learning_rate": 1.4560693052056984e-08, "loss": 2.5337, "step": 37149 }, { "epoch": 1.0, "learning_rate": 1.4094782272100482e-08, "loss": 2.3309, "step": 37150 }, { "epoch": 1.0, "learning_rate": 1.363644720653312e-08, "loss": 2.4313, "step": 37151 }, { "epoch": 1.0, "learning_rate": 1.3185687858907614e-08, "loss": 2.3818, "step": 37152 }, { "epoch": 1.0, "learning_rate": 1.2742504232665653e-08, "loss": 2.6433, "step": 37153 }, { "epoch": 1.0, "learning_rate": 1.2306896331026884e-08, "loss": 2.363, "step": 37154 }, { "epoch": 1.0, "learning_rate": 1.1878864157433001e-08, "loss": 2.3405, "step": 37155 }, { "epoch": 1.0, "learning_rate": 1.1458407714992625e-08, "loss": 2.6482, "step": 37156 }, { "epoch": 1.0, "learning_rate": 1.1045527007036427e-08, "loss": 2.373, "step": 37157 }, { "epoch": 1.0, "learning_rate": 1.0640222036562008e-08, "loss": 2.4178, "step": 37158 }, { "epoch": 1.0, "learning_rate": 1.0242492806677994e-08, "loss": 2.0517, "step": 37159 }, { "epoch": 1.0, "learning_rate": 9.85233932049301e-09, "loss": 1.9821, "step": 37160 }, { "epoch": 1.0, "learning_rate": 9.46976158078261e-09, "loss": 2.7395, "step": 37161 }, { "epoch": 1.0, "learning_rate": 9.094759590655421e-09, "loss": 2.461, "step": 37162 }, { "epoch": 1.0, "learning_rate": 8.727333352775979e-09, "loss": 2.1886, "step": 37163 }, { "epoch": 1.0, "learning_rate": 8.367482870030862e-09, "loss": 2.6097, "step": 37164 }, { "epoch": 1.0, "learning_rate": 8.015208145084607e-09, "loss": 2.8485, "step": 37165 }, { "epoch": 1.0, "learning_rate": 7.67050918071277e-09, "loss": 2.5506, "step": 37166 }, { "epoch": 1.0, "learning_rate": 7.333385979357843e-09, "loss": 2.2445, "step": 37167 }, { "epoch": 1.0, "learning_rate": 7.00383854368436e-09, "loss": 2.1928, "step": 37168 }, { "epoch": 1.0, "learning_rate": 6.6818668761348124e-09, "loss": 2.8147, "step": 37169 }, { "epoch": 1.0, "learning_rate": 6.367470979262713e-09, "loss": 2.5015, "step": 37170 }, { "epoch": 1.0, "learning_rate": 6.060650855288507e-09, "loss": 2.0896, "step": 37171 }, { "epoch": 1.0, "learning_rate": 5.761406506654687e-09, "loss": 2.2273, "step": 37172 }, { "epoch": 1.0, "learning_rate": 5.469737935581698e-09, "loss": 2.8608, "step": 37173 }, { "epoch": 1.0, "learning_rate": 5.185645144289986e-09, "loss": 2.3796, "step": 37174 }, { "epoch": 1.0, "learning_rate": 4.909128134999996e-09, "loss": 2.1046, "step": 37175 }, { "epoch": 1.0, "learning_rate": 4.640186909599109e-09, "loss": 2.3817, "step": 37176 }, { "epoch": 1.0, "learning_rate": 4.37882147030777e-09, "loss": 2.6364, "step": 37177 }, { "epoch": 1.0, "learning_rate": 4.125031819124381e-09, "loss": 2.4971, "step": 37178 }, { "epoch": 1.0, "learning_rate": 3.87881795793632e-09, "loss": 2.3189, "step": 37179 }, { "epoch": 1.0, "learning_rate": 3.6401798884089233e-09, "loss": 2.1549, "step": 37180 }, { "epoch": 1.0, "learning_rate": 3.4091176126516133e-09, "loss": 2.6668, "step": 37181 }, { "epoch": 1.0, "learning_rate": 3.185631132329725e-09, "loss": 2.6569, "step": 37182 }, { "epoch": 1.0, "learning_rate": 2.9697204489975705e-09, "loss": 2.7134, "step": 37183 }, { "epoch": 1.0, "learning_rate": 2.7613855643204845e-09, "loss": 2.6349, "step": 37184 }, { "epoch": 1.0, "learning_rate": 2.5606264800748236e-09, "loss": 2.4192, "step": 37185 }, { "epoch": 1.0, "learning_rate": 2.3674431975928556e-09, "loss": 2.5033, "step": 37186 }, { "epoch": 1.0, "learning_rate": 2.1818357184288928e-09, "loss": 2.4659, "step": 37187 }, { "epoch": 1.0, "learning_rate": 2.003804043915203e-09, "loss": 2.2815, "step": 37188 }, { "epoch": 1.0, "learning_rate": 1.833348175384053e-09, "loss": 2.4029, "step": 37189 }, { "epoch": 1.0, "learning_rate": 1.6704681142787338e-09, "loss": 2.1247, "step": 37190 }, { "epoch": 1.0, "learning_rate": 1.5151638617094676e-09, "loss": 2.7531, "step": 37191 }, { "epoch": 1.0, "learning_rate": 1.367435418786478e-09, "loss": 2.5563, "step": 37192 }, { "epoch": 1.0, "learning_rate": 1.2272827868420322e-09, "loss": 2.4829, "step": 37193 }, { "epoch": 1.0, "learning_rate": 1.094705966764309e-09, "loss": 2.2653, "step": 37194 }, { "epoch": 1.0, "learning_rate": 9.69704959663531e-10, "loss": 2.1666, "step": 37195 }, { "epoch": 1.0, "learning_rate": 8.522797663168546e-10, "loss": 2.4138, "step": 37196 }, { "epoch": 1.0, "learning_rate": 7.424303878345029e-10, "loss": 2.4646, "step": 37197 }, { "epoch": 1.0, "learning_rate": 6.401568248826095e-10, "loss": 1.6387, "step": 37198 }, { "epoch": 1.0, "learning_rate": 5.45459078349353e-10, "loss": 2.362, "step": 37199 }, { "epoch": 1.0, "learning_rate": 4.5833714890086697e-10, "loss": 2.6988, "step": 37200 }, { "epoch": 1.0, "learning_rate": 3.7879103720328547e-10, "loss": 2.7326, "step": 37201 }, { "epoch": 1.0, "learning_rate": 3.068207438117199e-10, "loss": 2.543, "step": 37202 }, { "epoch": 1.0, "learning_rate": 2.4242626928128173e-10, "loss": 2.8327, "step": 37203 }, { "epoch": 1.0, "learning_rate": 1.856076141670826e-10, "loss": 2.5811, "step": 37204 }, { "epoch": 1.0, "learning_rate": 1.3636477891321165e-10, "loss": 2.4328, "step": 37205 }, { "epoch": 1.0, "learning_rate": 9.469776374171346e-11, "loss": 2.9689, "step": 37206 }, { "epoch": 1.0, "learning_rate": 6.060656920769959e-11, "loss": 2.656, "step": 37207 }, { "epoch": 1.0, "learning_rate": 3.409119531117e-11, "loss": 2.8179, "step": 37208 }, { "epoch": 1.0, "learning_rate": 1.515164238519162e-11, "loss": 2.4558, "step": 37209 }, { "epoch": 1.0, "learning_rate": 3.787910651809057e-12, "loss": 1.8923, "step": 37210 }, { "epoch": 1.0, "learning_rate": 0.0, "loss": 2.6694, "step": 37211 }, { "epoch": 1.0, "step": 37211, "total_flos": 8.316238462906794e+18, "train_loss": 2.5902053065405193, "train_runtime": 58361.0639, "train_samples_per_second": 10.202, "train_steps_per_second": 0.638 } ], "max_steps": 37211, "num_train_epochs": 1, "total_flos": 8.316238462906794e+18, "trial_name": null, "trial_params": null }