Moemu's picture
Upload model
ce4b83b
{"current_steps": 10, "total_steps": 3665, "loss": 2.6446, "learning_rate": 7.999880967748602e-05, "epoch": 0.013642564802182811, "percentage": 0.27, "elapsed_time": "0:00:07", "remaining_time": "0:44:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 20, "total_steps": 3665, "loss": 2.5833, "learning_rate": 7.999469507332807e-05, "epoch": 0.027285129604365622, "percentage": 0.55, "elapsed_time": "0:00:14", "remaining_time": "0:42:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 30, "total_steps": 3665, "loss": 2.3323, "learning_rate": 7.998764179444167e-05, "epoch": 0.040927694406548434, "percentage": 0.82, "elapsed_time": "0:00:21", "remaining_time": "0:43:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 40, "total_steps": 3665, "loss": 2.2764, "learning_rate": 7.997765035907784e-05, "epoch": 0.054570259208731244, "percentage": 1.09, "elapsed_time": "0:00:28", "remaining_time": "0:42:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 50, "total_steps": 3665, "loss": 2.3653, "learning_rate": 7.99661465457664e-05, "epoch": 0.06821282401091405, "percentage": 1.36, "elapsed_time": "0:00:35", "remaining_time": "0:42:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 60, "total_steps": 3665, "loss": 2.3655, "learning_rate": 7.995057481402883e-05, "epoch": 0.08185538881309687, "percentage": 1.64, "elapsed_time": "0:00:41", "remaining_time": "0:42:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 70, "total_steps": 3665, "loss": 2.2008, "learning_rate": 7.993206764937005e-05, "epoch": 0.09549795361527967, "percentage": 1.91, "elapsed_time": "0:00:48", "remaining_time": "0:41:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 80, "total_steps": 3665, "loss": 2.4619, "learning_rate": 7.99106264116338e-05, "epoch": 0.10914051841746249, "percentage": 2.18, "elapsed_time": "0:00:55", "remaining_time": "0:41:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 90, "total_steps": 3665, "loss": 2.4662, "learning_rate": 7.988625267624962e-05, "epoch": 0.12278308321964529, "percentage": 2.46, "elapsed_time": "0:01:01", "remaining_time": "0:40:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 100, "total_steps": 3665, "loss": 2.3909, "learning_rate": 7.9858948234117e-05, "epoch": 0.1364256480218281, "percentage": 2.73, "elapsed_time": "0:01:08", "remaining_time": "0:40:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 110, "total_steps": 3665, "loss": 2.4736, "learning_rate": 7.98287150914739e-05, "epoch": 0.15006821282401092, "percentage": 3.0, "elapsed_time": "0:01:14", "remaining_time": "0:40:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 120, "total_steps": 3665, "loss": 2.3796, "learning_rate": 7.979555546974922e-05, "epoch": 0.16371077762619374, "percentage": 3.27, "elapsed_time": "0:01:21", "remaining_time": "0:39:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 130, "total_steps": 3665, "loss": 2.2357, "learning_rate": 7.975947180539966e-05, "epoch": 0.17735334242837653, "percentage": 3.55, "elapsed_time": "0:01:27", "remaining_time": "0:39:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 140, "total_steps": 3665, "loss": 2.3435, "learning_rate": 7.972046674973065e-05, "epoch": 0.19099590723055934, "percentage": 3.82, "elapsed_time": "0:01:34", "remaining_time": "0:39:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 150, "total_steps": 3665, "loss": 2.4652, "learning_rate": 7.967854316870156e-05, "epoch": 0.20463847203274216, "percentage": 4.09, "elapsed_time": "0:01:40", "remaining_time": "0:39:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 160, "total_steps": 3665, "loss": 2.2549, "learning_rate": 7.963370414271514e-05, "epoch": 0.21828103683492497, "percentage": 4.37, "elapsed_time": "0:01:47", "remaining_time": "0:39:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 170, "total_steps": 3665, "loss": 2.3102, "learning_rate": 7.958595296639115e-05, "epoch": 0.23192360163710776, "percentage": 4.64, "elapsed_time": "0:01:54", "remaining_time": "0:39:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 180, "total_steps": 3665, "loss": 2.2444, "learning_rate": 7.953529314832426e-05, "epoch": 0.24556616643929058, "percentage": 4.91, "elapsed_time": "0:02:01", "remaining_time": "0:39:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 190, "total_steps": 3665, "loss": 2.2928, "learning_rate": 7.948172841082635e-05, "epoch": 0.2592087312414734, "percentage": 5.18, "elapsed_time": "0:02:08", "remaining_time": "0:39:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 200, "total_steps": 3665, "loss": 2.2113, "learning_rate": 7.942526268965287e-05, "epoch": 0.2728512960436562, "percentage": 5.46, "elapsed_time": "0:02:14", "remaining_time": "0:38:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 210, "total_steps": 3665, "loss": 2.0795, "learning_rate": 7.936590013371378e-05, "epoch": 0.286493860845839, "percentage": 5.73, "elapsed_time": "0:02:23", "remaining_time": "0:39:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 220, "total_steps": 3665, "loss": 2.3991, "learning_rate": 7.93036451047686e-05, "epoch": 0.30013642564802184, "percentage": 6.0, "elapsed_time": "0:02:29", "remaining_time": "0:39:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 230, "total_steps": 3665, "loss": 2.3399, "learning_rate": 7.923850217710604e-05, "epoch": 0.31377899045020463, "percentage": 6.28, "elapsed_time": "0:02:36", "remaining_time": "0:38:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 240, "total_steps": 3665, "loss": 2.3305, "learning_rate": 7.917047613720773e-05, "epoch": 0.3274215552523875, "percentage": 6.55, "elapsed_time": "0:02:42", "remaining_time": "0:38:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 250, "total_steps": 3665, "loss": 2.2404, "learning_rate": 7.909957198339669e-05, "epoch": 0.34106412005457026, "percentage": 6.82, "elapsed_time": "0:02:49", "remaining_time": "0:38:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 260, "total_steps": 3665, "loss": 2.1853, "learning_rate": 7.902579492546998e-05, "epoch": 0.35470668485675305, "percentage": 7.09, "elapsed_time": "0:02:55", "remaining_time": "0:38:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 270, "total_steps": 3665, "loss": 2.3177, "learning_rate": 7.894915038431595e-05, "epoch": 0.3683492496589359, "percentage": 7.37, "elapsed_time": "0:03:02", "remaining_time": "0:38:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 280, "total_steps": 3665, "loss": 2.3621, "learning_rate": 7.886964399151586e-05, "epoch": 0.3819918144611187, "percentage": 7.64, "elapsed_time": "0:03:09", "remaining_time": "0:38:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 290, "total_steps": 3665, "loss": 2.3687, "learning_rate": 7.878728158893015e-05, "epoch": 0.3956343792633015, "percentage": 7.91, "elapsed_time": "0:03:15", "remaining_time": "0:37:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 300, "total_steps": 3665, "loss": 2.2021, "learning_rate": 7.870206922826921e-05, "epoch": 0.4092769440654843, "percentage": 8.19, "elapsed_time": "0:03:22", "remaining_time": "0:37:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 310, "total_steps": 3665, "loss": 2.0236, "learning_rate": 7.862294656001264e-05, "epoch": 0.4229195088676671, "percentage": 8.46, "elapsed_time": "0:03:29", "remaining_time": "0:37:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 320, "total_steps": 3665, "loss": 2.4181, "learning_rate": 7.853233670108533e-05, "epoch": 0.43656207366984995, "percentage": 8.73, "elapsed_time": "0:03:36", "remaining_time": "0:37:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 330, "total_steps": 3665, "loss": 2.2359, "learning_rate": 7.843889561656962e-05, "epoch": 0.45020463847203274, "percentage": 9.0, "elapsed_time": "0:03:42", "remaining_time": "0:37:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 340, "total_steps": 3665, "loss": 2.2156, "learning_rate": 7.83426301721999e-05, "epoch": 0.4638472032742155, "percentage": 9.28, "elapsed_time": "0:03:49", "remaining_time": "0:37:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 350, "total_steps": 3665, "loss": 2.256, "learning_rate": 7.824354744123498e-05, "epoch": 0.47748976807639837, "percentage": 9.55, "elapsed_time": "0:03:56", "remaining_time": "0:37:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 360, "total_steps": 3665, "loss": 2.2627, "learning_rate": 7.814165470393832e-05, "epoch": 0.49113233287858116, "percentage": 9.82, "elapsed_time": "0:04:03", "remaining_time": "0:37:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 370, "total_steps": 3665, "loss": 2.1303, "learning_rate": 7.803695944704313e-05, "epoch": 0.504774897680764, "percentage": 10.1, "elapsed_time": "0:04:10", "remaining_time": "0:37:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 380, "total_steps": 3665, "loss": 2.307, "learning_rate": 7.79294693632023e-05, "epoch": 0.5184174624829468, "percentage": 10.37, "elapsed_time": "0:04:17", "remaining_time": "0:37:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 390, "total_steps": 3665, "loss": 2.2182, "learning_rate": 7.781919235042309e-05, "epoch": 0.5320600272851296, "percentage": 10.64, "elapsed_time": "0:04:23", "remaining_time": "0:36:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 400, "total_steps": 3665, "loss": 2.2309, "learning_rate": 7.770613651148688e-05, "epoch": 0.5457025920873124, "percentage": 10.91, "elapsed_time": "0:04:30", "remaining_time": "0:36:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 410, "total_steps": 3665, "loss": 2.0949, "learning_rate": 7.75903101533538e-05, "epoch": 0.5593451568894953, "percentage": 11.19, "elapsed_time": "0:04:36", "remaining_time": "0:36:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 420, "total_steps": 3665, "loss": 2.0541, "learning_rate": 7.747172178655232e-05, "epoch": 0.572987721691678, "percentage": 11.46, "elapsed_time": "0:04:44", "remaining_time": "0:36:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 430, "total_steps": 3665, "loss": 2.0429, "learning_rate": 7.735038012455398e-05, "epoch": 0.5866302864938608, "percentage": 11.73, "elapsed_time": "0:04:51", "remaining_time": "0:36:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 440, "total_steps": 3665, "loss": 2.1867, "learning_rate": 7.722629408313309e-05, "epoch": 0.6002728512960437, "percentage": 12.01, "elapsed_time": "0:04:58", "remaining_time": "0:36:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 450, "total_steps": 3665, "loss": 2.2556, "learning_rate": 7.709947277971168e-05, "epoch": 0.6139154160982264, "percentage": 12.28, "elapsed_time": "0:05:05", "remaining_time": "0:36:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 460, "total_steps": 3665, "loss": 2.3728, "learning_rate": 7.69699255326896e-05, "epoch": 0.6275579809004093, "percentage": 12.55, "elapsed_time": "0:05:11", "remaining_time": "0:36:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 470, "total_steps": 3665, "loss": 2.4319, "learning_rate": 7.683766186075973e-05, "epoch": 0.6412005457025921, "percentage": 12.82, "elapsed_time": "0:05:18", "remaining_time": "0:36:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 480, "total_steps": 3665, "loss": 2.2417, "learning_rate": 7.670269148220874e-05, "epoch": 0.654843110504775, "percentage": 13.1, "elapsed_time": "0:05:25", "remaining_time": "0:36:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 490, "total_steps": 3665, "loss": 2.1867, "learning_rate": 7.656502431420286e-05, "epoch": 0.6684856753069577, "percentage": 13.37, "elapsed_time": "0:05:32", "remaining_time": "0:35:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 500, "total_steps": 3665, "loss": 2.2426, "learning_rate": 7.64246704720593e-05, "epoch": 0.6821282401091405, "percentage": 13.64, "elapsed_time": "0:05:40", "remaining_time": "0:35:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 510, "total_steps": 3665, "loss": 2.1057, "learning_rate": 7.628164026850302e-05, "epoch": 0.6957708049113234, "percentage": 13.92, "elapsed_time": "0:05:47", "remaining_time": "0:35:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 520, "total_steps": 3665, "loss": 2.0724, "learning_rate": 7.613594421290888e-05, "epoch": 0.7094133697135061, "percentage": 14.19, "elapsed_time": "0:05:53", "remaining_time": "0:35:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 530, "total_steps": 3665, "loss": 2.1513, "learning_rate": 7.59875930105296e-05, "epoch": 0.723055934515689, "percentage": 14.46, "elapsed_time": "0:06:00", "remaining_time": "0:35:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 540, "total_steps": 3665, "loss": 1.996, "learning_rate": 7.583659756170904e-05, "epoch": 0.7366984993178718, "percentage": 14.73, "elapsed_time": "0:06:07", "remaining_time": "0:35:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 550, "total_steps": 3665, "loss": 2.2927, "learning_rate": 7.568296896108135e-05, "epoch": 0.7503410641200545, "percentage": 15.01, "elapsed_time": "0:06:13", "remaining_time": "0:35:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 560, "total_steps": 3665, "loss": 2.2445, "learning_rate": 7.552671849675571e-05, "epoch": 0.7639836289222374, "percentage": 15.28, "elapsed_time": "0:06:20", "remaining_time": "0:35:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 570, "total_steps": 3665, "loss": 2.1723, "learning_rate": 7.536785764948705e-05, "epoch": 0.7776261937244202, "percentage": 15.55, "elapsed_time": "0:06:27", "remaining_time": "0:35:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 580, "total_steps": 3665, "loss": 2.1945, "learning_rate": 7.520639809183234e-05, "epoch": 0.791268758526603, "percentage": 15.83, "elapsed_time": "0:06:34", "remaining_time": "0:34:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 590, "total_steps": 3665, "loss": 2.385, "learning_rate": 7.5042351687293e-05, "epoch": 0.8049113233287858, "percentage": 16.1, "elapsed_time": "0:06:40", "remaining_time": "0:34:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 600, "total_steps": 3665, "loss": 1.8776, "learning_rate": 7.487573048944318e-05, "epoch": 0.8185538881309686, "percentage": 16.37, "elapsed_time": "0:06:47", "remaining_time": "0:34:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 610, "total_steps": 3665, "loss": 2.1586, "learning_rate": 7.470654674104415e-05, "epoch": 0.8321964529331515, "percentage": 16.64, "elapsed_time": "0:06:53", "remaining_time": "0:34:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 620, "total_steps": 3665, "loss": 2.1229, "learning_rate": 7.453481287314469e-05, "epoch": 0.8458390177353342, "percentage": 16.92, "elapsed_time": "0:07:00", "remaining_time": "0:34:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 630, "total_steps": 3665, "loss": 2.1562, "learning_rate": 7.436054150416777e-05, "epoch": 0.859481582537517, "percentage": 17.19, "elapsed_time": "0:07:07", "remaining_time": "0:34:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 640, "total_steps": 3665, "loss": 2.2563, "learning_rate": 7.418374543898328e-05, "epoch": 0.8731241473396999, "percentage": 17.46, "elapsed_time": "0:07:14", "remaining_time": "0:34:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 650, "total_steps": 3665, "loss": 2.0738, "learning_rate": 7.400443766796728e-05, "epoch": 0.8867667121418826, "percentage": 17.74, "elapsed_time": "0:07:20", "remaining_time": "0:34:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 660, "total_steps": 3665, "loss": 1.9363, "learning_rate": 7.382263136604744e-05, "epoch": 0.9004092769440655, "percentage": 18.01, "elapsed_time": "0:07:27", "remaining_time": "0:33:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 670, "total_steps": 3665, "loss": 2.3014, "learning_rate": 7.363833989173504e-05, "epoch": 0.9140518417462483, "percentage": 18.28, "elapsed_time": "0:07:34", "remaining_time": "0:33:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 680, "total_steps": 3665, "loss": 2.1957, "learning_rate": 7.34515767861434e-05, "epoch": 0.927694406548431, "percentage": 18.55, "elapsed_time": "0:07:40", "remaining_time": "0:33:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 690, "total_steps": 3665, "loss": 2.4058, "learning_rate": 7.326235577199292e-05, "epoch": 0.9413369713506139, "percentage": 18.83, "elapsed_time": "0:07:47", "remaining_time": "0:33:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 700, "total_steps": 3665, "loss": 2.0714, "learning_rate": 7.307069075260283e-05, "epoch": 0.9549795361527967, "percentage": 19.1, "elapsed_time": "0:07:54", "remaining_time": "0:33:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 710, "total_steps": 3665, "loss": 2.0244, "learning_rate": 7.287659581086957e-05, "epoch": 0.9686221009549796, "percentage": 19.37, "elapsed_time": "0:08:00", "remaining_time": "0:33:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 720, "total_steps": 3665, "loss": 2.1891, "learning_rate": 7.268008520823203e-05, "epoch": 0.9822646657571623, "percentage": 19.65, "elapsed_time": "0:08:07", "remaining_time": "0:33:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 730, "total_steps": 3665, "loss": 2.0008, "learning_rate": 7.248117338362371e-05, "epoch": 0.9959072305593452, "percentage": 19.92, "elapsed_time": "0:08:13", "remaining_time": "0:33:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 740, "total_steps": 3665, "loss": 1.7823, "learning_rate": 7.227987495241174e-05, "epoch": 1.009549795361528, "percentage": 20.19, "elapsed_time": "0:08:20", "remaining_time": "0:33:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 750, "total_steps": 3665, "loss": 1.7272, "learning_rate": 7.207620470532302e-05, "epoch": 1.0231923601637107, "percentage": 20.46, "elapsed_time": "0:08:27", "remaining_time": "0:32:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 760, "total_steps": 3665, "loss": 1.7809, "learning_rate": 7.187017760735748e-05, "epoch": 1.0368349249658937, "percentage": 20.74, "elapsed_time": "0:08:35", "remaining_time": "0:32:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 770, "total_steps": 3665, "loss": 1.5226, "learning_rate": 7.166180879668843e-05, "epoch": 1.0504774897680764, "percentage": 21.01, "elapsed_time": "0:08:41", "remaining_time": "0:32:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 780, "total_steps": 3665, "loss": 1.6743, "learning_rate": 7.145111358355031e-05, "epoch": 1.0641200545702592, "percentage": 21.28, "elapsed_time": "0:08:48", "remaining_time": "0:32:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 790, "total_steps": 3665, "loss": 1.3974, "learning_rate": 7.123810744911376e-05, "epoch": 1.077762619372442, "percentage": 21.56, "elapsed_time": "0:08:55", "remaining_time": "0:32:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 800, "total_steps": 3665, "loss": 1.4882, "learning_rate": 7.102280604434805e-05, "epoch": 1.0914051841746248, "percentage": 21.83, "elapsed_time": "0:09:01", "remaining_time": "0:32:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 810, "total_steps": 3665, "loss": 1.8217, "learning_rate": 7.080522518887116e-05, "epoch": 1.1050477489768076, "percentage": 22.1, "elapsed_time": "0:09:08", "remaining_time": "0:32:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 820, "total_steps": 3665, "loss": 1.5443, "learning_rate": 7.058538086978738e-05, "epoch": 1.1186903137789905, "percentage": 22.37, "elapsed_time": "0:09:15", "remaining_time": "0:32:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 830, "total_steps": 3665, "loss": 1.426, "learning_rate": 7.036328924051266e-05, "epoch": 1.1323328785811733, "percentage": 22.65, "elapsed_time": "0:09:22", "remaining_time": "0:31:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 840, "total_steps": 3665, "loss": 1.6086, "learning_rate": 7.013896661958766e-05, "epoch": 1.145975443383356, "percentage": 22.92, "elapsed_time": "0:09:28", "remaining_time": "0:31:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 850, "total_steps": 3665, "loss": 1.64, "learning_rate": 6.991242948947879e-05, "epoch": 1.159618008185539, "percentage": 23.19, "elapsed_time": "0:09:34", "remaining_time": "0:31:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 860, "total_steps": 3665, "loss": 1.6026, "learning_rate": 6.968369449536705e-05, "epoch": 1.1732605729877217, "percentage": 23.47, "elapsed_time": "0:09:41", "remaining_time": "0:31:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 870, "total_steps": 3665, "loss": 1.5026, "learning_rate": 6.945277844392504e-05, "epoch": 1.1869031377899044, "percentage": 23.74, "elapsed_time": "0:09:47", "remaining_time": "0:31:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 880, "total_steps": 3665, "loss": 1.6705, "learning_rate": 6.921969830208212e-05, "epoch": 1.2005457025920874, "percentage": 24.01, "elapsed_time": "0:09:54", "remaining_time": "0:31:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 890, "total_steps": 3665, "loss": 1.6982, "learning_rate": 6.898447119577764e-05, "epoch": 1.21418826739427, "percentage": 24.28, "elapsed_time": "0:10:01", "remaining_time": "0:31:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 900, "total_steps": 3665, "loss": 1.2631, "learning_rate": 6.874711440870264e-05, "epoch": 1.2278308321964528, "percentage": 24.56, "elapsed_time": "0:10:08", "remaining_time": "0:31:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 910, "total_steps": 3665, "loss": 1.5005, "learning_rate": 6.85076453810299e-05, "epoch": 1.2414733969986358, "percentage": 24.83, "elapsed_time": "0:10:15", "remaining_time": "0:31:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 920, "total_steps": 3665, "loss": 1.6076, "learning_rate": 6.826608170813243e-05, "epoch": 1.2551159618008185, "percentage": 25.1, "elapsed_time": "0:10:21", "remaining_time": "0:30:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 930, "total_steps": 3665, "loss": 1.7727, "learning_rate": 6.802244113929075e-05, "epoch": 1.2687585266030013, "percentage": 25.38, "elapsed_time": "0:10:28", "remaining_time": "0:30:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 940, "total_steps": 3665, "loss": 1.6125, "learning_rate": 6.777674157638862e-05, "epoch": 1.2824010914051842, "percentage": 25.65, "elapsed_time": "0:10:35", "remaining_time": "0:30:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 950, "total_steps": 3665, "loss": 1.4289, "learning_rate": 6.75290010725977e-05, "epoch": 1.296043656207367, "percentage": 25.92, "elapsed_time": "0:10:42", "remaining_time": "0:30:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 960, "total_steps": 3665, "loss": 1.6043, "learning_rate": 6.727923783105111e-05, "epoch": 1.30968622100955, "percentage": 26.19, "elapsed_time": "0:10:48", "remaining_time": "0:30:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 970, "total_steps": 3665, "loss": 1.6637, "learning_rate": 6.702747020350586e-05, "epoch": 1.3233287858117326, "percentage": 26.47, "elapsed_time": "0:10:55", "remaining_time": "0:30:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 980, "total_steps": 3665, "loss": 1.717, "learning_rate": 6.677371668899448e-05, "epoch": 1.3369713506139154, "percentage": 26.74, "elapsed_time": "0:11:02", "remaining_time": "0:30:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 990, "total_steps": 3665, "loss": 1.572, "learning_rate": 6.651799593246569e-05, "epoch": 1.350613915416098, "percentage": 27.01, "elapsed_time": "0:11:09", "remaining_time": "0:30:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1000, "total_steps": 3665, "loss": 1.6264, "learning_rate": 6.626032672341458e-05, "epoch": 1.364256480218281, "percentage": 27.29, "elapsed_time": "0:11:15", "remaining_time": "0:30:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1010, "total_steps": 3665, "loss": 1.5057, "learning_rate": 6.600072799450186e-05, "epoch": 1.3778990450204638, "percentage": 27.56, "elapsed_time": "0:11:22", "remaining_time": "0:29:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1020, "total_steps": 3665, "loss": 1.6963, "learning_rate": 6.573921882016284e-05, "epoch": 1.3915416098226467, "percentage": 27.83, "elapsed_time": "0:11:29", "remaining_time": "0:29:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1030, "total_steps": 3665, "loss": 1.3956, "learning_rate": 6.547581841520589e-05, "epoch": 1.4051841746248295, "percentage": 28.1, "elapsed_time": "0:11:35", "remaining_time": "0:29:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1040, "total_steps": 3665, "loss": 1.469, "learning_rate": 6.521054613340064e-05, "epoch": 1.4188267394270122, "percentage": 28.38, "elapsed_time": "0:11:42", "remaining_time": "0:29:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1050, "total_steps": 3665, "loss": 1.5518, "learning_rate": 6.494342146605581e-05, "epoch": 1.4324693042291952, "percentage": 28.65, "elapsed_time": "0:11:50", "remaining_time": "0:29:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1060, "total_steps": 3665, "loss": 1.5123, "learning_rate": 6.467446404058722e-05, "epoch": 1.446111869031378, "percentage": 28.92, "elapsed_time": "0:11:57", "remaining_time": "0:29:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1070, "total_steps": 3665, "loss": 1.5065, "learning_rate": 6.44036936190755e-05, "epoch": 1.4597544338335606, "percentage": 29.2, "elapsed_time": "0:12:03", "remaining_time": "0:29:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1080, "total_steps": 3665, "loss": 1.5362, "learning_rate": 6.413113009681411e-05, "epoch": 1.4733969986357436, "percentage": 29.47, "elapsed_time": "0:12:10", "remaining_time": "0:29:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1090, "total_steps": 3665, "loss": 1.7138, "learning_rate": 6.385679350084743e-05, "epoch": 1.4870395634379263, "percentage": 29.74, "elapsed_time": "0:12:16", "remaining_time": "0:29:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1100, "total_steps": 3665, "loss": 1.6659, "learning_rate": 6.358070398849938e-05, "epoch": 1.500682128240109, "percentage": 30.01, "elapsed_time": "0:12:23", "remaining_time": "0:28:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1110, "total_steps": 3665, "loss": 1.6374, "learning_rate": 6.330288184589216e-05, "epoch": 1.514324693042292, "percentage": 30.29, "elapsed_time": "0:12:29", "remaining_time": "0:28:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1120, "total_steps": 3665, "loss": 1.6296, "learning_rate": 6.30233474864558e-05, "epoch": 1.5279672578444747, "percentage": 30.56, "elapsed_time": "0:12:36", "remaining_time": "0:28:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1130, "total_steps": 3665, "loss": 1.6491, "learning_rate": 6.274212144942824e-05, "epoch": 1.5416098226466577, "percentage": 30.83, "elapsed_time": "0:12:43", "remaining_time": "0:28:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1140, "total_steps": 3665, "loss": 1.6309, "learning_rate": 6.245922439834612e-05, "epoch": 1.5552523874488404, "percentage": 31.11, "elapsed_time": "0:12:50", "remaining_time": "0:28:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1150, "total_steps": 3665, "loss": 1.5365, "learning_rate": 6.217467711952658e-05, "epoch": 1.5688949522510232, "percentage": 31.38, "elapsed_time": "0:12:57", "remaining_time": "0:28:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1160, "total_steps": 3665, "loss": 1.493, "learning_rate": 6.188850052053985e-05, "epoch": 1.5825375170532059, "percentage": 31.65, "elapsed_time": "0:13:04", "remaining_time": "0:28:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1170, "total_steps": 3665, "loss": 1.6771, "learning_rate": 6.160071562867316e-05, "epoch": 1.5961800818553888, "percentage": 31.92, "elapsed_time": "0:13:11", "remaining_time": "0:28:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1180, "total_steps": 3665, "loss": 1.5381, "learning_rate": 6.131134358938559e-05, "epoch": 1.6098226466575716, "percentage": 32.2, "elapsed_time": "0:13:18", "remaining_time": "0:28:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1190, "total_steps": 3665, "loss": 1.4791, "learning_rate": 6.1020405664754455e-05, "epoch": 1.6234652114597545, "percentage": 32.47, "elapsed_time": "0:13:24", "remaining_time": "0:27:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1200, "total_steps": 3665, "loss": 1.5296, "learning_rate": 6.0727923231913035e-05, "epoch": 1.6371077762619373, "percentage": 32.74, "elapsed_time": "0:13:32", "remaining_time": "0:27:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1210, "total_steps": 3665, "loss": 1.4165, "learning_rate": 6.04339177814798e-05, "epoch": 1.65075034106412, "percentage": 33.02, "elapsed_time": "0:13:39", "remaining_time": "0:27:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1220, "total_steps": 3665, "loss": 1.5694, "learning_rate": 6.013841091597947e-05, "epoch": 1.6643929058663027, "percentage": 33.29, "elapsed_time": "0:13:45", "remaining_time": "0:27:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1230, "total_steps": 3665, "loss": 1.6024, "learning_rate": 5.9841424348255596e-05, "epoch": 1.6780354706684857, "percentage": 33.56, "elapsed_time": "0:13:52", "remaining_time": "0:27:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1240, "total_steps": 3665, "loss": 1.499, "learning_rate": 5.954297989987526e-05, "epoch": 1.6916780354706686, "percentage": 33.83, "elapsed_time": "0:13:59", "remaining_time": "0:27:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1250, "total_steps": 3665, "loss": 1.5177, "learning_rate": 5.924309949952565e-05, "epoch": 1.7053206002728514, "percentage": 34.11, "elapsed_time": "0:14:06", "remaining_time": "0:27:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1260, "total_steps": 3665, "loss": 1.4564, "learning_rate": 5.8941805181402886e-05, "epoch": 1.718963165075034, "percentage": 34.38, "elapsed_time": "0:14:12", "remaining_time": "0:27:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1270, "total_steps": 3665, "loss": 1.3263, "learning_rate": 5.8639119083592954e-05, "epoch": 1.7326057298772168, "percentage": 34.65, "elapsed_time": "0:14:19", "remaining_time": "0:27:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1280, "total_steps": 3665, "loss": 1.6518, "learning_rate": 5.833506344644507e-05, "epoch": 1.7462482946793996, "percentage": 34.92, "elapsed_time": "0:14:26", "remaining_time": "0:26:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1290, "total_steps": 3665, "loss": 1.4169, "learning_rate": 5.802966061093762e-05, "epoch": 1.7598908594815825, "percentage": 35.2, "elapsed_time": "0:14:33", "remaining_time": "0:26:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1300, "total_steps": 3665, "loss": 1.4631, "learning_rate": 5.7722933017036515e-05, "epoch": 1.7735334242837655, "percentage": 35.47, "elapsed_time": "0:14:39", "remaining_time": "0:26:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1310, "total_steps": 3665, "loss": 1.5939, "learning_rate": 5.741490320204644e-05, "epoch": 1.7871759890859482, "percentage": 35.74, "elapsed_time": "0:14:47", "remaining_time": "0:26:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1320, "total_steps": 3665, "loss": 1.4775, "learning_rate": 5.7105593798954895e-05, "epoch": 1.800818553888131, "percentage": 36.02, "elapsed_time": "0:14:53", "remaining_time": "0:26:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1330, "total_steps": 3665, "loss": 1.6513, "learning_rate": 5.679502753476913e-05, "epoch": 1.8144611186903137, "percentage": 36.29, "elapsed_time": "0:15:00", "remaining_time": "0:26:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1340, "total_steps": 3665, "loss": 1.6092, "learning_rate": 5.648322722884635e-05, "epoch": 1.8281036834924966, "percentage": 36.56, "elapsed_time": "0:15:07", "remaining_time": "0:26:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1350, "total_steps": 3665, "loss": 1.5116, "learning_rate": 5.6170215791216926e-05, "epoch": 1.8417462482946794, "percentage": 36.83, "elapsed_time": "0:15:13", "remaining_time": "0:26:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1360, "total_steps": 3665, "loss": 1.3667, "learning_rate": 5.58560162209011e-05, "epoch": 1.8553888130968623, "percentage": 37.11, "elapsed_time": "0:15:20", "remaining_time": "0:25:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1370, "total_steps": 3665, "loss": 1.4584, "learning_rate": 5.554065160421907e-05, "epoch": 1.869031377899045, "percentage": 37.38, "elapsed_time": "0:15:26", "remaining_time": "0:25:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1380, "total_steps": 3665, "loss": 1.7889, "learning_rate": 5.522414511309472e-05, "epoch": 1.8826739427012278, "percentage": 37.65, "elapsed_time": "0:15:34", "remaining_time": "0:25:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1390, "total_steps": 3665, "loss": 1.5623, "learning_rate": 5.490652000335297e-05, "epoch": 1.8963165075034105, "percentage": 37.93, "elapsed_time": "0:15:40", "remaining_time": "0:25:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1400, "total_steps": 3665, "loss": 1.5508, "learning_rate": 5.461972027286809e-05, "epoch": 1.9099590723055935, "percentage": 38.2, "elapsed_time": "0:15:47", "remaining_time": "0:25:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1410, "total_steps": 3665, "loss": 1.4951, "learning_rate": 5.430003415054097e-05, "epoch": 1.9236016371077762, "percentage": 38.47, "elapsed_time": "0:15:53", "remaining_time": "0:25:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1420, "total_steps": 3665, "loss": 1.601, "learning_rate": 5.397929731013993e-05, "epoch": 1.9372442019099592, "percentage": 38.74, "elapsed_time": "0:16:00", "remaining_time": "0:25:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1430, "total_steps": 3665, "loss": 1.5427, "learning_rate": 5.365753331832165e-05, "epoch": 1.950886766712142, "percentage": 39.02, "elapsed_time": "0:16:06", "remaining_time": "0:25:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1440, "total_steps": 3665, "loss": 1.4017, "learning_rate": 5.3334765817214407e-05, "epoch": 1.9645293315143246, "percentage": 39.29, "elapsed_time": "0:16:13", "remaining_time": "0:25:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1450, "total_steps": 3665, "loss": 1.6255, "learning_rate": 5.301101852268093e-05, "epoch": 1.9781718963165074, "percentage": 39.56, "elapsed_time": "0:16:19", "remaining_time": "0:24:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1460, "total_steps": 3665, "loss": 1.5628, "learning_rate": 5.268631522257586e-05, "epoch": 1.9918144611186903, "percentage": 39.84, "elapsed_time": "0:16:26", "remaining_time": "0:24:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1470, "total_steps": 3665, "loss": 1.2903, "learning_rate": 5.23606797749979e-05, "epoch": 2.0054570259208733, "percentage": 40.11, "elapsed_time": "0:16:34", "remaining_time": "0:24:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1480, "total_steps": 3665, "loss": 0.8694, "learning_rate": 5.2034136106536784e-05, "epoch": 2.019099590723056, "percentage": 40.38, "elapsed_time": "0:16:41", "remaining_time": "0:24:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1490, "total_steps": 3665, "loss": 1.0926, "learning_rate": 5.1706708210515225e-05, "epoch": 2.0327421555252387, "percentage": 40.65, "elapsed_time": "0:16:50", "remaining_time": "0:24:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1500, "total_steps": 3665, "loss": 0.9019, "learning_rate": 5.1378420145226e-05, "epoch": 2.0463847203274215, "percentage": 40.93, "elapsed_time": "0:16:56", "remaining_time": "0:24:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1510, "total_steps": 3665, "loss": 0.9077, "learning_rate": 5.104929603216422e-05, "epoch": 2.060027285129604, "percentage": 41.2, "elapsed_time": "0:17:03", "remaining_time": "0:24:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1520, "total_steps": 3665, "loss": 0.8833, "learning_rate": 5.0719360054254925e-05, "epoch": 2.0736698499317874, "percentage": 41.47, "elapsed_time": "0:17:10", "remaining_time": "0:24:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1530, "total_steps": 3665, "loss": 0.8182, "learning_rate": 5.0388636454076256e-05, "epoch": 2.08731241473397, "percentage": 41.75, "elapsed_time": "0:17:17", "remaining_time": "0:24:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1540, "total_steps": 3665, "loss": 0.7097, "learning_rate": 5.0057149532078165e-05, "epoch": 2.100954979536153, "percentage": 42.02, "elapsed_time": "0:17:23", "remaining_time": "0:24:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1550, "total_steps": 3665, "loss": 0.8243, "learning_rate": 4.9724923644796904e-05, "epoch": 2.1145975443383356, "percentage": 42.29, "elapsed_time": "0:17:30", "remaining_time": "0:23:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1560, "total_steps": 3665, "loss": 0.8468, "learning_rate": 4.939198320306537e-05, "epoch": 2.1282401091405183, "percentage": 42.56, "elapsed_time": "0:17:36", "remaining_time": "0:23:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1570, "total_steps": 3665, "loss": 0.8348, "learning_rate": 4.9058352670219576e-05, "epoch": 2.141882673942701, "percentage": 42.84, "elapsed_time": "0:17:43", "remaining_time": "0:23:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1580, "total_steps": 3665, "loss": 0.9292, "learning_rate": 4.872405656030099e-05, "epoch": 2.155525238744884, "percentage": 43.11, "elapsed_time": "0:17:51", "remaining_time": "0:23:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1590, "total_steps": 3665, "loss": 0.7706, "learning_rate": 4.83891194362555e-05, "epoch": 2.169167803547067, "percentage": 43.38, "elapsed_time": "0:17:57", "remaining_time": "0:23:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1600, "total_steps": 3665, "loss": 0.8487, "learning_rate": 4.805356590812852e-05, "epoch": 2.1828103683492497, "percentage": 43.66, "elapsed_time": "0:18:03", "remaining_time": "0:23:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1610, "total_steps": 3665, "loss": 0.8509, "learning_rate": 4.771742063125674e-05, "epoch": 2.1964529331514324, "percentage": 43.93, "elapsed_time": "0:18:10", "remaining_time": "0:23:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1620, "total_steps": 3665, "loss": 0.8833, "learning_rate": 4.7380708304456554e-05, "epoch": 2.210095497953615, "percentage": 44.2, "elapsed_time": "0:18:17", "remaining_time": "0:23:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1630, "total_steps": 3665, "loss": 0.8968, "learning_rate": 4.704345366820927e-05, "epoch": 2.223738062755798, "percentage": 44.47, "elapsed_time": "0:18:24", "remaining_time": "0:22:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1640, "total_steps": 3665, "loss": 0.9044, "learning_rate": 4.670568150284323e-05, "epoch": 2.237380627557981, "percentage": 44.75, "elapsed_time": "0:18:31", "remaining_time": "0:22:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1650, "total_steps": 3665, "loss": 0.974, "learning_rate": 4.636741662671308e-05, "epoch": 2.251023192360164, "percentage": 45.02, "elapsed_time": "0:18:38", "remaining_time": "0:22:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1660, "total_steps": 3665, "loss": 0.8121, "learning_rate": 4.602868389437622e-05, "epoch": 2.2646657571623465, "percentage": 45.29, "elapsed_time": "0:18:44", "remaining_time": "0:22:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1670, "total_steps": 3665, "loss": 1.1324, "learning_rate": 4.568950819476648e-05, "epoch": 2.2783083219645293, "percentage": 45.57, "elapsed_time": "0:18:51", "remaining_time": "0:22:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1680, "total_steps": 3665, "loss": 0.8856, "learning_rate": 4.5349914449365435e-05, "epoch": 2.291950886766712, "percentage": 45.84, "elapsed_time": "0:18:58", "remaining_time": "0:22:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1690, "total_steps": 3665, "loss": 0.8276, "learning_rate": 4.500992761037129e-05, "epoch": 2.305593451568895, "percentage": 46.11, "elapsed_time": "0:19:05", "remaining_time": "0:22:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1700, "total_steps": 3665, "loss": 0.7492, "learning_rate": 4.4669572658865405e-05, "epoch": 2.319236016371078, "percentage": 46.38, "elapsed_time": "0:19:12", "remaining_time": "0:22:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1710, "total_steps": 3665, "loss": 0.9167, "learning_rate": 4.4328874602976786e-05, "epoch": 2.3328785811732606, "percentage": 46.66, "elapsed_time": "0:19:18", "remaining_time": "0:22:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1720, "total_steps": 3665, "loss": 0.9453, "learning_rate": 4.3987858476044617e-05, "epoch": 2.3465211459754434, "percentage": 46.93, "elapsed_time": "0:19:25", "remaining_time": "0:21:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1730, "total_steps": 3665, "loss": 0.8714, "learning_rate": 4.364654933477886e-05, "epoch": 2.360163710777626, "percentage": 47.2, "elapsed_time": "0:19:33", "remaining_time": "0:21:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1740, "total_steps": 3665, "loss": 0.9251, "learning_rate": 4.330497225741917e-05, "epoch": 2.373806275579809, "percentage": 47.48, "elapsed_time": "0:19:39", "remaining_time": "0:21:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1750, "total_steps": 3665, "loss": 0.9479, "learning_rate": 4.296315234189223e-05, "epoch": 2.3874488403819916, "percentage": 47.75, "elapsed_time": "0:19:46", "remaining_time": "0:21:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1760, "total_steps": 3665, "loss": 0.8346, "learning_rate": 4.262111470396766e-05, "epoch": 2.4010914051841747, "percentage": 48.02, "elapsed_time": "0:19:53", "remaining_time": "0:21:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1770, "total_steps": 3665, "loss": 0.754, "learning_rate": 4.2278884475412585e-05, "epoch": 2.4147339699863575, "percentage": 48.29, "elapsed_time": "0:20:00", "remaining_time": "0:21:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1780, "total_steps": 3665, "loss": 0.7743, "learning_rate": 4.193648680214505e-05, "epoch": 2.42837653478854, "percentage": 48.57, "elapsed_time": "0:20:06", "remaining_time": "0:21:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1790, "total_steps": 3665, "loss": 0.9273, "learning_rate": 4.159394684238635e-05, "epoch": 2.442019099590723, "percentage": 48.84, "elapsed_time": "0:20:13", "remaining_time": "0:21:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1800, "total_steps": 3665, "loss": 1.0037, "learning_rate": 4.1251289764812495e-05, "epoch": 2.4556616643929057, "percentage": 49.11, "elapsed_time": "0:20:20", "remaining_time": "0:21:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1810, "total_steps": 3665, "loss": 0.7728, "learning_rate": 4.090854074670495e-05, "epoch": 2.469304229195089, "percentage": 49.39, "elapsed_time": "0:20:26", "remaining_time": "0:20:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1820, "total_steps": 3665, "loss": 0.8098, "learning_rate": 4.056572497210066e-05, "epoch": 2.4829467939972716, "percentage": 49.66, "elapsed_time": "0:20:33", "remaining_time": "0:20:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1830, "total_steps": 3665, "loss": 0.8404, "learning_rate": 4.0222867629941554e-05, "epoch": 2.4965893587994543, "percentage": 49.93, "elapsed_time": "0:20:40", "remaining_time": "0:20:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1840, "total_steps": 3665, "loss": 0.7021, "learning_rate": 3.987999391222389e-05, "epoch": 2.510231923601637, "percentage": 50.2, "elapsed_time": "0:20:46", "remaining_time": "0:20:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1850, "total_steps": 3665, "loss": 0.9656, "learning_rate": 3.953712901214707e-05, "epoch": 2.52387448840382, "percentage": 50.48, "elapsed_time": "0:20:54", "remaining_time": "0:20:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1860, "total_steps": 3665, "loss": 0.7487, "learning_rate": 3.9194298122262666e-05, "epoch": 2.5375170532060025, "percentage": 50.75, "elapsed_time": "0:21:00", "remaining_time": "0:20:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1870, "total_steps": 3665, "loss": 0.8693, "learning_rate": 3.8851526432623254e-05, "epoch": 2.5511596180081857, "percentage": 51.02, "elapsed_time": "0:21:06", "remaining_time": "0:20:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1880, "total_steps": 3665, "loss": 0.8933, "learning_rate": 3.850883912893158e-05, "epoch": 2.5648021828103684, "percentage": 51.3, "elapsed_time": "0:21:13", "remaining_time": "0:20:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1890, "total_steps": 3665, "loss": 0.7098, "learning_rate": 3.816626139069004e-05, "epoch": 2.578444747612551, "percentage": 51.57, "elapsed_time": "0:21:19", "remaining_time": "0:20:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1900, "total_steps": 3665, "loss": 0.8742, "learning_rate": 3.782381838935047e-05, "epoch": 2.592087312414734, "percentage": 51.84, "elapsed_time": "0:21:26", "remaining_time": "0:19:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1910, "total_steps": 3665, "loss": 0.7846, "learning_rate": 3.748153528646472e-05, "epoch": 2.6057298772169166, "percentage": 52.11, "elapsed_time": "0:21:33", "remaining_time": "0:19:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1920, "total_steps": 3665, "loss": 0.9032, "learning_rate": 3.713943723183587e-05, "epoch": 2.6193724420191, "percentage": 52.39, "elapsed_time": "0:21:39", "remaining_time": "0:19:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1930, "total_steps": 3665, "loss": 0.8044, "learning_rate": 3.6797549361670257e-05, "epoch": 2.6330150068212825, "percentage": 52.66, "elapsed_time": "0:21:45", "remaining_time": "0:19:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1940, "total_steps": 3665, "loss": 0.8528, "learning_rate": 3.6455896796730554e-05, "epoch": 2.6466575716234653, "percentage": 52.93, "elapsed_time": "0:21:52", "remaining_time": "0:19:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1950, "total_steps": 3665, "loss": 0.9294, "learning_rate": 3.611450464049005e-05, "epoch": 2.660300136425648, "percentage": 53.21, "elapsed_time": "0:21:58", "remaining_time": "0:19:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1960, "total_steps": 3665, "loss": 0.9441, "learning_rate": 3.577339797728805e-05, "epoch": 2.6739427012278307, "percentage": 53.48, "elapsed_time": "0:22:06", "remaining_time": "0:19:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1970, "total_steps": 3665, "loss": 0.8572, "learning_rate": 3.5432601870486795e-05, "epoch": 2.6875852660300135, "percentage": 53.75, "elapsed_time": "0:22:12", "remaining_time": "0:19:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1980, "total_steps": 3665, "loss": 0.9912, "learning_rate": 3.509214136062993e-05, "epoch": 2.701227830832196, "percentage": 54.02, "elapsed_time": "0:22:19", "remaining_time": "0:19:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1990, "total_steps": 3665, "loss": 0.9876, "learning_rate": 3.475204146360254e-05, "epoch": 2.7148703956343794, "percentage": 54.3, "elapsed_time": "0:22:26", "remaining_time": "0:18:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2000, "total_steps": 3665, "loss": 0.8796, "learning_rate": 3.44123271687931e-05, "epoch": 2.728512960436562, "percentage": 54.57, "elapsed_time": "0:22:33", "remaining_time": "0:18:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2010, "total_steps": 3665, "loss": 0.8394, "learning_rate": 3.407302343725737e-05, "epoch": 2.742155525238745, "percentage": 54.84, "elapsed_time": "0:22:39", "remaining_time": "0:18:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2020, "total_steps": 3665, "loss": 0.7603, "learning_rate": 3.3734155199884275e-05, "epoch": 2.7557980900409276, "percentage": 55.12, "elapsed_time": "0:22:46", "remaining_time": "0:18:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2030, "total_steps": 3665, "loss": 0.8944, "learning_rate": 3.339574735556412e-05, "epoch": 2.7694406548431107, "percentage": 55.39, "elapsed_time": "0:22:53", "remaining_time": "0:18:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2040, "total_steps": 3665, "loss": 0.9737, "learning_rate": 3.3057824769359104e-05, "epoch": 2.7830832196452935, "percentage": 55.66, "elapsed_time": "0:23:00", "remaining_time": "0:18:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2050, "total_steps": 3665, "loss": 0.9483, "learning_rate": 3.2720412270676275e-05, "epoch": 2.796725784447476, "percentage": 55.93, "elapsed_time": "0:23:07", "remaining_time": "0:18:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2060, "total_steps": 3665, "loss": 0.9254, "learning_rate": 3.2383534651443206e-05, "epoch": 2.810368349249659, "percentage": 56.21, "elapsed_time": "0:23:13", "remaining_time": "0:18:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2070, "total_steps": 3665, "loss": 0.7472, "learning_rate": 3.204721666428631e-05, "epoch": 2.8240109140518417, "percentage": 56.48, "elapsed_time": "0:23:20", "remaining_time": "0:17:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2080, "total_steps": 3665, "loss": 0.8689, "learning_rate": 3.171148302071215e-05, "epoch": 2.8376534788540244, "percentage": 56.75, "elapsed_time": "0:23:27", "remaining_time": "0:17:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2090, "total_steps": 3665, "loss": 0.7493, "learning_rate": 3.137635838929169e-05, "epoch": 2.851296043656207, "percentage": 57.03, "elapsed_time": "0:23:33", "remaining_time": "0:17:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2100, "total_steps": 3665, "loss": 1.0867, "learning_rate": 3.1041867393847764e-05, "epoch": 2.8649386084583903, "percentage": 57.3, "elapsed_time": "0:23:41", "remaining_time": "0:17:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2110, "total_steps": 3665, "loss": 0.9846, "learning_rate": 3.070803461164575e-05, "epoch": 2.878581173260573, "percentage": 57.57, "elapsed_time": "0:23:48", "remaining_time": "0:17:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2120, "total_steps": 3665, "loss": 0.7862, "learning_rate": 3.0374884571587776e-05, "epoch": 2.892223738062756, "percentage": 57.84, "elapsed_time": "0:23:55", "remaining_time": "0:17:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2130, "total_steps": 3665, "loss": 1.0586, "learning_rate": 3.004244175241038e-05, "epoch": 2.9058663028649385, "percentage": 58.12, "elapsed_time": "0:24:01", "remaining_time": "0:17:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2140, "total_steps": 3665, "loss": 0.8757, "learning_rate": 2.971073058088587e-05, "epoch": 2.9195088676671213, "percentage": 58.39, "elapsed_time": "0:24:08", "remaining_time": "0:17:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2150, "total_steps": 3665, "loss": 0.9026, "learning_rate": 2.937977543002764e-05, "epoch": 2.9331514324693044, "percentage": 58.66, "elapsed_time": "0:24:15", "remaining_time": "0:17:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2160, "total_steps": 3665, "loss": 0.8864, "learning_rate": 2.9049600617299188e-05, "epoch": 2.946793997271487, "percentage": 58.94, "elapsed_time": "0:24:22", "remaining_time": "0:16:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2170, "total_steps": 3665, "loss": 0.8224, "learning_rate": 2.872023040282739e-05, "epoch": 2.96043656207367, "percentage": 59.21, "elapsed_time": "0:24:29", "remaining_time": "0:16:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2180, "total_steps": 3665, "loss": 0.794, "learning_rate": 2.8391688987620045e-05, "epoch": 2.9740791268758526, "percentage": 59.48, "elapsed_time": "0:24:35", "remaining_time": "0:16:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2190, "total_steps": 3665, "loss": 0.9792, "learning_rate": 2.8064000511787523e-05, "epoch": 2.9877216916780354, "percentage": 59.75, "elapsed_time": "0:24:42", "remaining_time": "0:16:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2200, "total_steps": 3665, "loss": 0.7812, "learning_rate": 2.77371890527691e-05, "epoch": 3.001364256480218, "percentage": 60.03, "elapsed_time": "0:24:50", "remaining_time": "0:16:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2210, "total_steps": 3665, "loss": 0.496, "learning_rate": 2.741127862356389e-05, "epoch": 3.0150068212824013, "percentage": 60.3, "elapsed_time": "0:24:57", "remaining_time": "0:16:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2220, "total_steps": 3665, "loss": 0.3416, "learning_rate": 2.7086293170966312e-05, "epoch": 3.028649386084584, "percentage": 60.57, "elapsed_time": "0:25:03", "remaining_time": "0:16:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2230, "total_steps": 3665, "loss": 0.3462, "learning_rate": 2.6762256573806664e-05, "epoch": 3.0422919508867667, "percentage": 60.85, "elapsed_time": "0:25:10", "remaining_time": "0:16:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2240, "total_steps": 3665, "loss": 0.4756, "learning_rate": 2.6439192641196583e-05, "epoch": 3.0559345156889495, "percentage": 61.12, "elapsed_time": "0:25:17", "remaining_time": "0:16:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2250, "total_steps": 3665, "loss": 0.357, "learning_rate": 2.611712511077959e-05, "epoch": 3.069577080491132, "percentage": 61.39, "elapsed_time": "0:25:24", "remaining_time": "0:15:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2260, "total_steps": 3665, "loss": 0.3361, "learning_rate": 2.5796077646986922e-05, "epoch": 3.083219645293315, "percentage": 61.66, "elapsed_time": "0:25:31", "remaining_time": "0:15:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2270, "total_steps": 3665, "loss": 0.419, "learning_rate": 2.5476073839298857e-05, "epoch": 3.096862210095498, "percentage": 61.94, "elapsed_time": "0:25:37", "remaining_time": "0:15:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2280, "total_steps": 3665, "loss": 0.4211, "learning_rate": 2.5157137200511253e-05, "epoch": 3.110504774897681, "percentage": 62.21, "elapsed_time": "0:25:45", "remaining_time": "0:15:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2290, "total_steps": 3665, "loss": 0.5248, "learning_rate": 2.4839291165008073e-05, "epoch": 3.1241473396998636, "percentage": 62.48, "elapsed_time": "0:25:52", "remaining_time": "0:15:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2300, "total_steps": 3665, "loss": 0.3983, "learning_rate": 2.452255908703945e-05, "epoch": 3.1377899045020463, "percentage": 62.76, "elapsed_time": "0:25:59", "remaining_time": "0:15:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2310, "total_steps": 3665, "loss": 0.3728, "learning_rate": 2.420696423900567e-05, "epoch": 3.151432469304229, "percentage": 63.03, "elapsed_time": "0:26:07", "remaining_time": "0:15:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2320, "total_steps": 3665, "loss": 0.4099, "learning_rate": 2.3892529809747195e-05, "epoch": 3.1650750341064118, "percentage": 63.3, "elapsed_time": "0:26:13", "remaining_time": "0:15:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2330, "total_steps": 3665, "loss": 0.5466, "learning_rate": 2.35792789028409e-05, "epoch": 3.178717598908595, "percentage": 63.57, "elapsed_time": "0:26:21", "remaining_time": "0:15:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2340, "total_steps": 3665, "loss": 0.3956, "learning_rate": 2.32672345349024e-05, "epoch": 3.1923601637107777, "percentage": 63.85, "elapsed_time": "0:26:28", "remaining_time": "0:14:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2350, "total_steps": 3665, "loss": 0.2686, "learning_rate": 2.2956419633894922e-05, "epoch": 3.2060027285129604, "percentage": 64.12, "elapsed_time": "0:26:35", "remaining_time": "0:14:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2360, "total_steps": 3665, "loss": 0.3545, "learning_rate": 2.264685703744466e-05, "epoch": 3.219645293315143, "percentage": 64.39, "elapsed_time": "0:26:42", "remaining_time": "0:14:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2370, "total_steps": 3665, "loss": 0.4361, "learning_rate": 2.2338569491162688e-05, "epoch": 3.233287858117326, "percentage": 64.67, "elapsed_time": "0:26:48", "remaining_time": "0:14:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2380, "total_steps": 3665, "loss": 0.4616, "learning_rate": 2.2031579646973662e-05, "epoch": 3.246930422919509, "percentage": 64.94, "elapsed_time": "0:26:55", "remaining_time": "0:14:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2390, "total_steps": 3665, "loss": 0.4095, "learning_rate": 2.1725910061451582e-05, "epoch": 3.260572987721692, "percentage": 65.21, "elapsed_time": "0:27:03", "remaining_time": "0:14:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2400, "total_steps": 3665, "loss": 0.4428, "learning_rate": 2.1421583194162237e-05, "epoch": 3.2742155525238745, "percentage": 65.48, "elapsed_time": "0:27:09", "remaining_time": "0:14:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2410, "total_steps": 3665, "loss": 0.4946, "learning_rate": 2.1118621406013045e-05, "epoch": 3.2878581173260573, "percentage": 65.76, "elapsed_time": "0:27:16", "remaining_time": "0:14:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2420, "total_steps": 3665, "loss": 0.3676, "learning_rate": 2.0817046957610073e-05, "epoch": 3.30150068212824, "percentage": 66.03, "elapsed_time": "0:27:23", "remaining_time": "0:14:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2430, "total_steps": 3665, "loss": 0.4319, "learning_rate": 2.0516882007622318e-05, "epoch": 3.3151432469304227, "percentage": 66.3, "elapsed_time": "0:27:30", "remaining_time": "0:13:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2440, "total_steps": 3665, "loss": 0.3973, "learning_rate": 2.0218148611153614e-05, "epoch": 3.328785811732606, "percentage": 66.58, "elapsed_time": "0:27:36", "remaining_time": "0:13:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2450, "total_steps": 3665, "loss": 0.3728, "learning_rate": 1.99208687181221e-05, "epoch": 3.3424283765347886, "percentage": 66.85, "elapsed_time": "0:27:43", "remaining_time": "0:13:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2460, "total_steps": 3665, "loss": 0.4029, "learning_rate": 1.9625064171647403e-05, "epoch": 3.3560709413369714, "percentage": 67.12, "elapsed_time": "0:27:50", "remaining_time": "0:13:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2470, "total_steps": 3665, "loss": 0.5182, "learning_rate": 1.933075670644566e-05, "epoch": 3.369713506139154, "percentage": 67.39, "elapsed_time": "0:27:57", "remaining_time": "0:13:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2480, "total_steps": 3665, "loss": 0.3211, "learning_rate": 1.903796794723261e-05, "epoch": 3.383356070941337, "percentage": 67.67, "elapsed_time": "0:28:03", "remaining_time": "0:13:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2490, "total_steps": 3665, "loss": 0.3218, "learning_rate": 1.8746719407134558e-05, "epoch": 3.39699863574352, "percentage": 67.94, "elapsed_time": "0:28:09", "remaining_time": "0:13:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2500, "total_steps": 3665, "loss": 0.3561, "learning_rate": 1.8457032486107733e-05, "epoch": 3.4106412005457027, "percentage": 68.21, "elapsed_time": "0:28:16", "remaining_time": "0:13:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2510, "total_steps": 3665, "loss": 0.4223, "learning_rate": 1.816892846936592e-05, "epoch": 3.4242837653478855, "percentage": 68.49, "elapsed_time": "0:28:23", "remaining_time": "0:13:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2520, "total_steps": 3665, "loss": 0.2911, "learning_rate": 1.7882428525816434e-05, "epoch": 3.437926330150068, "percentage": 68.76, "elapsed_time": "0:28:29", "remaining_time": "0:12:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2530, "total_steps": 3665, "loss": 0.3991, "learning_rate": 1.759755370650472e-05, "epoch": 3.451568894952251, "percentage": 69.03, "elapsed_time": "0:28:36", "remaining_time": "0:12:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2540, "total_steps": 3665, "loss": 0.3823, "learning_rate": 1.7314324943067598e-05, "epoch": 3.4652114597544337, "percentage": 69.3, "elapsed_time": "0:28:42", "remaining_time": "0:12:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2550, "total_steps": 3665, "loss": 0.3564, "learning_rate": 1.70327630461953e-05, "epoch": 3.4788540245566164, "percentage": 69.58, "elapsed_time": "0:28:49", "remaining_time": "0:12:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2560, "total_steps": 3665, "loss": 0.4012, "learning_rate": 1.6752888704102304e-05, "epoch": 3.4924965893587996, "percentage": 69.85, "elapsed_time": "0:28:56", "remaining_time": "0:12:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2570, "total_steps": 3665, "loss": 0.3622, "learning_rate": 1.6474722481007344e-05, "epoch": 3.5061391541609823, "percentage": 70.12, "elapsed_time": "0:29:03", "remaining_time": "0:12:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2580, "total_steps": 3665, "loss": 0.3502, "learning_rate": 1.619828481562229e-05, "epoch": 3.519781718963165, "percentage": 70.4, "elapsed_time": "0:29:09", "remaining_time": "0:12:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2590, "total_steps": 3665, "loss": 0.4129, "learning_rate": 1.5923596019650517e-05, "epoch": 3.533424283765348, "percentage": 70.67, "elapsed_time": "0:29:16", "remaining_time": "0:12:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2600, "total_steps": 3665, "loss": 0.455, "learning_rate": 1.565067627629432e-05, "epoch": 3.547066848567531, "percentage": 70.94, "elapsed_time": "0:29:23", "remaining_time": "0:12:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2610, "total_steps": 3665, "loss": 0.3905, "learning_rate": 1.5379545638772032e-05, "epoch": 3.5607094133697137, "percentage": 71.21, "elapsed_time": "0:29:30", "remaining_time": "0:11:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2620, "total_steps": 3665, "loss": 0.4603, "learning_rate": 1.511022402884459e-05, "epoch": 3.5743519781718964, "percentage": 71.49, "elapsed_time": "0:29:37", "remaining_time": "0:11:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2630, "total_steps": 3665, "loss": 0.3654, "learning_rate": 1.4842731235351653e-05, "epoch": 3.587994542974079, "percentage": 71.76, "elapsed_time": "0:29:43", "remaining_time": "0:11:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2640, "total_steps": 3665, "loss": 0.4481, "learning_rate": 1.4577086912757659e-05, "epoch": 3.601637107776262, "percentage": 72.03, "elapsed_time": "0:29:49", "remaining_time": "0:11:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2650, "total_steps": 3665, "loss": 0.4829, "learning_rate": 1.4313310579707697e-05, "epoch": 3.6152796725784446, "percentage": 72.31, "elapsed_time": "0:29:56", "remaining_time": "0:11:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2660, "total_steps": 3665, "loss": 0.3937, "learning_rate": 1.405142161759327e-05, "epoch": 3.6289222373806274, "percentage": 72.58, "elapsed_time": "0:30:03", "remaining_time": "0:11:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2670, "total_steps": 3665, "loss": 0.3902, "learning_rate": 1.3791439269128274e-05, "epoch": 3.64256480218281, "percentage": 72.85, "elapsed_time": "0:30:10", "remaining_time": "0:11:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2680, "total_steps": 3665, "loss": 0.4495, "learning_rate": 1.3533382636935092e-05, "epoch": 3.6562073669849933, "percentage": 73.12, "elapsed_time": "0:30:17", "remaining_time": "0:11:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2690, "total_steps": 3665, "loss": 0.4707, "learning_rate": 1.3277270682140996e-05, "epoch": 3.669849931787176, "percentage": 73.4, "elapsed_time": "0:30:24", "remaining_time": "0:11:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2700, "total_steps": 3665, "loss": 0.4189, "learning_rate": 1.3023122222984941e-05, "epoch": 3.6834924965893587, "percentage": 73.67, "elapsed_time": "0:30:31", "remaining_time": "0:10:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2710, "total_steps": 3665, "loss": 0.3741, "learning_rate": 1.2770955933434906e-05, "epoch": 3.6971350613915415, "percentage": 73.94, "elapsed_time": "0:30:37", "remaining_time": "0:10:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2720, "total_steps": 3665, "loss": 0.3724, "learning_rate": 1.2520790341815726e-05, "epoch": 3.7107776261937246, "percentage": 74.22, "elapsed_time": "0:30:44", "remaining_time": "0:10:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2730, "total_steps": 3665, "loss": 0.4002, "learning_rate": 1.2272643829447723e-05, "epoch": 3.7244201909959074, "percentage": 74.49, "elapsed_time": "0:30:50", "remaining_time": "0:10:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2740, "total_steps": 3665, "loss": 0.4129, "learning_rate": 1.2026534629296168e-05, "epoch": 3.73806275579809, "percentage": 74.76, "elapsed_time": "0:30:57", "remaining_time": "0:10:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2750, "total_steps": 3665, "loss": 0.3354, "learning_rate": 1.1782480824631478e-05, "epoch": 3.751705320600273, "percentage": 75.03, "elapsed_time": "0:31:04", "remaining_time": "0:10:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2760, "total_steps": 3665, "loss": 0.3, "learning_rate": 1.154050034770057e-05, "epoch": 3.7653478854024556, "percentage": 75.31, "elapsed_time": "0:31:10", "remaining_time": "0:10:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2770, "total_steps": 3665, "loss": 0.4613, "learning_rate": 1.1300610978409301e-05, "epoch": 3.7789904502046383, "percentage": 75.58, "elapsed_time": "0:31:16", "remaining_time": "0:10:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2780, "total_steps": 3665, "loss": 0.3782, "learning_rate": 1.1062830343015998e-05, "epoch": 3.792633015006821, "percentage": 75.85, "elapsed_time": "0:31:23", "remaining_time": "0:09:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2790, "total_steps": 3665, "loss": 0.3154, "learning_rate": 1.0827175912836352e-05, "epoch": 3.806275579809004, "percentage": 76.13, "elapsed_time": "0:31:30", "remaining_time": "0:09:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2800, "total_steps": 3665, "loss": 0.3941, "learning_rate": 1.059366500295973e-05, "epoch": 3.819918144611187, "percentage": 76.4, "elapsed_time": "0:31:36", "remaining_time": "0:09:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2810, "total_steps": 3665, "loss": 0.4402, "learning_rate": 1.0362314770976858e-05, "epoch": 3.8335607094133697, "percentage": 76.67, "elapsed_time": "0:31:43", "remaining_time": "0:09:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2820, "total_steps": 3665, "loss": 0.3588, "learning_rate": 1.0133142215719176e-05, "epoch": 3.8472032742155524, "percentage": 76.94, "elapsed_time": "0:31:50", "remaining_time": "0:09:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2830, "total_steps": 3665, "loss": 0.4171, "learning_rate": 9.906164176009825e-06, "epoch": 3.8608458390177356, "percentage": 77.22, "elapsed_time": "0:31:57", "remaining_time": "0:09:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2840, "total_steps": 3665, "loss": 0.4008, "learning_rate": 9.681397329426363e-06, "epoch": 3.8744884038199183, "percentage": 77.49, "elapsed_time": "0:32:03", "remaining_time": "0:09:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2850, "total_steps": 3665, "loss": 0.2851, "learning_rate": 9.458858191075358e-06, "epoch": 3.888130968622101, "percentage": 77.76, "elapsed_time": "0:32:10", "remaining_time": "0:09:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2860, "total_steps": 3665, "loss": 0.486, "learning_rate": 9.238563112378967e-06, "epoch": 3.901773533424284, "percentage": 78.04, "elapsed_time": "0:32:17", "remaining_time": "0:09:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2870, "total_steps": 3665, "loss": 0.3321, "learning_rate": 9.02052827987339e-06, "epoch": 3.9154160982264665, "percentage": 78.31, "elapsed_time": "0:32:24", "remaining_time": "0:08:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2880, "total_steps": 3665, "loss": 0.2981, "learning_rate": 8.804769714019619e-06, "epoch": 3.9290586630286493, "percentage": 78.58, "elapsed_time": "0:32:30", "remaining_time": "0:08:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2890, "total_steps": 3665, "loss": 0.3412, "learning_rate": 8.591303268026293e-06, "epoch": 3.942701227830832, "percentage": 78.85, "elapsed_time": "0:32:37", "remaining_time": "0:08:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2900, "total_steps": 3665, "loss": 0.3648, "learning_rate": 8.380144626684829e-06, "epoch": 3.956343792633015, "percentage": 79.13, "elapsed_time": "0:32:43", "remaining_time": "0:08:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2910, "total_steps": 3665, "loss": 0.4028, "learning_rate": 8.171309305216973e-06, "epoch": 3.969986357435198, "percentage": 79.4, "elapsed_time": "0:32:50", "remaining_time": "0:08:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2920, "total_steps": 3665, "loss": 0.5365, "learning_rate": 7.96481264813481e-06, "epoch": 3.9836289222373806, "percentage": 79.67, "elapsed_time": "0:32:57", "remaining_time": "0:08:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2930, "total_steps": 3665, "loss": 0.3312, "learning_rate": 7.760669828113276e-06, "epoch": 3.9972714870395634, "percentage": 79.95, "elapsed_time": "0:33:03", "remaining_time": "0:08:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2940, "total_steps": 3665, "loss": 0.2586, "learning_rate": 7.558895844875325e-06, "epoch": 4.0109140518417465, "percentage": 80.22, "elapsed_time": "0:33:10", "remaining_time": "0:08:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2950, "total_steps": 3665, "loss": 0.174, "learning_rate": 7.359505524089843e-06, "epoch": 4.024556616643929, "percentage": 80.49, "elapsed_time": "0:33:17", "remaining_time": "0:08:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2960, "total_steps": 3665, "loss": 0.1319, "learning_rate": 7.162513516282236e-06, "epoch": 4.038199181446112, "percentage": 80.76, "elapsed_time": "0:33:23", "remaining_time": "0:07:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2970, "total_steps": 3665, "loss": 0.1098, "learning_rate": 6.967934295758003e-06, "epoch": 4.051841746248295, "percentage": 81.04, "elapsed_time": "0:33:30", "remaining_time": "0:07:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2980, "total_steps": 3665, "loss": 0.1351, "learning_rate": 6.775782159539237e-06, "epoch": 4.0654843110504775, "percentage": 81.31, "elapsed_time": "0:33:36", "remaining_time": "0:07:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2990, "total_steps": 3665, "loss": 0.2408, "learning_rate": 6.586071226314046e-06, "epoch": 4.07912687585266, "percentage": 81.58, "elapsed_time": "0:33:43", "remaining_time": "0:07:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3000, "total_steps": 3665, "loss": 0.1759, "learning_rate": 6.3988154353992285e-06, "epoch": 4.092769440654843, "percentage": 81.86, "elapsed_time": "0:33:50", "remaining_time": "0:07:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3010, "total_steps": 3665, "loss": 0.2398, "learning_rate": 6.214028545716071e-06, "epoch": 4.106412005457026, "percentage": 82.13, "elapsed_time": "0:33:57", "remaining_time": "0:07:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3020, "total_steps": 3665, "loss": 0.1491, "learning_rate": 6.031724134779331e-06, "epoch": 4.120054570259208, "percentage": 82.4, "elapsed_time": "0:34:04", "remaining_time": "0:07:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3030, "total_steps": 3665, "loss": 0.1711, "learning_rate": 5.851915597699638e-06, "epoch": 4.133697135061391, "percentage": 82.67, "elapsed_time": "0:34:10", "remaining_time": "0:07:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3040, "total_steps": 3665, "loss": 0.1815, "learning_rate": 5.674616146199277e-06, "epoch": 4.147339699863575, "percentage": 82.95, "elapsed_time": "0:34:17", "remaining_time": "0:07:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3050, "total_steps": 3665, "loss": 0.2796, "learning_rate": 5.499838807641413e-06, "epoch": 4.1609822646657575, "percentage": 83.22, "elapsed_time": "0:34:24", "remaining_time": "0:06:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3060, "total_steps": 3665, "loss": 0.2307, "learning_rate": 5.327596424072896e-06, "epoch": 4.17462482946794, "percentage": 83.49, "elapsed_time": "0:34:31", "remaining_time": "0:06:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3070, "total_steps": 3665, "loss": 0.1955, "learning_rate": 5.157901651280672e-06, "epoch": 4.188267394270123, "percentage": 83.77, "elapsed_time": "0:34:38", "remaining_time": "0:06:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3080, "total_steps": 3665, "loss": 0.2332, "learning_rate": 4.990766957861875e-06, "epoch": 4.201909959072306, "percentage": 84.04, "elapsed_time": "0:34:45", "remaining_time": "0:06:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3090, "total_steps": 3665, "loss": 0.1317, "learning_rate": 4.826204624307665e-06, "epoch": 4.215552523874488, "percentage": 84.31, "elapsed_time": "0:34:52", "remaining_time": "0:06:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3100, "total_steps": 3665, "loss": 0.1772, "learning_rate": 4.664226742100946e-06, "epoch": 4.229195088676671, "percentage": 84.58, "elapsed_time": "0:34:58", "remaining_time": "0:06:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3110, "total_steps": 3665, "loss": 0.1893, "learning_rate": 4.504845212827848e-06, "epoch": 4.242837653478854, "percentage": 84.86, "elapsed_time": "0:35:05", "remaining_time": "0:06:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3120, "total_steps": 3665, "loss": 0.2459, "learning_rate": 4.348071747303322e-06, "epoch": 4.256480218281037, "percentage": 85.13, "elapsed_time": "0:35:14", "remaining_time": "0:06:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3130, "total_steps": 3665, "loss": 0.1615, "learning_rate": 4.193917864710599e-06, "epoch": 4.270122783083219, "percentage": 85.4, "elapsed_time": "0:35:20", "remaining_time": "0:06:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3140, "total_steps": 3665, "loss": 0.1488, "learning_rate": 4.042394891754846e-06, "epoch": 4.283765347885402, "percentage": 85.68, "elapsed_time": "0:35:27", "remaining_time": "0:05:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3150, "total_steps": 3665, "loss": 0.1507, "learning_rate": 3.893513961830886e-06, "epoch": 4.297407912687586, "percentage": 85.95, "elapsed_time": "0:35:33", "remaining_time": "0:05:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3160, "total_steps": 3665, "loss": 0.1768, "learning_rate": 3.74728601420518e-06, "epoch": 4.311050477489768, "percentage": 86.22, "elapsed_time": "0:35:40", "remaining_time": "0:05:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3170, "total_steps": 3665, "loss": 0.3008, "learning_rate": 3.6037217932120272e-06, "epoch": 4.324693042291951, "percentage": 86.49, "elapsed_time": "0:35:47", "remaining_time": "0:05:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3180, "total_steps": 3665, "loss": 0.1839, "learning_rate": 3.4628318474641344e-06, "epoch": 4.338335607094134, "percentage": 86.77, "elapsed_time": "0:35:54", "remaining_time": "0:05:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3190, "total_steps": 3665, "loss": 0.1681, "learning_rate": 3.3246265290775013e-06, "epoch": 4.351978171896317, "percentage": 87.04, "elapsed_time": "0:36:00", "remaining_time": "0:05:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3200, "total_steps": 3665, "loss": 0.2091, "learning_rate": 3.1891159929108074e-06, "epoch": 4.365620736698499, "percentage": 87.31, "elapsed_time": "0:36:07", "remaining_time": "0:05:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3210, "total_steps": 3665, "loss": 0.175, "learning_rate": 3.0563101958192677e-06, "epoch": 4.379263301500682, "percentage": 87.59, "elapsed_time": "0:36:14", "remaining_time": "0:05:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3220, "total_steps": 3665, "loss": 0.2715, "learning_rate": 2.9262188959230297e-06, "epoch": 4.392905866302865, "percentage": 87.86, "elapsed_time": "0:36:21", "remaining_time": "0:05:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3230, "total_steps": 3665, "loss": 0.205, "learning_rate": 2.7988516518901643e-06, "epoch": 4.406548431105048, "percentage": 88.13, "elapsed_time": "0:36:28", "remaining_time": "0:04:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3240, "total_steps": 3665, "loss": 0.1804, "learning_rate": 2.674217822234382e-06, "epoch": 4.42019099590723, "percentage": 88.4, "elapsed_time": "0:36:35", "remaining_time": "0:04:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3250, "total_steps": 3665, "loss": 0.2301, "learning_rate": 2.5523265646273252e-06, "epoch": 4.433833560709413, "percentage": 88.68, "elapsed_time": "0:36:42", "remaining_time": "0:04:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3260, "total_steps": 3665, "loss": 0.2665, "learning_rate": 2.433186835225745e-06, "epoch": 4.447476125511596, "percentage": 88.95, "elapsed_time": "0:36:49", "remaining_time": "0:04:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3270, "total_steps": 3665, "loss": 0.1443, "learning_rate": 2.316807388013431e-06, "epoch": 4.461118690313779, "percentage": 89.22, "elapsed_time": "0:36:55", "remaining_time": "0:04:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3280, "total_steps": 3665, "loss": 0.2292, "learning_rate": 2.203196774157972e-06, "epoch": 4.474761255115962, "percentage": 89.5, "elapsed_time": "0:37:03", "remaining_time": "0:04:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3290, "total_steps": 3665, "loss": 0.1765, "learning_rate": 2.0923633413824663e-06, "epoch": 4.488403819918145, "percentage": 89.77, "elapsed_time": "0:37:09", "remaining_time": "0:04:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3300, "total_steps": 3665, "loss": 0.1966, "learning_rate": 1.98431523335215e-06, "epoch": 4.502046384720328, "percentage": 90.04, "elapsed_time": "0:37:16", "remaining_time": "0:04:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3310, "total_steps": 3665, "loss": 0.2525, "learning_rate": 1.8790603890760328e-06, "epoch": 4.51568894952251, "percentage": 90.31, "elapsed_time": "0:37:23", "remaining_time": "0:04:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3320, "total_steps": 3665, "loss": 0.1502, "learning_rate": 1.7766065423235624e-06, "epoch": 4.529331514324693, "percentage": 90.59, "elapsed_time": "0:37:30", "remaining_time": "0:03:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3330, "total_steps": 3665, "loss": 0.2251, "learning_rate": 1.6769612210563834e-06, "epoch": 4.542974079126876, "percentage": 90.86, "elapsed_time": "0:37:37", "remaining_time": "0:03:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3340, "total_steps": 3665, "loss": 0.1724, "learning_rate": 1.5801317468751954e-06, "epoch": 4.5566166439290585, "percentage": 91.13, "elapsed_time": "0:37:44", "remaining_time": "0:03:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3350, "total_steps": 3665, "loss": 0.1416, "learning_rate": 1.4861252344817812e-06, "epoch": 4.570259208731241, "percentage": 91.41, "elapsed_time": "0:37:50", "remaining_time": "0:03:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3360, "total_steps": 3665, "loss": 0.1507, "learning_rate": 1.3949485911562799e-06, "epoch": 4.583901773533424, "percentage": 91.68, "elapsed_time": "0:37:57", "remaining_time": "0:03:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3370, "total_steps": 3665, "loss": 0.1486, "learning_rate": 1.3066085162496057e-06, "epoch": 4.597544338335607, "percentage": 91.95, "elapsed_time": "0:38:03", "remaining_time": "0:03:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3380, "total_steps": 3665, "loss": 0.1823, "learning_rate": 1.2211115006912499e-06, "epoch": 4.61118690313779, "percentage": 92.22, "elapsed_time": "0:38:11", "remaining_time": "0:03:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3390, "total_steps": 3665, "loss": 0.1146, "learning_rate": 1.1384638265123305e-06, "epoch": 4.624829467939973, "percentage": 92.5, "elapsed_time": "0:38:17", "remaining_time": "0:03:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3400, "total_steps": 3665, "loss": 0.2206, "learning_rate": 1.0586715663840175e-06, "epoch": 4.638472032742156, "percentage": 92.77, "elapsed_time": "0:38:24", "remaining_time": "0:02:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3410, "total_steps": 3665, "loss": 0.137, "learning_rate": 9.817405831713135e-07, "epoch": 4.6521145975443385, "percentage": 93.04, "elapsed_time": "0:38:30", "remaining_time": "0:02:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3420, "total_steps": 3665, "loss": 0.1969, "learning_rate": 9.076765295022949e-07, "epoch": 4.665757162346521, "percentage": 93.32, "elapsed_time": "0:38:37", "remaining_time": "0:02:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3430, "total_steps": 3665, "loss": 0.1712, "learning_rate": 8.364848473527698e-07, "epoch": 4.679399727148704, "percentage": 93.59, "elapsed_time": "0:38:44", "remaining_time": "0:02:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3440, "total_steps": 3665, "loss": 0.1606, "learning_rate": 7.748725387928791e-07, "epoch": 4.693042291950887, "percentage": 93.86, "elapsed_time": "0:38:50", "remaining_time": "0:02:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3450, "total_steps": 3665, "loss": 0.1722, "learning_rate": 7.09152598980536e-07, "epoch": 4.7066848567530695, "percentage": 94.13, "elapsed_time": "0:38:57", "remaining_time": "0:02:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3460, "total_steps": 3665, "loss": 0.2592, "learning_rate": 6.463196175536768e-07, "epoch": 4.720327421555252, "percentage": 94.41, "elapsed_time": "0:39:04", "remaining_time": "0:02:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3470, "total_steps": 3665, "loss": 0.2729, "learning_rate": 5.863782112669647e-07, "epoch": 4.733969986357435, "percentage": 94.68, "elapsed_time": "0:39:11", "remaining_time": "0:02:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3480, "total_steps": 3665, "loss": 0.1888, "learning_rate": 5.293327844118956e-07, "epoch": 4.747612551159618, "percentage": 94.95, "elapsed_time": "0:39:18", "remaining_time": "0:02:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3490, "total_steps": 3665, "loss": 0.1367, "learning_rate": 4.751875284932217e-07, "epoch": 4.7612551159618, "percentage": 95.23, "elapsed_time": "0:39:24", "remaining_time": "0:01:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3500, "total_steps": 3665, "loss": 0.2003, "learning_rate": 4.2394642192095327e-07, "epoch": 4.774897680763983, "percentage": 95.5, "elapsed_time": "0:39:31", "remaining_time": "0:01:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3510, "total_steps": 3665, "loss": 0.1503, "learning_rate": 3.7561322971803706e-07, "epoch": 4.788540245566167, "percentage": 95.77, "elapsed_time": "0:39:38", "remaining_time": "0:01:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3520, "total_steps": 3665, "loss": 0.1425, "learning_rate": 3.301915032437375e-07, "epoch": 4.8021828103683495, "percentage": 96.04, "elapsed_time": "0:39:44", "remaining_time": "0:01:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3530, "total_steps": 3665, "loss": 0.1265, "learning_rate": 2.8768457993266775e-07, "epoch": 4.815825375170532, "percentage": 96.32, "elapsed_time": "0:39:51", "remaining_time": "0:01:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3540, "total_steps": 3665, "loss": 0.2103, "learning_rate": 2.480955830495679e-07, "epoch": 4.829467939972715, "percentage": 96.59, "elapsed_time": "0:39:57", "remaining_time": "0:01:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3550, "total_steps": 3665, "loss": 0.2395, "learning_rate": 2.1142742145984442e-07, "epoch": 4.843110504774898, "percentage": 96.86, "elapsed_time": "0:40:04", "remaining_time": "0:01:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3560, "total_steps": 3665, "loss": 0.1317, "learning_rate": 1.7768278941581617e-07, "epoch": 4.85675306957708, "percentage": 97.14, "elapsed_time": "0:40:10", "remaining_time": "0:01:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3570, "total_steps": 3665, "loss": 0.1802, "learning_rate": 1.4686416635874445e-07, "epoch": 4.870395634379263, "percentage": 97.41, "elapsed_time": "0:40:17", "remaining_time": "0:01:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3580, "total_steps": 3665, "loss": 0.2484, "learning_rate": 1.1897381673666719e-07, "epoch": 4.884038199181446, "percentage": 97.68, "elapsed_time": "0:40:24", "remaining_time": "0:00:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3590, "total_steps": 3665, "loss": 0.1346, "learning_rate": 9.40137898380078e-08, "epoch": 4.897680763983629, "percentage": 97.95, "elapsed_time": "0:40:30", "remaining_time": "0:00:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3600, "total_steps": 3665, "loss": 0.2097, "learning_rate": 7.198591964099777e-08, "epoch": 4.911323328785811, "percentage": 98.23, "elapsed_time": "0:40:37", "remaining_time": "0:00:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3610, "total_steps": 3665, "loss": 0.1865, "learning_rate": 5.289182467893561e-08, "epoch": 4.924965893587995, "percentage": 98.5, "elapsed_time": "0:40:43", "remaining_time": "0:00:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3620, "total_steps": 3665, "loss": 0.2137, "learning_rate": 3.6732907921241956e-08, "epoch": 4.938608458390178, "percentage": 98.77, "elapsed_time": "0:40:50", "remaining_time": "0:00:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3630, "total_steps": 3665, "loss": 0.1699, "learning_rate": 2.351035667038648e-08, "epoch": 4.95225102319236, "percentage": 99.05, "elapsed_time": "0:40:57", "remaining_time": "0:00:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3640, "total_steps": 3665, "loss": 0.247, "learning_rate": 1.3225142474651009e-08, "epoch": 4.965893587994543, "percentage": 99.32, "elapsed_time": "0:41:04", "remaining_time": "0:00:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3650, "total_steps": 3665, "loss": 0.1884, "learning_rate": 5.878021056742178e-09, "epoch": 4.979536152796726, "percentage": 99.59, "elapsed_time": "0:41:11", "remaining_time": "0:00:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3660, "total_steps": 3665, "loss": 0.186, "learning_rate": 1.4695322582491956e-09, "epoch": 4.993178717598909, "percentage": 99.86, "elapsed_time": "0:41:18", "remaining_time": "0:00:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3665, "total_steps": 3665, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:41:22", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}