Safetensors
qwen2
reasoning
ptrdvn's picture
Upload folder using huggingface_hub
baec9b6 verified
raw
history blame
22.5 kB
{"current_steps": 1, "total_steps": 108, "loss": 0.5807, "lr": 5e-06, "epoch": 0.009259259259259259, "percentage": 0.93, "elapsed_time": "0:00:13", "remaining_time": "0:24:55"}
{"current_steps": 2, "total_steps": 108, "loss": 0.534, "lr": 1e-05, "epoch": 0.018518518518518517, "percentage": 1.85, "elapsed_time": "0:00:24", "remaining_time": "0:21:27"}
{"current_steps": 3, "total_steps": 108, "loss": 0.6069, "lr": 9.997804182543973e-06, "epoch": 0.027777777777777776, "percentage": 2.78, "elapsed_time": "0:00:34", "remaining_time": "0:20:09"}
{"current_steps": 4, "total_steps": 108, "loss": 0.5863, "lr": 9.991218658821609e-06, "epoch": 0.037037037037037035, "percentage": 3.7, "elapsed_time": "0:00:44", "remaining_time": "0:19:22"}
{"current_steps": 5, "total_steps": 108, "loss": 0.5952, "lr": 9.980249213076085e-06, "epoch": 0.046296296296296294, "percentage": 4.63, "elapsed_time": "0:00:54", "remaining_time": "0:18:50"}
{"current_steps": 6, "total_steps": 108, "loss": 0.5384, "lr": 9.964905480067585e-06, "epoch": 0.05555555555555555, "percentage": 5.56, "elapsed_time": "0:01:05", "remaining_time": "0:18:27"}
{"current_steps": 7, "total_steps": 108, "loss": 0.5779, "lr": 9.945200936610821e-06, "epoch": 0.06481481481481481, "percentage": 6.48, "elapsed_time": "0:01:15", "remaining_time": "0:18:07"}
{"current_steps": 8, "total_steps": 108, "loss": 0.5487, "lr": 9.921152889737985e-06, "epoch": 0.07407407407407407, "percentage": 7.41, "elapsed_time": "0:01:25", "remaining_time": "0:17:49"}
{"current_steps": 9, "total_steps": 108, "loss": 0.5162, "lr": 9.892782461497521e-06, "epoch": 0.08333333333333333, "percentage": 8.33, "elapsed_time": "0:01:35", "remaining_time": "0:17:33"}
{"current_steps": 10, "total_steps": 108, "loss": 0.4825, "lr": 9.860114570402055e-06, "epoch": 0.09259259259259259, "percentage": 9.26, "elapsed_time": "0:01:45", "remaining_time": "0:17:18"}
{"current_steps": 11, "total_steps": 108, "loss": 0.4962, "lr": 9.823177909541795e-06, "epoch": 0.10185185185185185, "percentage": 10.19, "elapsed_time": "0:01:56", "remaining_time": "0:17:04"}
{"current_steps": 11, "total_steps": 108, "eval_loss": 0.5000379085540771, "epoch": 0.10185185185185185, "percentage": 10.19, "elapsed_time": "0:02:03", "remaining_time": "0:18:08"}
{"current_steps": 12, "total_steps": 108, "loss": 0.4456, "lr": 9.782004921382612e-06, "epoch": 0.1111111111111111, "percentage": 11.11, "elapsed_time": "0:02:13", "remaining_time": "0:17:47"}
{"current_steps": 13, "total_steps": 108, "loss": 0.4288, "lr": 9.736631769270958e-06, "epoch": 0.12037037037037036, "percentage": 12.04, "elapsed_time": "0:02:23", "remaining_time": "0:17:29"}
{"current_steps": 14, "total_steps": 108, "loss": 0.5855, "lr": 9.687098305670606e-06, "epoch": 0.12962962962962962, "percentage": 12.96, "elapsed_time": "0:02:33", "remaining_time": "0:17:13"}
{"current_steps": 15, "total_steps": 108, "loss": 0.5184, "lr": 9.633448037159167e-06, "epoch": 0.1388888888888889, "percentage": 13.89, "elapsed_time": "0:02:44", "remaining_time": "0:16:57"}
{"current_steps": 16, "total_steps": 108, "loss": 0.5568, "lr": 9.575728086215093e-06, "epoch": 0.14814814814814814, "percentage": 14.81, "elapsed_time": "0:02:54", "remaining_time": "0:16:42"}
{"current_steps": 17, "total_steps": 108, "loss": 0.4272, "lr": 9.513989149828718e-06, "epoch": 0.1574074074074074, "percentage": 15.74, "elapsed_time": "0:03:04", "remaining_time": "0:16:28"}
{"current_steps": 18, "total_steps": 108, "loss": 0.487, "lr": 9.448285454973739e-06, "epoch": 0.16666666666666666, "percentage": 16.67, "elapsed_time": "0:03:14", "remaining_time": "0:16:14"}
{"current_steps": 19, "total_steps": 108, "loss": 0.5321, "lr": 9.378674710978185e-06, "epoch": 0.17592592592592593, "percentage": 17.59, "elapsed_time": "0:03:25", "remaining_time": "0:16:00"}
{"current_steps": 20, "total_steps": 108, "loss": 0.5396, "lr": 9.305218058836778e-06, "epoch": 0.18518518518518517, "percentage": 18.52, "elapsed_time": "0:03:35", "remaining_time": "0:15:47"}
{"current_steps": 21, "total_steps": 108, "loss": 0.446, "lr": 9.22798001750913e-06, "epoch": 0.19444444444444445, "percentage": 19.44, "elapsed_time": "0:03:45", "remaining_time": "0:15:34"}
{"current_steps": 22, "total_steps": 108, "loss": 0.5313, "lr": 9.14702842725101e-06, "epoch": 0.2037037037037037, "percentage": 20.37, "elapsed_time": "0:03:55", "remaining_time": "0:15:21"}
{"current_steps": 22, "total_steps": 108, "eval_loss": 0.4791085124015808, "epoch": 0.2037037037037037, "percentage": 20.37, "elapsed_time": "0:04:02", "remaining_time": "0:15:49"}
{"current_steps": 23, "total_steps": 108, "loss": 0.4983, "lr": 9.062434390028407e-06, "epoch": 0.21296296296296297, "percentage": 21.3, "elapsed_time": "0:04:13", "remaining_time": "0:15:36"}
{"current_steps": 24, "total_steps": 108, "loss": 0.4642, "lr": 8.974272207066767e-06, "epoch": 0.2222222222222222, "percentage": 22.22, "elapsed_time": "0:04:23", "remaining_time": "0:15:23"}
{"current_steps": 25, "total_steps": 108, "loss": 0.4832, "lr": 8.882619313590212e-06, "epoch": 0.23148148148148148, "percentage": 23.15, "elapsed_time": "0:04:34", "remaining_time": "0:15:10"}
{"current_steps": 26, "total_steps": 108, "loss": 0.441, "lr": 8.787556210808101e-06, "epoch": 0.24074074074074073, "percentage": 24.07, "elapsed_time": "0:04:44", "remaining_time": "0:14:56"}
{"current_steps": 27, "total_steps": 108, "loss": 0.4489, "lr": 8.689166395208638e-06, "epoch": 0.25, "percentage": 25.0, "elapsed_time": "0:04:54", "remaining_time": "0:14:43"}
{"current_steps": 28, "total_steps": 108, "loss": 0.4971, "lr": 8.587536285221656e-06, "epoch": 0.25925925925925924, "percentage": 25.93, "elapsed_time": "0:05:04", "remaining_time": "0:14:31"}
{"current_steps": 29, "total_steps": 108, "loss": 0.5289, "lr": 8.482755145314987e-06, "epoch": 0.26851851851851855, "percentage": 26.85, "elapsed_time": "0:05:15", "remaining_time": "0:14:18"}
{"current_steps": 30, "total_steps": 108, "loss": 0.5496, "lr": 8.374915007591053e-06, "epoch": 0.2777777777777778, "percentage": 27.78, "elapsed_time": "0:05:25", "remaining_time": "0:14:06"}
{"current_steps": 31, "total_steps": 108, "loss": 0.5261, "lr": 8.264110590952609e-06, "epoch": 0.28703703703703703, "percentage": 28.7, "elapsed_time": "0:05:35", "remaining_time": "0:13:53"}
{"current_steps": 32, "total_steps": 108, "loss": 0.4814, "lr": 8.150439217908557e-06, "epoch": 0.2962962962962963, "percentage": 29.63, "elapsed_time": "0:05:45", "remaining_time": "0:13:41"}
{"current_steps": 33, "total_steps": 108, "loss": 0.4692, "lr": 8.034000729092967e-06, "epoch": 0.3055555555555556, "percentage": 30.56, "elapsed_time": "0:05:56", "remaining_time": "0:13:29"}
{"current_steps": 33, "total_steps": 108, "eval_loss": 0.46850860118865967, "epoch": 0.3055555555555556, "percentage": 30.56, "elapsed_time": "0:06:03", "remaining_time": "0:13:45"}
{"current_steps": 34, "total_steps": 108, "loss": 0.4372, "lr": 7.914897395572362e-06, "epoch": 0.3148148148148148, "percentage": 31.48, "elapsed_time": "0:06:13", "remaining_time": "0:13:33"}
{"current_steps": 35, "total_steps": 108, "loss": 0.5235, "lr": 7.793233829018263e-06, "epoch": 0.32407407407407407, "percentage": 32.41, "elapsed_time": "0:06:23", "remaining_time": "0:13:20"}
{"current_steps": 36, "total_steps": 108, "loss": 0.4339, "lr": 7.669116889823955e-06, "epoch": 0.3333333333333333, "percentage": 33.33, "elapsed_time": "0:06:34", "remaining_time": "0:13:08"}
{"current_steps": 37, "total_steps": 108, "loss": 0.4426, "lr": 7.542655593246103e-06, "epoch": 0.3425925925925926, "percentage": 34.26, "elapsed_time": "0:06:44", "remaining_time": "0:12:55"}
{"current_steps": 38, "total_steps": 108, "loss": 0.5744, "lr": 7.413961013653725e-06, "epoch": 0.35185185185185186, "percentage": 35.19, "elapsed_time": "0:06:54", "remaining_time": "0:12:43"}
{"current_steps": 39, "total_steps": 108, "loss": 0.3849, "lr": 7.283146186968566e-06, "epoch": 0.3611111111111111, "percentage": 36.11, "elapsed_time": "0:07:04", "remaining_time": "0:12:31"}
{"current_steps": 40, "total_steps": 108, "loss": 0.4057, "lr": 7.1503260113826035e-06, "epoch": 0.37037037037037035, "percentage": 37.04, "elapsed_time": "0:07:15", "remaining_time": "0:12:19"}
{"current_steps": 41, "total_steps": 108, "loss": 0.4149, "lr": 7.015617146439863e-06, "epoch": 0.37962962962962965, "percentage": 37.96, "elapsed_time": "0:07:25", "remaining_time": "0:12:07"}
{"current_steps": 42, "total_steps": 108, "loss": 0.4557, "lr": 6.879137910571191e-06, "epoch": 0.3888888888888889, "percentage": 38.89, "elapsed_time": "0:07:35", "remaining_time": "0:11:55"}
{"current_steps": 43, "total_steps": 108, "loss": 0.5052, "lr": 6.741008177171995e-06, "epoch": 0.39814814814814814, "percentage": 39.81, "elapsed_time": "0:07:45", "remaining_time": "0:11:43"}
{"current_steps": 44, "total_steps": 108, "loss": 0.3876, "lr": 6.601349269314188e-06, "epoch": 0.4074074074074074, "percentage": 40.74, "elapsed_time": "0:07:55", "remaining_time": "0:11:32"}
{"current_steps": 44, "total_steps": 108, "eval_loss": 0.4595443606376648, "epoch": 0.4074074074074074, "percentage": 40.74, "elapsed_time": "0:08:03", "remaining_time": "0:11:42"}
{"current_steps": 45, "total_steps": 108, "loss": 0.4381, "lr": 6.46028385318488e-06, "epoch": 0.4166666666666667, "percentage": 41.67, "elapsed_time": "0:08:13", "remaining_time": "0:11:30"}
{"current_steps": 46, "total_steps": 108, "loss": 0.433, "lr": 6.3179358303453386e-06, "epoch": 0.42592592592592593, "percentage": 42.59, "elapsed_time": "0:08:23", "remaining_time": "0:11:18"}
{"current_steps": 47, "total_steps": 108, "loss": 0.4699, "lr": 6.17443022890492e-06, "epoch": 0.4351851851851852, "percentage": 43.52, "elapsed_time": "0:08:33", "remaining_time": "0:11:06"}
{"current_steps": 48, "total_steps": 108, "loss": 0.4584, "lr": 6.029893093705492e-06, "epoch": 0.4444444444444444, "percentage": 44.44, "elapsed_time": "0:08:43", "remaining_time": "0:10:54"}
{"current_steps": 49, "total_steps": 108, "loss": 0.5243, "lr": 5.884451375612865e-06, "epoch": 0.4537037037037037, "percentage": 45.37, "elapsed_time": "0:08:54", "remaining_time": "0:10:43"}
{"current_steps": 50, "total_steps": 108, "loss": 0.4329, "lr": 5.738232820012407e-06, "epoch": 0.46296296296296297, "percentage": 46.3, "elapsed_time": "0:09:04", "remaining_time": "0:10:31"}
{"current_steps": 51, "total_steps": 108, "loss": 0.5633, "lr": 5.591365854606829e-06, "epoch": 0.4722222222222222, "percentage": 47.22, "elapsed_time": "0:09:14", "remaining_time": "0:10:19"}
{"current_steps": 52, "total_steps": 108, "loss": 0.445, "lr": 5.443979476614674e-06, "epoch": 0.48148148148148145, "percentage": 48.15, "elapsed_time": "0:09:24", "remaining_time": "0:10:08"}
{"current_steps": 53, "total_steps": 108, "loss": 0.3809, "lr": 5.296203139468572e-06, "epoch": 0.49074074074074076, "percentage": 49.07, "elapsed_time": "0:09:35", "remaining_time": "0:09:56"}
{"current_steps": 54, "total_steps": 108, "loss": 0.3964, "lr": 5.148166639112799e-06, "epoch": 0.5, "percentage": 50.0, "elapsed_time": "0:09:45", "remaining_time": "0:09:45"}
{"current_steps": 55, "total_steps": 108, "loss": 0.4768, "lr": 5e-06, "epoch": 0.5092592592592593, "percentage": 50.93, "elapsed_time": "0:09:55", "remaining_time": "0:09:33"}
{"current_steps": 55, "total_steps": 108, "eval_loss": 0.4542139768600464, "epoch": 0.5092592592592593, "percentage": 50.93, "elapsed_time": "0:10:02", "remaining_time": "0:09:40"}
{"current_steps": 56, "total_steps": 108, "loss": 0.4238, "lr": 4.8518333608872015e-06, "epoch": 0.5185185185185185, "percentage": 51.85, "elapsed_time": "0:10:13", "remaining_time": "0:09:29"}
{"current_steps": 57, "total_steps": 108, "loss": 0.5484, "lr": 4.703796860531429e-06, "epoch": 0.5277777777777778, "percentage": 52.78, "elapsed_time": "0:10:23", "remaining_time": "0:09:17"}
{"current_steps": 58, "total_steps": 108, "loss": 0.397, "lr": 4.556020523385326e-06, "epoch": 0.5370370370370371, "percentage": 53.7, "elapsed_time": "0:10:33", "remaining_time": "0:09:06"}
{"current_steps": 59, "total_steps": 108, "loss": 0.4452, "lr": 4.408634145393172e-06, "epoch": 0.5462962962962963, "percentage": 54.63, "elapsed_time": "0:10:44", "remaining_time": "0:08:54"}
{"current_steps": 60, "total_steps": 108, "loss": 0.4896, "lr": 4.261767179987595e-06, "epoch": 0.5555555555555556, "percentage": 55.56, "elapsed_time": "0:10:54", "remaining_time": "0:08:43"}
{"current_steps": 61, "total_steps": 108, "loss": 0.4887, "lr": 4.115548624387136e-06, "epoch": 0.5648148148148148, "percentage": 56.48, "elapsed_time": "0:11:04", "remaining_time": "0:08:31"}
{"current_steps": 62, "total_steps": 108, "loss": 0.4997, "lr": 3.970106906294509e-06, "epoch": 0.5740740740740741, "percentage": 57.41, "elapsed_time": "0:11:14", "remaining_time": "0:08:20"}
{"current_steps": 63, "total_steps": 108, "loss": 0.417, "lr": 3.825569771095082e-06, "epoch": 0.5833333333333334, "percentage": 58.33, "elapsed_time": "0:11:24", "remaining_time": "0:08:09"}
{"current_steps": 64, "total_steps": 108, "loss": 0.4504, "lr": 3.682064169654663e-06, "epoch": 0.5925925925925926, "percentage": 59.26, "elapsed_time": "0:11:35", "remaining_time": "0:07:57"}
{"current_steps": 65, "total_steps": 108, "loss": 0.4694, "lr": 3.539716146815122e-06, "epoch": 0.6018518518518519, "percentage": 60.19, "elapsed_time": "0:11:45", "remaining_time": "0:07:46"}
{"current_steps": 66, "total_steps": 108, "loss": 0.4985, "lr": 3.398650730685813e-06, "epoch": 0.6111111111111112, "percentage": 61.11, "elapsed_time": "0:11:55", "remaining_time": "0:07:35"}
{"current_steps": 66, "total_steps": 108, "eval_loss": 0.4495806097984314, "epoch": 0.6111111111111112, "percentage": 61.11, "elapsed_time": "0:12:02", "remaining_time": "0:07:40"}
{"current_steps": 67, "total_steps": 108, "loss": 0.4104, "lr": 3.258991822828007e-06, "epoch": 0.6203703703703703, "percentage": 62.04, "elapsed_time": "0:12:13", "remaining_time": "0:07:28"}
{"current_steps": 68, "total_steps": 108, "loss": 0.4926, "lr": 3.1208620894288105e-06, "epoch": 0.6296296296296297, "percentage": 62.96, "elapsed_time": "0:12:23", "remaining_time": "0:07:17"}
{"current_steps": 69, "total_steps": 108, "loss": 0.4655, "lr": 2.98438285356014e-06, "epoch": 0.6388888888888888, "percentage": 63.89, "elapsed_time": "0:12:34", "remaining_time": "0:07:06"}
{"current_steps": 70, "total_steps": 108, "loss": 0.4535, "lr": 2.8496739886173994e-06, "epoch": 0.6481481481481481, "percentage": 64.81, "elapsed_time": "0:12:44", "remaining_time": "0:06:54"}
{"current_steps": 71, "total_steps": 108, "loss": 0.5186, "lr": 2.716853813031435e-06, "epoch": 0.6574074074074074, "percentage": 65.74, "elapsed_time": "0:12:54", "remaining_time": "0:06:43"}
{"current_steps": 72, "total_steps": 108, "loss": 0.522, "lr": 2.5860389863462765e-06, "epoch": 0.6666666666666666, "percentage": 66.67, "elapsed_time": "0:13:04", "remaining_time": "0:06:32"}
{"current_steps": 73, "total_steps": 108, "loss": 0.4245, "lr": 2.457344406753899e-06, "epoch": 0.6759259259259259, "percentage": 67.59, "elapsed_time": "0:13:14", "remaining_time": "0:06:21"}
{"current_steps": 74, "total_steps": 108, "loss": 0.4806, "lr": 2.330883110176049e-06, "epoch": 0.6851851851851852, "percentage": 68.52, "elapsed_time": "0:13:25", "remaining_time": "0:06:09"}
{"current_steps": 75, "total_steps": 108, "loss": 0.5149, "lr": 2.2067661709817384e-06, "epoch": 0.6944444444444444, "percentage": 69.44, "elapsed_time": "0:13:35", "remaining_time": "0:05:58"}
{"current_steps": 76, "total_steps": 108, "loss": 0.4107, "lr": 2.0851026044276405e-06, "epoch": 0.7037037037037037, "percentage": 70.37, "elapsed_time": "0:13:45", "remaining_time": "0:05:47"}
{"current_steps": 77, "total_steps": 108, "loss": 0.4687, "lr": 1.9659992709070346e-06, "epoch": 0.7129629629629629, "percentage": 71.3, "elapsed_time": "0:13:55", "remaining_time": "0:05:36"}
{"current_steps": 77, "total_steps": 108, "eval_loss": 0.44653645157814026, "epoch": 0.7129629629629629, "percentage": 71.3, "elapsed_time": "0:14:03", "remaining_time": "0:05:39"}
{"current_steps": 78, "total_steps": 108, "loss": 0.4197, "lr": 1.8495607820914451e-06, "epoch": 0.7222222222222222, "percentage": 72.22, "elapsed_time": "0:14:13", "remaining_time": "0:05:28"}
{"current_steps": 79, "total_steps": 108, "loss": 0.3619, "lr": 1.7358894090473928e-06, "epoch": 0.7314814814814815, "percentage": 73.15, "elapsed_time": "0:14:23", "remaining_time": "0:05:17"}
{"current_steps": 80, "total_steps": 108, "loss": 0.3587, "lr": 1.6250849924089485e-06, "epoch": 0.7407407407407407, "percentage": 74.07, "elapsed_time": "0:14:34", "remaining_time": "0:05:05"}
{"current_steps": 81, "total_steps": 108, "loss": 0.3391, "lr": 1.5172448546850166e-06, "epoch": 0.75, "percentage": 75.0, "elapsed_time": "0:14:44", "remaining_time": "0:04:54"}
{"current_steps": 82, "total_steps": 108, "loss": 0.5386, "lr": 1.4124637147783431e-06, "epoch": 0.7592592592592593, "percentage": 75.93, "elapsed_time": "0:14:54", "remaining_time": "0:04:43"}
{"current_steps": 83, "total_steps": 108, "loss": 0.4069, "lr": 1.3108336047913633e-06, "epoch": 0.7685185185185185, "percentage": 76.85, "elapsed_time": "0:15:04", "remaining_time": "0:04:32"}
{"current_steps": 84, "total_steps": 108, "loss": 0.4371, "lr": 1.2124437891918995e-06, "epoch": 0.7777777777777778, "percentage": 77.78, "elapsed_time": "0:15:15", "remaining_time": "0:04:21"}
{"current_steps": 85, "total_steps": 108, "loss": 0.4374, "lr": 1.1173806864097885e-06, "epoch": 0.7870370370370371, "percentage": 78.7, "elapsed_time": "0:15:25", "remaining_time": "0:04:10"}
{"current_steps": 86, "total_steps": 108, "loss": 0.3986, "lr": 1.0257277929332332e-06, "epoch": 0.7962962962962963, "percentage": 79.63, "elapsed_time": "0:15:35", "remaining_time": "0:03:59"}
{"current_steps": 87, "total_steps": 108, "loss": 0.4473, "lr": 9.375656099715935e-07, "epoch": 0.8055555555555556, "percentage": 80.56, "elapsed_time": "0:15:45", "remaining_time": "0:03:48"}
{"current_steps": 88, "total_steps": 108, "loss": 0.4484, "lr": 8.529715727489912e-07, "epoch": 0.8148148148148148, "percentage": 81.48, "elapsed_time": "0:15:56", "remaining_time": "0:03:37"}
{"current_steps": 88, "total_steps": 108, "eval_loss": 0.4449349045753479, "epoch": 0.8148148148148148, "percentage": 81.48, "elapsed_time": "0:16:03", "remaining_time": "0:03:38"}
{"current_steps": 89, "total_steps": 108, "loss": 0.3425, "lr": 7.720199824908692e-07, "epoch": 0.8240740740740741, "percentage": 82.41, "elapsed_time": "0:16:13", "remaining_time": "0:03:27"}
{"current_steps": 90, "total_steps": 108, "loss": 0.4269, "lr": 6.947819411632223e-07, "epoch": 0.8333333333333334, "percentage": 83.33, "elapsed_time": "0:16:24", "remaining_time": "0:03:16"}
{"current_steps": 91, "total_steps": 108, "loss": 0.5674, "lr": 6.213252890218163e-07, "epoch": 0.8425925925925926, "percentage": 84.26, "elapsed_time": "0:16:34", "remaining_time": "0:03:05"}
{"current_steps": 92, "total_steps": 108, "loss": 0.454, "lr": 5.517145450262639e-07, "epoch": 0.8518518518518519, "percentage": 85.19, "elapsed_time": "0:16:44", "remaining_time": "0:02:54"}
{"current_steps": 93, "total_steps": 108, "loss": 0.3412, "lr": 4.860108501712824e-07, "epoch": 0.8611111111111112, "percentage": 86.11, "elapsed_time": "0:16:54", "remaining_time": "0:02:43"}
{"current_steps": 94, "total_steps": 108, "loss": 0.4292, "lr": 4.242719137849077e-07, "epoch": 0.8703703703703703, "percentage": 87.04, "elapsed_time": "0:17:05", "remaining_time": "0:02:32"}
{"current_steps": 95, "total_steps": 108, "loss": 0.4765, "lr": 3.665519628408332e-07, "epoch": 0.8796296296296297, "percentage": 87.96, "elapsed_time": "0:17:15", "remaining_time": "0:02:21"}
{"current_steps": 96, "total_steps": 108, "loss": 0.428, "lr": 3.1290169432939556e-07, "epoch": 0.8888888888888888, "percentage": 88.89, "elapsed_time": "0:17:25", "remaining_time": "0:02:10"}
{"current_steps": 97, "total_steps": 108, "loss": 0.4488, "lr": 2.6336823072904305e-07, "epoch": 0.8981481481481481, "percentage": 89.81, "elapsed_time": "0:17:35", "remaining_time": "0:01:59"}
{"current_steps": 98, "total_steps": 108, "loss": 0.3881, "lr": 2.179950786173879e-07, "epoch": 0.9074074074074074, "percentage": 90.74, "elapsed_time": "0:17:46", "remaining_time": "0:01:48"}
{"current_steps": 99, "total_steps": 108, "loss": 0.4809, "lr": 1.7682209045820687e-07, "epoch": 0.9166666666666666, "percentage": 91.67, "elapsed_time": "0:17:56", "remaining_time": "0:01:37"}
{"current_steps": 99, "total_steps": 108, "eval_loss": 0.4441840946674347, "epoch": 0.9166666666666666, "percentage": 91.67, "elapsed_time": "0:18:03", "remaining_time": "0:01:38"}
{"current_steps": 100, "total_steps": 108, "loss": 0.4533, "lr": 1.3988542959794627e-07, "epoch": 0.9259259259259259, "percentage": 92.59, "elapsed_time": "0:18:13", "remaining_time": "0:01:27"}
{"current_steps": 101, "total_steps": 108, "loss": 0.5236, "lr": 1.0721753850247984e-07, "epoch": 0.9351851851851852, "percentage": 93.52, "elapsed_time": "0:18:24", "remaining_time": "0:01:16"}
{"current_steps": 102, "total_steps": 108, "loss": 0.3763, "lr": 7.884711026201586e-08, "epoch": 0.9444444444444444, "percentage": 94.44, "elapsed_time": "0:18:34", "remaining_time": "0:01:05"}
{"current_steps": 103, "total_steps": 108, "loss": 0.4101, "lr": 5.479906338917984e-08, "epoch": 0.9537037037037037, "percentage": 95.37, "elapsed_time": "0:18:44", "remaining_time": "0:00:54"}
{"current_steps": 104, "total_steps": 108, "loss": 0.4942, "lr": 3.5094519932415417e-08, "epoch": 0.9629629629629629, "percentage": 96.3, "elapsed_time": "0:18:54", "remaining_time": "0:00:43"}
{"current_steps": 105, "total_steps": 108, "loss": 0.4778, "lr": 1.975078692391552e-08, "epoch": 0.9722222222222222, "percentage": 97.22, "elapsed_time": "0:19:05", "remaining_time": "0:00:32"}
{"current_steps": 106, "total_steps": 108, "loss": 0.4537, "lr": 8.781341178393244e-09, "epoch": 0.9814814814814815, "percentage": 98.15, "elapsed_time": "0:19:15", "remaining_time": "0:00:21"}
{"current_steps": 107, "total_steps": 108, "loss": 0.4192, "lr": 2.19581745602826e-09, "epoch": 0.9907407407407407, "percentage": 99.07, "elapsed_time": "0:19:25", "remaining_time": "0:00:10"}
{"current_steps": 108, "total_steps": 108, "loss": 0.3589, "lr": 0.0, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:19:35", "remaining_time": "0:00:00"}
{"current_steps": 108, "total_steps": 108, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:20:48", "remaining_time": "0:00:00"}