Xinging's picture
Upload trainer_log.jsonl with huggingface_hub
c11b960 verified
raw
history blame
12.1 kB
{"current_steps": 1, "total_steps": 63, "loss": 1.0485, "lr": 2.8571428571428573e-06, "epoch": 0.047619047619047616, "percentage": 1.59, "elapsed_time": "0:00:14", "remaining_time": "0:14:46"}
{"current_steps": 2, "total_steps": 63, "loss": 1.0247, "lr": 5.7142857142857145e-06, "epoch": 0.09523809523809523, "percentage": 3.17, "elapsed_time": "0:00:28", "remaining_time": "0:14:16"}
{"current_steps": 3, "total_steps": 63, "loss": 1.0005, "lr": 8.571428571428571e-06, "epoch": 0.14285714285714285, "percentage": 4.76, "elapsed_time": "0:00:45", "remaining_time": "0:15:06"}
{"current_steps": 4, "total_steps": 63, "loss": 0.9607, "lr": 1.1428571428571429e-05, "epoch": 0.19047619047619047, "percentage": 6.35, "elapsed_time": "0:01:00", "remaining_time": "0:14:45"}
{"current_steps": 5, "total_steps": 63, "loss": 0.9474, "lr": 1.4285714285714287e-05, "epoch": 0.23809523809523808, "percentage": 7.94, "elapsed_time": "0:01:13", "remaining_time": "0:14:13"}
{"current_steps": 6, "total_steps": 63, "loss": 0.9091, "lr": 1.7142857142857142e-05, "epoch": 0.2857142857142857, "percentage": 9.52, "elapsed_time": "0:01:27", "remaining_time": "0:13:50"}
{"current_steps": 7, "total_steps": 63, "loss": 0.9359, "lr": 2e-05, "epoch": 0.3333333333333333, "percentage": 11.11, "elapsed_time": "0:01:42", "remaining_time": "0:13:39"}
{"current_steps": 8, "total_steps": 63, "loss": 0.9072, "lr": 1.998426815017817e-05, "epoch": 0.38095238095238093, "percentage": 12.7, "elapsed_time": "0:01:55", "remaining_time": "0:13:16"}
{"current_steps": 9, "total_steps": 63, "loss": 0.9051, "lr": 1.9937122098932428e-05, "epoch": 0.42857142857142855, "percentage": 14.29, "elapsed_time": "0:02:09", "remaining_time": "0:12:58"}
{"current_steps": 10, "total_steps": 63, "loss": 0.8882, "lr": 1.985871018518236e-05, "epoch": 0.47619047619047616, "percentage": 15.87, "elapsed_time": "0:02:25", "remaining_time": "0:12:51"}
{"current_steps": 11, "total_steps": 63, "loss": 0.894, "lr": 1.9749279121818235e-05, "epoch": 0.5238095238095238, "percentage": 17.46, "elapsed_time": "0:02:39", "remaining_time": "0:12:33"}
{"current_steps": 12, "total_steps": 63, "loss": 0.8808, "lr": 1.9609173219450998e-05, "epoch": 0.5714285714285714, "percentage": 19.05, "elapsed_time": "0:02:54", "remaining_time": "0:12:19"}
{"current_steps": 13, "total_steps": 63, "loss": 0.8738, "lr": 1.9438833303083677e-05, "epoch": 0.6190476190476191, "percentage": 20.63, "elapsed_time": "0:03:09", "remaining_time": "0:12:07"}
{"current_steps": 14, "total_steps": 63, "loss": 0.9113, "lr": 1.9238795325112867e-05, "epoch": 0.6666666666666666, "percentage": 22.22, "elapsed_time": "0:03:23", "remaining_time": "0:11:51"}
{"current_steps": 15, "total_steps": 63, "loss": 0.8581, "lr": 1.900968867902419e-05, "epoch": 0.7142857142857143, "percentage": 23.81, "elapsed_time": "0:03:37", "remaining_time": "0:11:34"}
{"current_steps": 16, "total_steps": 63, "loss": 0.8969, "lr": 1.8752234219087538e-05, "epoch": 0.7619047619047619, "percentage": 25.4, "elapsed_time": "0:03:51", "remaining_time": "0:11:21"}
{"current_steps": 17, "total_steps": 63, "loss": 0.906, "lr": 1.8467241992282842e-05, "epoch": 0.8095238095238095, "percentage": 26.98, "elapsed_time": "0:04:06", "remaining_time": "0:11:07"}
{"current_steps": 18, "total_steps": 63, "loss": 0.8859, "lr": 1.8155608689592604e-05, "epoch": 0.8571428571428571, "percentage": 28.57, "elapsed_time": "0:04:20", "remaining_time": "0:10:52"}
{"current_steps": 19, "total_steps": 63, "loss": 0.8931, "lr": 1.78183148246803e-05, "epoch": 0.9047619047619048, "percentage": 30.16, "elapsed_time": "0:04:36", "remaining_time": "0:10:40"}
{"current_steps": 20, "total_steps": 63, "loss": 0.8946, "lr": 1.7456421648831658e-05, "epoch": 0.9523809523809523, "percentage": 31.75, "elapsed_time": "0:04:50", "remaining_time": "0:10:24"}
{"current_steps": 21, "total_steps": 63, "loss": 0.8441, "lr": 1.7071067811865477e-05, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:05:04", "remaining_time": "0:10:09"}
{"current_steps": 22, "total_steps": 63, "loss": 0.6841, "lr": 1.6663465779520042e-05, "epoch": 1.0476190476190477, "percentage": 34.92, "elapsed_time": "0:05:18", "remaining_time": "0:09:53"}
{"current_steps": 23, "total_steps": 63, "loss": 0.6804, "lr": 1.6234898018587336e-05, "epoch": 1.0952380952380953, "percentage": 36.51, "elapsed_time": "0:05:33", "remaining_time": "0:09:40"}
{"current_steps": 24, "total_steps": 63, "loss": 0.6712, "lr": 1.578671296179806e-05, "epoch": 1.1428571428571428, "percentage": 38.1, "elapsed_time": "0:05:48", "remaining_time": "0:09:26"}
{"current_steps": 25, "total_steps": 63, "loss": 0.6592, "lr": 1.5320320765153367e-05, "epoch": 1.1904761904761905, "percentage": 39.68, "elapsed_time": "0:06:02", "remaining_time": "0:09:10"}
{"current_steps": 26, "total_steps": 63, "loss": 0.6547, "lr": 1.4837188871052399e-05, "epoch": 1.2380952380952381, "percentage": 41.27, "elapsed_time": "0:06:16", "remaining_time": "0:08:55"}
{"current_steps": 27, "total_steps": 63, "loss": 0.6555, "lr": 1.4338837391175582e-05, "epoch": 1.2857142857142856, "percentage": 42.86, "elapsed_time": "0:06:30", "remaining_time": "0:08:40"}
{"current_steps": 28, "total_steps": 63, "loss": 0.6326, "lr": 1.3826834323650899e-05, "epoch": 1.3333333333333333, "percentage": 44.44, "elapsed_time": "0:06:46", "remaining_time": "0:08:28"}
{"current_steps": 29, "total_steps": 63, "loss": 0.6659, "lr": 1.3302790619551673e-05, "epoch": 1.380952380952381, "percentage": 46.03, "elapsed_time": "0:07:01", "remaining_time": "0:08:13"}
{"current_steps": 30, "total_steps": 63, "loss": 0.6172, "lr": 1.2768355114248493e-05, "epoch": 1.4285714285714286, "percentage": 47.62, "elapsed_time": "0:07:16", "remaining_time": "0:08:00"}
{"current_steps": 31, "total_steps": 63, "loss": 0.6394, "lr": 1.2225209339563144e-05, "epoch": 1.4761904761904763, "percentage": 49.21, "elapsed_time": "0:07:30", "remaining_time": "0:07:44"}
{"current_steps": 32, "total_steps": 63, "loss": 0.6278, "lr": 1.1675062233047365e-05, "epoch": 1.5238095238095237, "percentage": 50.79, "elapsed_time": "0:07:44", "remaining_time": "0:07:29"}
{"current_steps": 33, "total_steps": 63, "loss": 0.6447, "lr": 1.1119644761033079e-05, "epoch": 1.5714285714285714, "percentage": 52.38, "elapsed_time": "0:07:58", "remaining_time": "0:07:15"}
{"current_steps": 34, "total_steps": 63, "loss": 0.6293, "lr": 1.0560704472371919e-05, "epoch": 1.619047619047619, "percentage": 53.97, "elapsed_time": "0:08:13", "remaining_time": "0:07:00"}
{"current_steps": 35, "total_steps": 63, "loss": 0.6135, "lr": 1e-05, "epoch": 1.6666666666666665, "percentage": 55.56, "elapsed_time": "0:08:28", "remaining_time": "0:06:46"}
{"current_steps": 36, "total_steps": 63, "loss": 0.5951, "lr": 9.439295527628083e-06, "epoch": 1.7142857142857144, "percentage": 57.14, "elapsed_time": "0:08:46", "remaining_time": "0:06:34"}
{"current_steps": 37, "total_steps": 63, "loss": 0.6291, "lr": 8.880355238966923e-06, "epoch": 1.7619047619047619, "percentage": 58.73, "elapsed_time": "0:09:01", "remaining_time": "0:06:20"}
{"current_steps": 38, "total_steps": 63, "loss": 0.6515, "lr": 8.324937766952638e-06, "epoch": 1.8095238095238095, "percentage": 60.32, "elapsed_time": "0:09:15", "remaining_time": "0:06:05"}
{"current_steps": 39, "total_steps": 63, "loss": 0.6229, "lr": 7.774790660436857e-06, "epoch": 1.8571428571428572, "percentage": 61.9, "elapsed_time": "0:09:30", "remaining_time": "0:05:51"}
{"current_steps": 40, "total_steps": 63, "loss": 0.634, "lr": 7.2316448857515076e-06, "epoch": 1.9047619047619047, "percentage": 63.49, "elapsed_time": "0:09:44", "remaining_time": "0:05:36"}
{"current_steps": 41, "total_steps": 63, "loss": 0.6351, "lr": 6.697209380448333e-06, "epoch": 1.9523809523809523, "percentage": 65.08, "elapsed_time": "0:09:59", "remaining_time": "0:05:21"}
{"current_steps": 42, "total_steps": 63, "loss": 0.5002, "lr": 6.173165676349103e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:10:12", "remaining_time": "0:05:06"}
{"current_steps": 43, "total_steps": 63, "loss": 0.4895, "lr": 5.66116260882442e-06, "epoch": 2.0476190476190474, "percentage": 68.25, "elapsed_time": "0:10:28", "remaining_time": "0:04:52"}
{"current_steps": 44, "total_steps": 63, "loss": 0.4941, "lr": 5.1628111289476025e-06, "epoch": 2.0952380952380953, "percentage": 69.84, "elapsed_time": "0:10:42", "remaining_time": "0:04:37"}
{"current_steps": 45, "total_steps": 63, "loss": 0.4848, "lr": 4.679679234846636e-06, "epoch": 2.142857142857143, "percentage": 71.43, "elapsed_time": "0:10:58", "remaining_time": "0:04:23"}
{"current_steps": 46, "total_steps": 63, "loss": 0.4795, "lr": 4.213287038201943e-06, "epoch": 2.1904761904761907, "percentage": 73.02, "elapsed_time": "0:11:12", "remaining_time": "0:04:08"}
{"current_steps": 47, "total_steps": 63, "loss": 0.4889, "lr": 3.7651019814126656e-06, "epoch": 2.238095238095238, "percentage": 74.6, "elapsed_time": "0:11:26", "remaining_time": "0:03:53"}
{"current_steps": 48, "total_steps": 63, "loss": 0.4689, "lr": 3.3365342204799613e-06, "epoch": 2.2857142857142856, "percentage": 76.19, "elapsed_time": "0:11:40", "remaining_time": "0:03:39"}
{"current_steps": 49, "total_steps": 63, "loss": 0.4845, "lr": 2.9289321881345257e-06, "epoch": 2.3333333333333335, "percentage": 77.78, "elapsed_time": "0:11:55", "remaining_time": "0:03:24"}
{"current_steps": 50, "total_steps": 63, "loss": 0.4718, "lr": 2.5435783511683444e-06, "epoch": 2.380952380952381, "percentage": 79.37, "elapsed_time": "0:12:10", "remaining_time": "0:03:09"}
{"current_steps": 51, "total_steps": 63, "loss": 0.4781, "lr": 2.1816851753197023e-06, "epoch": 2.4285714285714284, "percentage": 80.95, "elapsed_time": "0:12:28", "remaining_time": "0:02:56"}
{"current_steps": 52, "total_steps": 63, "loss": 0.459, "lr": 1.8443913104073984e-06, "epoch": 2.4761904761904763, "percentage": 82.54, "elapsed_time": "0:12:42", "remaining_time": "0:02:41"}
{"current_steps": 53, "total_steps": 63, "loss": 0.4772, "lr": 1.5327580077171589e-06, "epoch": 2.5238095238095237, "percentage": 84.13, "elapsed_time": "0:12:55", "remaining_time": "0:02:26"}
{"current_steps": 54, "total_steps": 63, "loss": 0.4674, "lr": 1.2477657809124632e-06, "epoch": 2.571428571428571, "percentage": 85.71, "elapsed_time": "0:13:09", "remaining_time": "0:02:11"}
{"current_steps": 55, "total_steps": 63, "loss": 0.4697, "lr": 9.903113209758098e-07, "epoch": 2.619047619047619, "percentage": 87.3, "elapsed_time": "0:13:25", "remaining_time": "0:01:57"}
{"current_steps": 56, "total_steps": 63, "loss": 0.4661, "lr": 7.612046748871327e-07, "epoch": 2.6666666666666665, "percentage": 88.89, "elapsed_time": "0:13:39", "remaining_time": "0:01:42"}
{"current_steps": 57, "total_steps": 63, "loss": 0.4517, "lr": 5.611666969163243e-07, "epoch": 2.7142857142857144, "percentage": 90.48, "elapsed_time": "0:13:55", "remaining_time": "0:01:27"}
{"current_steps": 58, "total_steps": 63, "loss": 0.4688, "lr": 3.908267805490051e-07, "epoch": 2.761904761904762, "percentage": 92.06, "elapsed_time": "0:14:09", "remaining_time": "0:01:13"}
{"current_steps": 59, "total_steps": 63, "loss": 0.4674, "lr": 2.507208781817638e-07, "epoch": 2.8095238095238093, "percentage": 93.65, "elapsed_time": "0:14:22", "remaining_time": "0:00:58"}
{"current_steps": 60, "total_steps": 63, "loss": 0.4591, "lr": 1.4128981481764115e-07, "epoch": 2.857142857142857, "percentage": 95.24, "elapsed_time": "0:14:36", "remaining_time": "0:00:43"}
{"current_steps": 61, "total_steps": 63, "loss": 0.4704, "lr": 6.287790106757396e-08, "epoch": 2.9047619047619047, "percentage": 96.83, "elapsed_time": "0:14:50", "remaining_time": "0:00:29"}
{"current_steps": 62, "total_steps": 63, "loss": 0.4716, "lr": 1.5731849821833955e-08, "epoch": 2.9523809523809526, "percentage": 98.41, "elapsed_time": "0:15:05", "remaining_time": "0:00:14"}
{"current_steps": 63, "total_steps": 63, "loss": 0.4279, "lr": 0.0, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:15:19", "remaining_time": "0:00:00"}
{"current_steps": 63, "total_steps": 63, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:16:22", "remaining_time": "0:00:00"}