Training in progress, step 5627
Browse files- model-00001-of-00002.safetensors +1 -1
- model-00002-of-00002.safetensors +1 -1
- trainer_log.jsonl +16 -0
model-00001-of-00002.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4988025760
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:197ae811361af25c27dab57f91035904a2ee4f10f71a7158793a51811700638a
|
3 |
size 4988025760
|
model-00002-of-00002.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 240691728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5834e9dd49ce6196c3245301a15f5132fe33538f9ceaae21317becd1bb2a3852
|
3 |
size 240691728
|
trainer_log.jsonl
CHANGED
@@ -5610,3 +5610,19 @@
|
|
5610 |
{"current_steps": 5610, "total_steps": 5627, "loss": 1.3166, "learning_rate": 9.193563297094088e-10, "epoch": 0.9969345595095295, "percentage": 99.7, "elapsed_time": "20:37:39", "remaining_time": "0:03:45"}
|
5611 |
{"current_steps": 5611, "total_steps": 5627, "loss": 1.3155, "learning_rate": 8.143786377190488e-10, "epoch": 0.9971122662046292, "percentage": 99.72, "elapsed_time": "20:37:52", "remaining_time": "0:03:31"}
|
5612 |
{"current_steps": 5612, "total_steps": 5627, "loss": 1.3398, "learning_rate": 7.157630627774303e-10, "epoch": 0.997289972899729, "percentage": 99.73, "elapsed_time": "20:38:05", "remaining_time": "0:03:18"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5610 |
{"current_steps": 5610, "total_steps": 5627, "loss": 1.3166, "learning_rate": 9.193563297094088e-10, "epoch": 0.9969345595095295, "percentage": 99.7, "elapsed_time": "20:37:39", "remaining_time": "0:03:45"}
|
5611 |
{"current_steps": 5611, "total_steps": 5627, "loss": 1.3155, "learning_rate": 8.143786377190488e-10, "epoch": 0.9971122662046292, "percentage": 99.72, "elapsed_time": "20:37:52", "remaining_time": "0:03:31"}
|
5612 |
{"current_steps": 5612, "total_steps": 5627, "loss": 1.3398, "learning_rate": 7.157630627774303e-10, "epoch": 0.997289972899729, "percentage": 99.73, "elapsed_time": "20:38:05", "remaining_time": "0:03:18"}
|
5613 |
+
{"current_steps": 5613, "total_steps": 5627, "loss": 1.2682, "learning_rate": 6.235096362550153e-10, "epoch": 0.9974676795948287, "percentage": 99.75, "elapsed_time": "20:38:18", "remaining_time": "0:03:05"}
|
5614 |
+
{"current_steps": 5614, "total_steps": 5627, "loss": 1.3134, "learning_rate": 5.376183874994389e-10, "epoch": 0.9976453862899285, "percentage": 99.77, "elapsed_time": "20:38:32", "remaining_time": "0:02:52"}
|
5615 |
+
{"current_steps": 5615, "total_steps": 5627, "loss": 1.3194, "learning_rate": 4.5808934383329007e-10, "epoch": 0.9978230929850282, "percentage": 99.79, "elapsed_time": "20:38:45", "remaining_time": "0:02:38"}
|
5616 |
+
{"current_steps": 5616, "total_steps": 5627, "loss": 1.301, "learning_rate": 3.8492253055855133e-10, "epoch": 0.998000799680128, "percentage": 99.8, "elapsed_time": "20:38:58", "remaining_time": "0:02:25"}
|
5617 |
+
{"current_steps": 5617, "total_steps": 5627, "loss": 1.2711, "learning_rate": 3.1811797094993824e-10, "epoch": 0.9981785063752276, "percentage": 99.82, "elapsed_time": "20:39:11", "remaining_time": "0:02:12"}
|
5618 |
+
{"current_steps": 5618, "total_steps": 5627, "loss": 1.2779, "learning_rate": 2.5767568625711946e-10, "epoch": 0.9983562130703274, "percentage": 99.84, "elapsed_time": "20:39:24", "remaining_time": "0:01:59"}
|
5619 |
+
{"current_steps": 5619, "total_steps": 5627, "loss": 1.2756, "learning_rate": 2.0359569570915781e-10, "epoch": 0.9985339197654272, "percentage": 99.86, "elapsed_time": "20:39:37", "remaining_time": "0:01:45"}
|
5620 |
+
{"current_steps": 5620, "total_steps": 5627, "loss": 1.2977, "learning_rate": 1.5587801651228973e-10, "epoch": 0.9987116264605269, "percentage": 99.88, "elapsed_time": "20:39:51", "remaining_time": "0:01:32"}
|
5621 |
+
{"current_steps": 5621, "total_steps": 5627, "loss": 1.2365, "learning_rate": 1.1452266384548439e-10, "epoch": 0.9988893331556267, "percentage": 99.89, "elapsed_time": "20:40:04", "remaining_time": "0:01:19"}
|
5622 |
+
{"current_steps": 5622, "total_steps": 5627, "loss": 1.3766, "learning_rate": 7.952965086044373e-11, "epoch": 0.9990670398507264, "percentage": 99.91, "elapsed_time": "20:40:17", "remaining_time": "0:01:06"}
|
5623 |
+
{"current_steps": 5623, "total_steps": 5627, "loss": 1.3173, "learning_rate": 5.089898869492516e-11, "epoch": 0.9992447465458261, "percentage": 99.93, "elapsed_time": "20:40:30", "remaining_time": "0:00:52"}
|
5624 |
+
{"current_steps": 5624, "total_steps": 5627, "loss": 1.3245, "learning_rate": 2.8630686454977908e-11, "epoch": 0.9994224532409258, "percentage": 99.95, "elapsed_time": "20:40:43", "remaining_time": "0:00:39"}
|
5625 |
+
{"current_steps": 5625, "total_steps": 5627, "loss": 1.2789, "learning_rate": 1.2724751221604436e-11, "epoch": 0.9996001599360256, "percentage": 99.96, "elapsed_time": "20:40:57", "remaining_time": "0:00:26"}
|
5626 |
+
{"current_steps": 5626, "total_steps": 5627, "loss": 1.3026, "learning_rate": 3.1811880574217357e-12, "epoch": 0.9997778666311253, "percentage": 99.98, "elapsed_time": "20:41:10", "remaining_time": "0:00:13"}
|
5627 |
+
{"current_steps": 5627, "total_steps": 5627, "loss": 1.2749, "learning_rate": 0.0, "epoch": 0.9999555733262251, "percentage": 100.0, "elapsed_time": "20:41:23", "remaining_time": "0:00:00"}
|
5628 |
+
{"current_steps": 5627, "total_steps": 5627, "epoch": 0.9999555733262251, "percentage": 100.0, "elapsed_time": "20:41:41", "remaining_time": "0:00:00"}
|