Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f20f5e81932fd147953ce18dbdc37344901ac695564b4e3fc4a2fc54bb30e60e
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:927d2222a3044127428529d408de7c0c0769db63c94c03b2aaae8160837ebf01
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c43891680cf21c3115289e73f42a523477e856d689d664decc4567be8564282
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f43edcfe5832a143b2cb08481aecf2ef8e3cc6c6c1256c7b1b28cfa5f0570e6
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -10,3 +10,10 @@
|
|
10 |
{"current_steps": 90, "total_steps": 159, "loss": 0.5662, "lr": 5e-06, "epoch": 1.6901408450704225, "percentage": 56.6, "elapsed_time": "1:28:56", "remaining_time": "1:08:11"}
|
11 |
{"current_steps": 100, "total_steps": 159, "loss": 0.5597, "lr": 5e-06, "epoch": 1.8779342723004695, "percentage": 62.89, "elapsed_time": "1:38:34", "remaining_time": "0:58:09"}
|
12 |
{"current_steps": 106, "total_steps": 159, "eval_loss": 0.5878855586051941, "epoch": 1.9906103286384975, "percentage": 66.67, "elapsed_time": "1:45:46", "remaining_time": "0:52:53"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10 |
{"current_steps": 90, "total_steps": 159, "loss": 0.5662, "lr": 5e-06, "epoch": 1.6901408450704225, "percentage": 56.6, "elapsed_time": "1:28:56", "remaining_time": "1:08:11"}
|
11 |
{"current_steps": 100, "total_steps": 159, "loss": 0.5597, "lr": 5e-06, "epoch": 1.8779342723004695, "percentage": 62.89, "elapsed_time": "1:38:34", "remaining_time": "0:58:09"}
|
12 |
{"current_steps": 106, "total_steps": 159, "eval_loss": 0.5878855586051941, "epoch": 1.9906103286384975, "percentage": 66.67, "elapsed_time": "1:45:46", "remaining_time": "0:52:53"}
|
13 |
+
{"current_steps": 110, "total_steps": 159, "loss": 0.5894, "lr": 5e-06, "epoch": 2.0657276995305165, "percentage": 69.18, "elapsed_time": "1:50:22", "remaining_time": "0:49:10"}
|
14 |
+
{"current_steps": 120, "total_steps": 159, "loss": 0.5112, "lr": 5e-06, "epoch": 2.2535211267605635, "percentage": 75.47, "elapsed_time": "2:00:01", "remaining_time": "0:39:00"}
|
15 |
+
{"current_steps": 130, "total_steps": 159, "loss": 0.5115, "lr": 5e-06, "epoch": 2.4413145539906105, "percentage": 81.76, "elapsed_time": "2:09:39", "remaining_time": "0:28:55"}
|
16 |
+
{"current_steps": 140, "total_steps": 159, "loss": 0.5121, "lr": 5e-06, "epoch": 2.629107981220657, "percentage": 88.05, "elapsed_time": "2:19:17", "remaining_time": "0:18:54"}
|
17 |
+
{"current_steps": 150, "total_steps": 159, "loss": 0.513, "lr": 5e-06, "epoch": 2.816901408450704, "percentage": 94.34, "elapsed_time": "2:28:55", "remaining_time": "0:08:56"}
|
18 |
+
{"current_steps": 159, "total_steps": 159, "eval_loss": 0.5900523066520691, "epoch": 2.9859154929577465, "percentage": 100.0, "elapsed_time": "2:39:47", "remaining_time": "0:00:00"}
|
19 |
+
{"current_steps": 159, "total_steps": 159, "epoch": 2.9859154929577465, "percentage": 100.0, "elapsed_time": "2:41:01", "remaining_time": "0:00:00"}
|