sedrickkeh commited on
Commit
af0bd0c
·
verified ·
1 Parent(s): f7693b4

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78fd94ad3968700809ca0e962ef45325ebb374cf76999877fcf72fc99231789f
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74aa81d766747d487f5a38c3cc685cf2b5658a2f161daf2b57bdc1187a83427c
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a28c7b7aa51e100c8798ccb28a9aa3fe9af3829bd52ed19bab34bb353f4c0cd
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29820c7b952833040fb380b8d89b2b1fded592db490f56481f1e40a5b9eb21a6
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:366f6f0412276de2cba9064f23c048c520697b19c3f7b80ea2b08d1b9f51db33
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecfc94d45b1253da45117f224273a2546ee2b608d664169272b166a1b7a6fe77
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ef2051c3e4487831ff26c72af7cb550d3ac2433d172fcefc1845b6236bd64e8
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c8a6d37e7d9880f56f58873302a20d4f642dd63a9074b300d21d93b823f6627
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -12,3 +12,10 @@
12
  {"current_steps": 110, "total_steps": 177, "loss": 0.6543, "lr": 5e-06, "epoch": 1.8469601677148848, "percentage": 62.15, "elapsed_time": "1:48:08", "remaining_time": "1:05:52"}
13
  {"current_steps": 119, "total_steps": 177, "eval_loss": 0.6759442090988159, "epoch": 1.9979035639412999, "percentage": 67.23, "elapsed_time": "1:57:51", "remaining_time": "0:57:26"}
14
  {"current_steps": 120, "total_steps": 177, "loss": 0.6821, "lr": 5e-06, "epoch": 2.0167714884696015, "percentage": 67.8, "elapsed_time": "2:00:03", "remaining_time": "0:57:01"}
 
 
 
 
 
 
 
 
12
  {"current_steps": 110, "total_steps": 177, "loss": 0.6543, "lr": 5e-06, "epoch": 1.8469601677148848, "percentage": 62.15, "elapsed_time": "1:48:08", "remaining_time": "1:05:52"}
13
  {"current_steps": 119, "total_steps": 177, "eval_loss": 0.6759442090988159, "epoch": 1.9979035639412999, "percentage": 67.23, "elapsed_time": "1:57:51", "remaining_time": "0:57:26"}
14
  {"current_steps": 120, "total_steps": 177, "loss": 0.6821, "lr": 5e-06, "epoch": 2.0167714884696015, "percentage": 67.8, "elapsed_time": "2:00:03", "remaining_time": "0:57:01"}
15
+ {"current_steps": 130, "total_steps": 177, "loss": 0.6222, "lr": 5e-06, "epoch": 2.1844863731656186, "percentage": 73.45, "elapsed_time": "2:09:40", "remaining_time": "0:46:52"}
16
+ {"current_steps": 140, "total_steps": 177, "loss": 0.6206, "lr": 5e-06, "epoch": 2.352201257861635, "percentage": 79.1, "elapsed_time": "2:19:18", "remaining_time": "0:36:49"}
17
+ {"current_steps": 150, "total_steps": 177, "loss": 0.6165, "lr": 5e-06, "epoch": 2.519916142557652, "percentage": 84.75, "elapsed_time": "2:28:56", "remaining_time": "0:26:48"}
18
+ {"current_steps": 160, "total_steps": 177, "loss": 0.6165, "lr": 5e-06, "epoch": 2.6876310272536688, "percentage": 90.4, "elapsed_time": "2:38:34", "remaining_time": "0:16:50"}
19
+ {"current_steps": 170, "total_steps": 177, "loss": 0.6175, "lr": 5e-06, "epoch": 2.8553459119496853, "percentage": 96.05, "elapsed_time": "2:48:12", "remaining_time": "0:06:55"}
20
+ {"current_steps": 177, "total_steps": 177, "eval_loss": 0.6712015867233276, "epoch": 2.9727463312368974, "percentage": 100.0, "elapsed_time": "2:57:17", "remaining_time": "0:00:00"}
21
+ {"current_steps": 177, "total_steps": 177, "epoch": 2.9727463312368974, "percentage": 100.0, "elapsed_time": "2:58:32", "remaining_time": "0:00:00"}