Training in progress, step 20040

Files changed (8) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3ec7e54952bc54ca05e6a7c9817a51d21c2b914c81f6e55d54a50404ef5736be
 size 6319689

 version https://git-lfs.github.com/spec/v1
+oid sha256:49a9d4479ab81c206da26a1466ae173504ca995ede4e55d1bc18fce1df67b042
 size 6319689

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d7f79f3c42580dee8e32d426568e5ae031b6874f33c3913b68cc8c7af0742467
 size 1121737121

 version https://git-lfs.github.com/spec/v1
+oid sha256:4b7519f227d3c07ddf3df757968ff707de4dbbf2dbc4f1f71161830b700c55e5
 size 1121737121

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9c685d97b074863e580814a25b52c10d0780108aad591f1da31aa06488b8f12c
 size 14639

 version https://git-lfs.github.com/spec/v1
+oid sha256:da6c9e12beb94b7c12139c56f51164322bd23825c31ff719fbd3c777e3951565
 size 14639

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7eecebc2e496c20147235b282760a916bd72d06e3ae62a3320ff8008631f1566
 size 557

 version https://git-lfs.github.com/spec/v1
+oid sha256:d6e2aa9d6ca48b39b3e26e013343899d80b7cef352ad6e422a4633c48e8f6b83
 size 557

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dee86f8605bc08f195b3c17973806ad73c2ebfe99fec8f213523cd3f7624193e
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:ef6700cd562244019f5168fd7177dc8c3ba417e6a293e30f76daf923e92625ab
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.22040079185913242,
-  "global_step": 19038,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -132,11 +132,17 @@
       "learning_rate": 1.5602866437444287e-05,
       "loss": 1.5247,
       "step": 19000
     }
   ],
   "max_steps": 86379,
   "num_train_epochs": 1,
-  "total_flos": 3.545343573413069e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.23200083353592887,
+  "global_step": 20040,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.5602866437444287e-05,
       "loss": 1.5247,
       "step": 19000
+    },
+    {
+      "epoch": 0.23,
+      "learning_rate": 1.5371560217182417e-05,
+      "loss": 1.5199,
+      "step": 20000
     }
   ],
   "max_steps": 86379,
   "num_train_epochs": 1,
+  "total_flos": 3.731940603592704e+16,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d7f79f3c42580dee8e32d426568e5ae031b6874f33c3913b68cc8c7af0742467
 size 1121737121

 version https://git-lfs.github.com/spec/v1
+oid sha256:4b7519f227d3c07ddf3df757968ff707de4dbbf2dbc4f1f71161830b700c55e5
 size 1121737121

runs/Jun04_02-06-39_4367d7224c9f/events.out.tfevents.1685845095.4367d7224c9f.857.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5cb4a9448529bb31dc3bce9d9f47191cd0792bd9b7c7d468ac164df8a193b27f
-size 5768

 version https://git-lfs.github.com/spec/v1
+oid sha256:53741a98d0ebfc0680eee44685402916d8e856e3ccff93783cdd5fd7c63ff929
+size 5928