Training in progress, step 21042

Files changed (8) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:49a9d4479ab81c206da26a1466ae173504ca995ede4e55d1bc18fce1df67b042
 size 6319689

 version https://git-lfs.github.com/spec/v1
+oid sha256:2e65f053f2963eb8945280988d6f16c4b7d758e4c12b63a679651ad22bd08338
 size 6319689

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4b7519f227d3c07ddf3df757968ff707de4dbbf2dbc4f1f71161830b700c55e5
 size 1121737121

 version https://git-lfs.github.com/spec/v1
+oid sha256:7d58f0865ba9cd63f9eff84f57a722722e94934e0295387b1f2b33a78c03d538
 size 1121737121

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:da6c9e12beb94b7c12139c56f51164322bd23825c31ff719fbd3c777e3951565
 size 14639

 version https://git-lfs.github.com/spec/v1
+oid sha256:317ce681e8eb1423dabc4b84cd994b1ad7ffa68a4667dc7cd899238214cf68a9
 size 14639

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d6e2aa9d6ca48b39b3e26e013343899d80b7cef352ad6e422a4633c48e8f6b83
 size 557

 version https://git-lfs.github.com/spec/v1
+oid sha256:fa09a791e2030012fbe7f9194bef77b7c004978a95455d3032ff0f9883fb6681
 size 557

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ef6700cd562244019f5168fd7177dc8c3ba417e6a293e30f76daf923e92625ab
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:27d27d07af3c091744b7367354198e2990d77e9a99302e949d949c391bcd3fc8
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.23200083353592887,
-  "global_step": 20040,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -138,11 +138,17 @@
       "learning_rate": 1.5371560217182417e-05,
       "loss": 1.5199,
       "step": 20000
     }
   ],
   "max_steps": 86379,
   "num_train_epochs": 1,
-  "total_flos": 3.731940603592704e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.2436008752127253,
+  "global_step": 21042,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.5371560217182417e-05,
       "loss": 1.5199,
       "step": 20000
+    },
+    {
+      "epoch": 0.24,
+      "learning_rate": 1.514002245916253e-05,
+      "loss": 1.5341,
+      "step": 21000
     }
   ],
   "max_steps": 86379,
   "num_train_epochs": 1,
+  "total_flos": 3.918537633772339e+16,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4b7519f227d3c07ddf3df757968ff707de4dbbf2dbc4f1f71161830b700c55e5
 size 1121737121

 version https://git-lfs.github.com/spec/v1
+oid sha256:7d58f0865ba9cd63f9eff84f57a722722e94934e0295387b1f2b33a78c03d538
 size 1121737121

runs/Jun04_02-06-39_4367d7224c9f/events.out.tfevents.1685845095.4367d7224c9f.857.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:53741a98d0ebfc0680eee44685402916d8e856e3ccff93783cdd5fd7c63ff929
-size 5928

 version https://git-lfs.github.com/spec/v1
+oid sha256:49bfc265402cf80e1d700c8e0170c924cd5e0da85a4012b3cdd14e239cdbd11e
+size 6088