Training in progress, step 86, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ca64e1bc21a66cf4f936b2ed516611c1088c1ad25b25c70c0440ed384e73b515
 size 97728

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1a9c52ed13da5612a14112158920cca2f09b9a89974273eb5e0bb27768cd11a
 size 97728

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:db697e1991b34936f0d77b86b5e578a88bd35b26f670092c6126c393e25ef29d
 size 212298

 version https://git-lfs.github.com/spec/v1
+oid sha256:9682ca5fb57b1689756727eac9a7184e622c893fdee97446f578996d94aefd55
 size 212298

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:24eab67923497bc06cae1eaf0b8b5de49eefa88609da76e041852bb21060b40a
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:a062223c58d6bce32f13c4933c306b16cc26ff4708e733ebc3ca0df52404bb19
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5d1e4429a3b99e660815786d3a7846a2fc0f39f97c2ce4dd14d2b15e5d88b2c2
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:12f81afce521056555d6c5a2a40e41e87a722cdb1ae567ea49429c16d514f88b
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.833698030634573,
   "eval_steps": 8,
-  "global_step": 80,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -277,6 +277,20 @@
       "eval_samples_per_second": 134.151,
       "eval_steps_per_second": 67.767,
       "step": 80
     }
   ],
   "logging_steps": 3,
@@ -291,12 +305,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 34334732845056.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 3.060175054704595,
   "eval_steps": 8,
+  "global_step": 86,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 134.151,
       "eval_steps_per_second": 67.767,
       "step": 80
+    },
+    {
+      "epoch": 2.8687089715536107,
+      "grad_norm": 0.08289742469787598,
+      "learning_rate": 2.818843167645835e-06,
+      "loss": 10.2928,
+      "step": 81
+    },
+    {
+      "epoch": 2.973741794310722,
+      "grad_norm": 0.08898758143186569,
+      "learning_rate": 4.5280774269154115e-07,
+      "loss": 10.5421,
+      "step": 84
     }
   ],
   "logging_steps": 3,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 36914181439488.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null