Training in progress, step 34, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fdcb24de1af5f355fc6f397e4fa176ccce4da7d84ca6236d312fba7b37713538
 size 608249904

 version https://git-lfs.github.com/spec/v1
+oid sha256:c03d71f7ab330b18ad346334a241748f2b1444a605f5c518969f069576d47ec4
 size 608249904

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8ccb04434d6a3e161cb9878b4b3f57d668a8fa7cba2c332a3987cff25c456169
 size 43122580

 version https://git-lfs.github.com/spec/v1
+oid sha256:76ebe3643a2223dc55588522f451fcf84c1f3f26255dde8a61a9e2cef46a77c3
 size 43122580

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:45d933a07aade8a49bb8dc8d3bcb7da3273871b976473408cd44c3a5c6bcd640
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:0ca28602a8329d58469fb3371a0eb088334bc1b9324ec2b3e34c9885c7b95763
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:27ca192899ed606f0971eef111fc1026e18024acb472ba59e8b2804c88f803cf
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:1fe247b8abd9f098bbbafb55011dbe010f2fe145118845b911d1500aa9422fe0
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.7941176470588235,
   "eval_steps": 7,
-  "global_step": 27,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -53,6 +53,21 @@
       "eval_samples_per_second": 18.775,
       "eval_steps_per_second": 2.367,
       "step": 21
     }
   ],
   "logging_steps": 10,
@@ -67,12 +82,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 7.571537823950438e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.0,
   "eval_steps": 7,
+  "global_step": 34,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 18.775,
       "eval_steps_per_second": 2.367,
       "step": 21
+    },
+    {
+      "epoch": 0.8235294117647058,
+      "eval_loss": 2.1168278180994093e-05,
+      "eval_runtime": 12.3009,
+      "eval_samples_per_second": 18.698,
+      "eval_steps_per_second": 2.358,
+      "step": 28
+    },
+    {
+      "epoch": 0.8823529411764706,
+      "grad_norm": 0.0023900624364614487,
+      "learning_rate": 3.8060233744356633e-06,
+      "loss": 0.0,
+      "step": 30
     }
   ],
   "logging_steps": 10,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 9.532338273150566e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null