Training in progress, step 15, checkpoint

Browse files

Files changed (12) hide show

last-checkpoint/adapter_model.safetensors +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +46 -3

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:434d4ba0a77faed75e243ca391a4b5da85883f9a03d5325c5437970ac3c80873
 size 50503544

 version https://git-lfs.github.com/spec/v1
+oid sha256:6f34852b64327509c6719a0ba9c958e37d74df9a1a5223f3b4a772a7ffeab0b4
 size 50503544

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:deb2258cc4c784862b7e9f9b897320dae9ad4a01d29471fb7d291773e98948f6
 size 25986148

 version https://git-lfs.github.com/spec/v1
+oid sha256:91008858bc4f68950e73897c7142d989181b2126363548c3ab4bbceceef6b473
 size 25986148

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:22a8ea6f872ad69b36a140052965078e0a1e019eff596980afdef00155896881
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:d208fc8ffc06a5de0e78a66250af5e4040febbcf16cdc254af2f5493300ac1c9
 size 15984

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3ac99ee8e22746ac5d76a305ad5b41f5db35e50e5bf8e6923c976375c5dd9c11
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:171729bc4986a9839636ee98592d71f8b00583a8eaabd1d63cf9d7610cef9d8e
 size 15984

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3ee7bc09cc5a34a5399c7ac2031fe648cc8f7c7c45cfe9a6a5f195d546cb4e07
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:e28a9e95efff5f4fdbdab6994e651e446586624a0f8b61ff953351f9ace2fd28
 size 15984

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b5bc4d5b483cd0139d1dd6497c17adfd72199395dd9fb59760db4eeefb18d90d
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:a87f5e3936866d69d87c5ebfdc7bf0d96d0c6bd727c3a6dbd5f5cb4c98ccb1ee
 size 15984

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f146764400aee269ace30336f52d5b91a0e05b6413450f2da5ab7e40cccbfc22
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:99817fbab47484f57146aab5db5d1d20950343ead7ff360b6f6af4b55cb9d971
 size 15984

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:00b5709b9458937bdf0beba73ee9c1b24aa748fbe41f4e89256fabae5db1ea04
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:dd6d7b5374da01deb55707ef3ca400e859d43ff9196f00ccd1413b068442c0ac
 size 15984

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:14d62a3d1654c081e8c665b79a207d9450a999239c270cf50a0ffae1c57648b9
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:7c436452d7af3913a771cc03d673e6c05ed368a9b1cf6d0e23e1bfe1832a5e7c
 size 15984

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:901aa808fd1c4548a3a0d072638a38f2fb141a4a2dbe1b2636bc961acd923b85
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:7f09039d225663348fb992c94c210c08e9332bf92c2e8818ce5057bb9610639d
 size 15984

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b4849a6ac0a1d895740f1ab4eba9d346b8d898008d0cfe93dd108cd928d7c63e
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:f193dee591957702c791ef1b0861987f5cc59c358aa6dd7c5c0054f6dbca1910
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.6153846153846154,
   "eval_steps": 5,
-  "global_step": 10,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -101,6 +101,49 @@
       "eval_samples_per_second": 93.837,
       "eval_steps_per_second": 5.999,
       "step": 10
     }
   ],
   "logging_steps": 1,
@@ -120,7 +163,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 6.587960141021184e+16,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.9230769230769231,
   "eval_steps": 5,
+  "global_step": 15,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 93.837,
       "eval_steps_per_second": 5.999,
       "step": 10
+    },
+    {
+      "epoch": 0.676923076923077,
+      "grad_norm": 14.431711196899414,
+      "learning_rate": 9.504844339512095e-05,
+      "loss": 2.9499,
+      "step": 11
+    },
+    {
+      "epoch": 0.7384615384615385,
+      "grad_norm": 16.134414672851562,
+      "learning_rate": 8.117449009293668e-05,
+      "loss": 2.4818,
+      "step": 12
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 22.951139450073242,
+      "learning_rate": 6.112604669781572e-05,
+      "loss": 2.4057,
+      "step": 13
+    },
+    {
+      "epoch": 0.8615384615384616,
+      "grad_norm": 21.449586868286133,
+      "learning_rate": 3.887395330218429e-05,
+      "loss": 1.8603,
+      "step": 14
+    },
+    {
+      "epoch": 0.9230769230769231,
+      "grad_norm": 11.409588813781738,
+      "learning_rate": 1.8825509907063327e-05,
+      "loss": 1.6571,
+      "step": 15
+    },
+    {
+      "epoch": 0.9230769230769231,
+      "eval_loss": 1.7483874559402466,
+      "eval_runtime": 2.3419,
+      "eval_samples_per_second": 93.513,
+      "eval_steps_per_second": 5.978,
+      "step": 15
     }
   ],
   "logging_steps": 1,
       "attributes": {}
     }
   },
+  "total_flos": 9.881940211531776e+16,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null