Training in progress, epoch 1, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ee687c6b4d3e5ead2dffe570df735ac824ae830a7629b47a0b2397c525b02930
 size 27024

 version https://git-lfs.github.com/spec/v1
+oid sha256:c14eadf65048b83a72a07318990b712fb81ee2d420d364dedb6d9136fb8275ac
 size 27024

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2c7ac929589bd59efd8c74838ed47e6c16ae42a989cb7b51f09f61c0c64bb092
 size 63910

 version https://git-lfs.github.com/spec/v1
+oid sha256:f203216bc765834d4696952f7ded4d7087b3060c42d85bf085c66a5d1d3ddf86
 size 63910

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9d629fd5ba76e13469b4aa16dbfd3640d000777b913859f3961e56315077ff55
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:2d5ef96773eb758f89d6d8e0e5fe21bd00478f734b3101286128c5c2286df533
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b529c6dc606f7c4af8932b65821eaa427faee70c004932409321363fc742ca82
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:e22ca0a50bab80d00c8b8910bffb983a348f8762b7cf025e6f8e64a05a938289
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.9961685823754789,
   "eval_steps": 500,
-  "global_step": 195,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1380,6 +1380,21 @@
       "eval_samples_per_second": 145.877,
       "eval_steps_per_second": 145.877,
       "step": 195
     }
   ],
   "logging_steps": 1,
@@ -1394,12 +1409,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 2531225272320.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.0012771392081736,
   "eval_steps": 500,
+  "global_step": 196,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 145.877,
       "eval_steps_per_second": 145.877,
       "step": 195
+    },
+    {
+      "epoch": 1.0012771392081736,
+      "grad_norm": 0.08981695771217346,
+      "learning_rate": 0.0,
+      "loss": 12.4365,
+      "step": 196
+    },
+    {
+      "epoch": 1.0012771392081736,
+      "eval_loss": 10.354520797729492,
+      "eval_runtime": 0.2791,
+      "eval_samples_per_second": 150.484,
+      "eval_steps_per_second": 150.484,
+      "step": 196
     }
   ],
   "logging_steps": 1,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 2534457999360.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null