Training in progress, epoch 1

Files changed (8) hide show

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:48e3134343bbdcbaa2d0e515e448ba031cd266949636f85cccb6bf345f14ac59
 size 498625128

 version https://git-lfs.github.com/spec/v1
+oid sha256:5ec2e5250bedd266bfb35bf352696ec04e794cf8fe35f9366e93b673162645e3
 size 498625128

run-1/checkpoint-563/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2999c5c45ace354242376f2be90db4238a31117d3a08d6a1feb43fe0596f3f9e
 size 498625128

 version https://git-lfs.github.com/spec/v1
+oid sha256:5ec2e5250bedd266bfb35bf352696ec04e794cf8fe35f9366e93b673162645e3
 size 498625128

run-1/checkpoint-563/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dca027a35397ca14b602cf38277bd2d0cf8431351e372bf1ed202e14cdb5cad9
 size 997370106

 version https://git-lfs.github.com/spec/v1
+oid sha256:525af664db0555aeb47054eb84b08d8993d22bb5641f3e17cbe15b11e629537a
 size 997370106

run-1/checkpoint-563/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7ed49c5af3789e22fc643ddfa776a4e4d1dac2c8b6d694f36fa76f1a6d6a6b58
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:67acb8c45f2a5267738ac2fa23235c72161e378ee00369b01362c2d3a0c9f636
 size 1064

run-1/checkpoint-563/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.5438473456606133,
   "best_model_checkpoint": "students_scores_model/run-1/checkpoint-563",
   "epoch": 1.0,
   "eval_steps": 500,
@@ -10,25 +10,25 @@
   "log_history": [
     {
       "epoch": 0.8880994671403197,
-      "grad_norm": 16.69457244873047,
-      "learning_rate": 1.3821787207411013e-05,
-      "loss": 1.0782,
       "step": 500
     },
     {
       "epoch": 1.0,
-      "eval_f1": 0.5438473456606133,
-      "eval_loss": 1.0308393239974976,
-      "eval_runtime": 37.8021,
-      "eval_samples_per_second": 59.52,
-      "eval_steps_per_second": 7.46,
       "step": 563
     }
   ],
   "logging_steps": 500,
-  "max_steps": 1689,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 3,
   "save_steps": 500,
   "stateful_callbacks": {
     "TrainerControl": {
@@ -46,9 +46,9 @@
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": {
-    "learning_rate": 1.9634145158382844e-05,
-    "num_train_epochs": 3,
     "per_device_train_batch_size": 16,
-    "weight_decay": 0.000263763325616835
   }
 }

 {
+  "best_metric": 0.5710981943306789,
   "best_model_checkpoint": "students_scores_model/run-1/checkpoint-563",
   "epoch": 1.0,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 0.8880994671403197,
+      "grad_norm": 33.513973236083984,
+      "learning_rate": 6.5983988623305475e-06,
+      "loss": 1.0854,
       "step": 500
     },
     {
       "epoch": 1.0,
+      "eval_f1": 0.5710981943306789,
+      "eval_loss": 0.9620336294174194,
+      "eval_runtime": 37.4093,
+      "eval_samples_per_second": 60.146,
+      "eval_steps_per_second": 7.538,
       "step": 563
     }
   ],
   "logging_steps": 500,
+  "max_steps": 1126,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
   "save_steps": 500,
   "stateful_callbacks": {
     "TrainerControl": {
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": {
+    "learning_rate": 1.1868685493584978e-05,
+    "num_train_epochs": 2,
     "per_device_train_batch_size": 16,
+    "weight_decay": 0.002134803775236508
   }
 }

run-1/checkpoint-563/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4b1b930fb8e91788c965e2716a6235c673c8a487c662e9f94e1672503a85155c
 size 5368

 version https://git-lfs.github.com/spec/v1
+oid sha256:b94ce251b73f8aadbf2d3b914945301b52341856da7ddaf4675709c9b25289a5
 size 5368

runs/Dec08_21-54-18_6ff5f1d99a72/events.out.tfevents.1733696071.6ff5f1d99a72.23.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:7d6c12e65a830f35a3c3363d0253606b6431e0c8184affc765d0dc2742090f6b
+size 5882

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b18f3514f71ccee1e74cafceb4cbd84c3f4bda80bd3c08496a257871a520e8eb
 size 5368

 version https://git-lfs.github.com/spec/v1
+oid sha256:b94ce251b73f8aadbf2d3b914945301b52341856da7ddaf4675709c9b25289a5
 size 5368