Mr-TD
/

Llama3-8b-MOM-Summary-Finetuned-New

Model card Files and versions Community

Mr-TD committed on Jul 8

Commit

cce3e73

•

1 Parent(s): bdb5767

Training in progress, step 50, checkpoint

Browse files

Files changed (6) hide show

last-checkpoint/adapter_model.bin +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +5 -53
last-checkpoint/training_args.bin +1 -1

last-checkpoint/adapter_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:56990d4e64657df94b286462a89a81d15aab2ff5bfc9b03b9df19fede5fc93c0
 size 109098378

 version https://git-lfs.github.com/spec/v1
+oid sha256:1c2788e275ff2fdbfec012ac7fb8eafac091166de57508ee4416b9718122b093
 size 109098378

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fad9ac4bd28f6dd06968fe126bb8a2d25fdd4d3f402fe28925f1f8f4c6f8cd01
 size 218182458

 version https://git-lfs.github.com/spec/v1
+oid sha256:823b4e4029fd13474140170c0acdd875c9e17032fb391afea7ce793b1623ae13
 size 218182458

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e75328e6be212481706506b053c5861a3db0b31645c20ab87d116a258a9a5452
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:f1e4342dc5be99a549a981dd65556fed85d338ccd355122fefa870d54060017c
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6088f970b1f0429ad85e576795204ef9269ce142d6ce9c2595b5649efde833b6
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:1d97348f8f3f5f96f2cacef5e1a65c040f53a19642348f1f05fea5ba1b9158e9
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.3020833333333333,
   "eval_steps": 500,
-  "global_step": 250,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -11,69 +11,21 @@
     {
       "epoch": 0.13,
       "learning_rate": 0.0001975746552556772,
-      "loss": 0.8817,
       "step": 25
     },
     {
       "epoch": 0.26,
       "learning_rate": 0.00018550053929480202,
-      "loss": 0.6527,
       "step": 50
-    },
-    {
-      "epoch": 0.39,
-      "learning_rate": 0.00016449948488669639,
-      "loss": 0.6045,
-      "step": 75
-    },
-    {
-      "epoch": 0.52,
-      "learning_rate": 0.000136764169663272,
-      "loss": 0.5813,
-      "step": 100
-    },
-    {
-      "epoch": 0.65,
-      "learning_rate": 0.00010519038181318999,
-      "loss": 0.5774,
-      "step": 125
-    },
-    {
-      "epoch": 0.78,
-      "learning_rate": 7.307467669163655e-05,
-      "loss": 0.5623,
-      "step": 150
-    },
-    {
-      "epoch": 0.91,
-      "learning_rate": 4.377019014049223e-05,
-      "loss": 0.5581,
-      "step": 175
-    },
-    {
-      "epoch": 1.04,
-      "learning_rate": 2.03365443542764e-05,
-      "loss": 0.5384,
-      "step": 200
-    },
-    {
-      "epoch": 1.17,
-      "learning_rate": 5.22039891260262e-06,
-      "loss": 0.537,
-      "step": 225
-    },
-    {
-      "epoch": 1.3,
-      "learning_rate": 0.0,
-      "loss": 0.4969,
-      "step": 250
     }
   ],
   "logging_steps": 25,
   "max_steps": 250,
   "num_train_epochs": 2,
   "save_steps": 50,
-  "total_flos": 1.37971841206272e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.2604166666666667,
   "eval_steps": 500,
+  "global_step": 50,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
     {
       "epoch": 0.13,
       "learning_rate": 0.0001975746552556772,
+      "loss": 0.8825,
       "step": 25
     },
     {
       "epoch": 0.26,
       "learning_rate": 0.00018550053929480202,
+      "loss": 0.6524,
       "step": 50
     }
   ],
   "logging_steps": 25,
   "max_steps": 250,
   "num_train_epochs": 2,
   "save_steps": 50,
+  "total_flos": 2825629156638720.0,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:708de3fb0d7f78ba42ebc5f0e539fb1ad08d6c5dbaf73fd4ce3446d99054170b
 size 4536

 version https://git-lfs.github.com/spec/v1
+oid sha256:642f80b637a5515fcc8833439eb2a37a5ee487f5a6d30b6350fd317f616d97f3
 size 4536