End of training

Files changed (7) hide show

all_results.json CHANGED Viewed

@@ -1,14 +1,14 @@
 {
-    "epoch": 10.0,
-    "eval_loss": 3.4109785556793213,
-    "eval_runtime": 2.7479,
     "eval_samples": 7,
-    "eval_samples_per_second": 2.547,
-    "eval_steps_per_second": 0.364,
-    "perplexity": 30.294874981347323,
-    "train_loss": 3.1061488560267856,
-    "train_runtime": 125.664,
     "train_samples": 14,
-    "train_samples_per_second": 1.114,
-    "train_steps_per_second": 0.557
 }

 {
+    "epoch": 100.0,
+    "eval_loss": 5.787299633026123,
+    "eval_runtime": 2.7515,
     "eval_samples": 7,
+    "eval_samples_per_second": 2.544,
+    "eval_steps_per_second": 0.363,
+    "perplexity": 326.131160418949,
+    "train_loss": 0.858495488848005,
+    "train_runtime": 1306.0127,
     "train_samples": 14,
+    "train_samples_per_second": 1.072,
+    "train_steps_per_second": 0.536
 }

eval_results.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
-    "epoch": 10.0,
-    "eval_loss": 3.4109785556793213,
-    "eval_runtime": 2.7479,
     "eval_samples": 7,
-    "eval_samples_per_second": 2.547,
-    "eval_steps_per_second": 0.364,
-    "perplexity": 30.294874981347323
 }

 {
+    "epoch": 100.0,
+    "eval_loss": 5.787299633026123,
+    "eval_runtime": 2.7515,
     "eval_samples": 7,
+    "eval_samples_per_second": 2.544,
+    "eval_steps_per_second": 0.363,
+    "perplexity": 326.131160418949
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:890f4284a9030a91bc54603a0991d4773b39a5def8d2f3f871145df0799f871e
 size 510403817

 version https://git-lfs.github.com/spec/v1
+oid sha256:765d8b17199f60da6867acfc46c3277707402f8d4aa2ed5f3dc789e84ac5ac0e
 size 510403817

runs/Oct18_19-15-28_955a9c86ed3b/events.out.tfevents.1634584539.955a9c86ed3b.1240.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9b9572a7a2a1c10d1a92ecc437dd185bb1ec48f9586f66fe28190fee0b314acc
-size 3556

 version https://git-lfs.github.com/spec/v1
+oid sha256:c313c09245ee9d0b6f71dcafb5a8df5cb21df5e8cb33c575796b7cf407259b49
+size 3910

runs/Oct18_19-15-28_955a9c86ed3b/events.out.tfevents.1634585850.955a9c86ed3b.1240.2 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:da6f162c85d096fa063f34368e9a265f0f06318999056b6ce4c3f3c9d9568dd8
+size 311

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-    "epoch": 10.0,
-    "train_loss": 3.1061488560267856,
-    "train_runtime": 125.664,
     "train_samples": 14,
-    "train_samples_per_second": 1.114,
-    "train_steps_per_second": 0.557
 }

 {
+    "epoch": 100.0,
+    "train_loss": 0.858495488848005,
+    "train_runtime": 1306.0127,
     "train_samples": 14,
+    "train_samples_per_second": 1.072,
+    "train_steps_per_second": 0.536
 }

trainer_state.json CHANGED Viewed

@@ -1,25 +1,31 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 10.0,
-  "global_step": 70,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 10.0,
-      "step": 70,
-      "total_flos": 73161768960000.0,
-      "train_loss": 3.1061488560267856,
-      "train_runtime": 125.664,
-      "train_samples_per_second": 1.114,
-      "train_steps_per_second": 0.557
     }
   ],
-  "max_steps": 70,
-  "num_train_epochs": 10,
-  "total_flos": 73161768960000.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 100.0,
+  "global_step": 700,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 71.43,
+      "learning_rate": 1.4285714285714285e-05,
+      "loss": 1.119,
+      "step": 500
+    },
+    {
+      "epoch": 100.0,
+      "step": 700,
+      "total_flos": 731617689600000.0,
+      "train_loss": 0.858495488848005,
+      "train_runtime": 1306.0127,
+      "train_samples_per_second": 1.072,
+      "train_steps_per_second": 0.536
     }
   ],
+  "max_steps": 700,
+  "num_train_epochs": 100,
+  "total_flos": 731617689600000.0,
   "trial_name": null,
   "trial_params": null
 }