Training in progress, step 12000

Browse files

Files changed (13) hide show

{checkpoint-11000 → checkpoint-12000}/config.json +0 -0
{checkpoint-11000 → checkpoint-12000}/optimizer.pt +1 -1
{checkpoint-11000 → checkpoint-12000}/pytorch_model.bin +1 -1
{checkpoint-11000 → checkpoint-12000}/rng_state.pth +1 -1
{checkpoint-11000 → checkpoint-12000}/scheduler.pt +1 -1
{checkpoint-11000 → checkpoint-12000}/special_tokens_map.json +0 -0
{checkpoint-11000 → checkpoint-12000}/tokenizer.json +0 -0
{checkpoint-11000 → checkpoint-12000}/tokenizer_config.json +0 -0
{checkpoint-11000 → checkpoint-12000}/trainer_state.json +55 -3
{checkpoint-11000 → checkpoint-12000}/training_args.bin +0 -0
{checkpoint-11000 → checkpoint-12000}/vocab.txt +0 -0
pytorch_model.bin +1 -1
runs/Jul23_01-08-06_df8adf32a670/events.out.tfevents.1690074496.df8adf32a670.1420.0 +2 -2

{checkpoint-11000 → checkpoint-12000}/config.json RENAMED Viewed

File without changes

{checkpoint-11000 → checkpoint-12000}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a7121353f67016220d0ba6e07bd91a440d339f7e5ae43637ec5df1821dca53d0
 size 267028677

 version https://git-lfs.github.com/spec/v1
+oid sha256:14dbf8bfdaff0d358c50ba58b2e37e228971d18c40ded342ff3414bc23c55625
 size 267028677

{checkpoint-11000 → checkpoint-12000}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6b2d123eec1e3724e36f27638d03c43ed031e88f237dbef0f0139dfab99cb872
 size 133523761

 version https://git-lfs.github.com/spec/v1
+oid sha256:f464404bbabf4ffc076175dc0dd64bed9ebbae82e692e4cc0d024912d83b0bf7
 size 133523761

{checkpoint-11000 → checkpoint-12000}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f611266503706b42390c0157b3936fc5fd122440ae086d8d5ee5411a8edfeafa
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:0e99597d92b26233312419b8d7606c8fbe7f7558947be013db496307a49ea89f
 size 14575

{checkpoint-11000 → checkpoint-12000}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:91ff66b19ca53b4aad8b20e30491f86f0e0556ec5ed0d4287237a1e66d619793
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:ee8b6ab7544af193bb6ba46a2bee0e0abe8937e6b54f5dea5a487ee681ff4d17
 size 627

{checkpoint-11000 → checkpoint-12000}/special_tokens_map.json RENAMED Viewed

File without changes

{checkpoint-11000 → checkpoint-12000}/tokenizer.json RENAMED Viewed

File without changes

{checkpoint-11000 → checkpoint-12000}/tokenizer_config.json RENAMED Viewed

File without changes

{checkpoint-11000 → checkpoint-12000}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 4.4,
-  "global_step": 11000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -454,11 +454,63 @@
       "eval_system_ram_total": 83.48074722290039,
       "eval_system_ram_used": 4.0838470458984375,
       "step": 10625
     }
   ],
   "max_steps": 12500,
   "num_train_epochs": 5,
-  "total_flos": 5590392214928640.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 4.8,
+  "global_step": 12000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_system_ram_total": 83.48074722290039,
       "eval_system_ram_used": 4.0838470458984375,
       "step": 10625
+    },
+    {
+      "epoch": 4.5,
+      "learning_rate": 2.0064000000000004e-06,
+      "loss": 0.6446,
+      "step": 11250
+    },
+    {
+      "epoch": 4.5,
+      "eval_accuracy": 0.7358,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.469707489013672,
+      "eval_f1": 0.7322672918855475,
+      "eval_gpu_ram_allocated": 0.39359617233276367,
+      "eval_gpu_ram_cached": 16.05078125,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 31,
+      "eval_loss": 0.8464106321334839,
+      "eval_precision": 0.7319786149192336,
+      "eval_recall": 0.7358,
+      "eval_runtime": 15.2922,
+      "eval_samples_per_second": 1307.853,
+      "eval_steps_per_second": 40.87,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 3.8687171936035156,
+      "step": 11250
+    },
+    {
+      "epoch": 4.75,
+      "learning_rate": 1.0064e-06,
+      "loss": 0.6355,
+      "step": 11875
+    },
+    {
+      "epoch": 4.75,
+      "eval_accuracy": 0.73495,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.470008850097656,
+      "eval_f1": 0.7311394674076037,
+      "eval_gpu_ram_allocated": 0.39347314834594727,
+      "eval_gpu_ram_cached": 16.05078125,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 30,
+      "eval_loss": 0.850346565246582,
+      "eval_precision": 0.7308376671248696,
+      "eval_recall": 0.73495,
+      "eval_runtime": 15.2775,
+      "eval_samples_per_second": 1309.111,
+      "eval_steps_per_second": 40.91,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 3.8853225708007812,
+      "step": 11875
     }
   ],
   "max_steps": 12500,
   "num_train_epochs": 5,
+  "total_flos": 6101292142348032.0,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-11000 → checkpoint-12000}/training_args.bin RENAMED Viewed

File without changes

{checkpoint-11000 → checkpoint-12000}/vocab.txt RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:59529ca11cd16e7f3bbb54ae86a9114f2c52ef602c31399728eb28f1e3d1a68e
 size 133523761

 version https://git-lfs.github.com/spec/v1
+oid sha256:f464404bbabf4ffc076175dc0dd64bed9ebbae82e692e4cc0d024912d83b0bf7
 size 133523761

runs/Jul23_01-08-06_df8adf32a670/events.out.tfevents.1690074496.df8adf32a670.1420.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39a09110f783e2e5350e99889528776802102f16699d8374cb32da164aa43612
-size 24718

 version https://git-lfs.github.com/spec/v1
+oid sha256:fb8b338480dce9596ce62d102b2c3b4e900091413645f35902e9c12c0c481491
+size 25820