Training in progress, step 154, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +32 -4
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13587864
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16eef88422eb94e9d2420c95c1375df312b1b4ea595f24762f20b983747efe41
|
3 |
size 13587864
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27273018
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:764882108bdabde9c120b53d694588407379bf3cd5cf8bd51f06ae98b1b6ad60
|
3 |
size 27273018
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4b80374eb5b525a1eeb346cf4a22f7c07b53619389a7567c8fe8c3ad7a7556e
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8571cd03298231074ef5da5a91b5f7c590ccf8c044bb8f89ab9ac55f0cf228ef
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:544e1be73a65477247874aeff645c2a77a03a2386f9c039f21691e67953dda30
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4625c8f0544987395688ac4e887e1102183e1a5a7bbc24905bde6ed4147e8ae4
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0500dcde4e9286f0efc9accf05125c4dfcf1e260a707c8323234408753d49e72
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 1.9268525838851929,
|
3 |
"best_model_checkpoint": "miner_id_24/checkpoint-150",
|
4 |
-
"epoch":
|
5 |
"eval_steps": 25,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -1113,6 +1113,34 @@
|
|
1113 |
"eval_samples_per_second": 176.994,
|
1114 |
"eval_steps_per_second": 46.019,
|
1115 |
"step": 150
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1116 |
}
|
1117 |
],
|
1118 |
"logging_steps": 1,
|
@@ -1136,12 +1164,12 @@
|
|
1136 |
"should_evaluate": false,
|
1137 |
"should_log": false,
|
1138 |
"should_save": true,
|
1139 |
-
"should_training_stop":
|
1140 |
},
|
1141 |
"attributes": {}
|
1142 |
}
|
1143 |
},
|
1144 |
-
"total_flos": 6.
|
1145 |
"train_batch_size": 1,
|
1146 |
"trial_name": null,
|
1147 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 1.9268525838851929,
|
3 |
"best_model_checkpoint": "miner_id_24/checkpoint-150",
|
4 |
+
"epoch": 2.0073319755600814,
|
5 |
"eval_steps": 25,
|
6 |
+
"global_step": 154,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
1113 |
"eval_samples_per_second": 176.994,
|
1114 |
"eval_steps_per_second": 46.019,
|
1115 |
"step": 150
|
1116 |
+
},
|
1117 |
+
{
|
1118 |
+
"epoch": 1.9682281059063138,
|
1119 |
+
"grad_norm": 0.5727090835571289,
|
1120 |
+
"learning_rate": 3.0266391662183335e-05,
|
1121 |
+
"loss": 2.0008,
|
1122 |
+
"step": 151
|
1123 |
+
},
|
1124 |
+
{
|
1125 |
+
"epoch": 1.9812627291242362,
|
1126 |
+
"grad_norm": 0.6628953814506531,
|
1127 |
+
"learning_rate": 3.0118417936654115e-05,
|
1128 |
+
"loss": 2.2794,
|
1129 |
+
"step": 152
|
1130 |
+
},
|
1131 |
+
{
|
1132 |
+
"epoch": 1.994297352342159,
|
1133 |
+
"grad_norm": 0.3259391188621521,
|
1134 |
+
"learning_rate": 3.0029607730895854e-05,
|
1135 |
+
"loss": 2.0307,
|
1136 |
+
"step": 153
|
1137 |
+
},
|
1138 |
+
{
|
1139 |
+
"epoch": 2.0073319755600814,
|
1140 |
+
"grad_norm": 0.36595845222473145,
|
1141 |
+
"learning_rate": 2.9999999999999997e-05,
|
1142 |
+
"loss": 2.3735,
|
1143 |
+
"step": 154
|
1144 |
}
|
1145 |
],
|
1146 |
"logging_steps": 1,
|
|
|
1164 |
"should_evaluate": false,
|
1165 |
"should_log": false,
|
1166 |
"should_save": true,
|
1167 |
+
"should_training_stop": true
|
1168 |
},
|
1169 |
"attributes": {}
|
1170 |
}
|
1171 |
},
|
1172 |
+
"total_flos": 6.841916242211635e+16,
|
1173 |
"train_batch_size": 1,
|
1174 |
"trial_name": null,
|
1175 |
"trial_params": null
|