Training in progress, step 20000, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 151061672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0e990b8c59e5598bc297637494bbcf3292ed66e258b527d11c54b5a554dd78b
|
3 |
size 151061672
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 297616186
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfc6de0cae9b656e0e1e839065e8e2053eceee36ee727f37817b3df325ab9bae
|
3 |
size 297616186
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:932c14fa744620038ccb3fdad1e196a4baf73b772af6a561bc48ddacc72a5fe7
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55d42527fa9bec4d3688be19c35898c0c615e532c0d2f87ab4ced258be498427
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 13.344171052269033,
|
3 |
"best_model_checkpoint": "./Whisper_tiny_fine_tune_Quran/checkpoint-19600",
|
4 |
-
"epoch":
|
5 |
"eval_steps": 400,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -3276,12 +3276,43 @@
|
|
3276 |
"learning_rate": 5.912536872321184e-10,
|
3277 |
"loss": 0.0011,
|
3278 |
"step": 19850
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3279 |
}
|
3280 |
],
|
3281 |
"logging_steps": 50,
|
3282 |
-
"max_steps":
|
3283 |
"num_input_tokens_seen": 0,
|
3284 |
-
"num_train_epochs":
|
3285 |
"save_steps": 400,
|
3286 |
"stateful_callbacks": {
|
3287 |
"TrainerControl": {
|
@@ -3290,12 +3321,12 @@
|
|
3290 |
"should_evaluate": false,
|
3291 |
"should_log": false,
|
3292 |
"should_save": true,
|
3293 |
-
"should_training_stop":
|
3294 |
},
|
3295 |
"attributes": {}
|
3296 |
}
|
3297 |
},
|
3298 |
-
"total_flos": 3.
|
3299 |
"train_batch_size": 16,
|
3300 |
"trial_name": null,
|
3301 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 13.344171052269033,
|
3 |
"best_model_checkpoint": "./Whisper_tiny_fine_tune_Quran/checkpoint-19600",
|
4 |
+
"epoch": 7.042249801954053,
|
5 |
"eval_steps": 400,
|
6 |
+
"global_step": 20000,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
3276 |
"learning_rate": 5.912536872321184e-10,
|
3277 |
"loss": 0.0011,
|
3278 |
"step": 19850
|
3279 |
+
},
|
3280 |
+
{
|
3281 |
+
"epoch": 7.007041633659009,
|
3282 |
+
"grad_norm": 12099.953125,
|
3283 |
+
"learning_rate": 3.921831902685302e-06,
|
3284 |
+
"loss": 0.0014,
|
3285 |
+
"step": 19900
|
3286 |
+
},
|
3287 |
+
{
|
3288 |
+
"epoch": 7.024645717806531,
|
3289 |
+
"grad_norm": 23940.55859375,
|
3290 |
+
"learning_rate": 3.7857595969273683e-06,
|
3291 |
+
"loss": 0.0013,
|
3292 |
+
"step": 19950
|
3293 |
+
},
|
3294 |
+
{
|
3295 |
+
"epoch": 7.042249801954053,
|
3296 |
+
"grad_norm": 2267.954345703125,
|
3297 |
+
"learning_rate": 3.6519968320574414e-06,
|
3298 |
+
"loss": 0.0015,
|
3299 |
+
"step": 20000
|
3300 |
+
},
|
3301 |
+
{
|
3302 |
+
"epoch": 7.042249801954053,
|
3303 |
+
"eval_cer": 4.152554049853721,
|
3304 |
+
"eval_loss": 0.013851560652256012,
|
3305 |
+
"eval_runtime": 1119.0933,
|
3306 |
+
"eval_samples_per_second": 3.455,
|
3307 |
+
"eval_steps_per_second": 0.216,
|
3308 |
+
"eval_wer": 13.55082247265313,
|
3309 |
+
"step": 20000
|
3310 |
}
|
3311 |
],
|
3312 |
"logging_steps": 50,
|
3313 |
+
"max_steps": 22720,
|
3314 |
"num_input_tokens_seen": 0,
|
3315 |
+
"num_train_epochs": 8,
|
3316 |
"save_steps": 400,
|
3317 |
"stateful_callbacks": {
|
3318 |
"TrainerControl": {
|
|
|
3321 |
"should_evaluate": false,
|
3322 |
"should_log": false,
|
3323 |
"should_save": true,
|
3324 |
+
"should_training_stop": false
|
3325 |
},
|
3326 |
"attributes": {}
|
3327 |
}
|
3328 |
},
|
3329 |
+
"total_flos": 3.15121729536e+19,
|
3330 |
"train_batch_size": 16,
|
3331 |
"trial_name": null,
|
3332 |
"trial_params": null
|
last-checkpoint/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5560
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06a7832067efe8483eff726dfa1a1062ec2edca1a7bb138e313286ac232b4dbf
|
3 |
size 5560
|