Baselhany committed on
Commit
a32b6f3
·
verified ·
1 Parent(s): 864f41d

Training in progress, step 18600, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:03a1ed5c90eda41e8ca9b7169559116cb5239e526627278e8b83429bda1bc450
3
  size 290403936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:836232e2ae3615bdffe832e9aae3bfe8a6a5e3f2341f18775b95bbade3a09e0a
3
  size 290403936
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4f8e87f5e4b08e46b3e75649df349d5b4fb594960164f2de19d18140a369834
3
  size 574811514
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b17e9ee1fe06813dba52c72e9bdf75e0ea7b8c7efe03ba060f9eeee01d3e68e8
3
  size 574811514
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b24b050a4497d2df6e7b62cfcfc4d42779850867386d0439e998a176affdfa5c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1c99a85b3235c08a2f7456fdd3f030b9e3b62228fae9a7361d4c5547a39cb7e
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f29b82604f7335f435c091689ced5b7937e31a97e2f9451a4908d45d79903d2
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f628c1b20976013ecb473aea3b4cbce7b25cc3d4915b1feb5ea96f37cfaae9f1
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 11.398892348386742,
3
  "best_model_checkpoint": "./Whisper_base_fine_tune_Quran/checkpoint-14800",
4
- "epoch": 6.478831088812605,
5
  "eval_steps": 200,
6
- "global_step": 18400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -3503,6 +3503,44 @@
3503
  "eval_steps_per_second": 0.16,
3504
  "eval_wer": 11.566968836965806,
3505
  "step": 18400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3506
  }
3507
  ],
3508
  "logging_steps": 50,
@@ -3517,12 +3555,12 @@
3517
  "should_evaluate": false,
3518
  "should_log": false,
3519
  "should_save": true,
3520
- "should_training_stop": false
3521
  },
3522
  "attributes": {}
3523
  }
3524
  },
3525
- "total_flos": 7.6379131478016e+19,
3526
  "train_batch_size": 16,
3527
  "trial_name": null,
3528
  "trial_params": null
 
1
  {
2
  "best_metric": 11.398892348386742,
3
  "best_model_checkpoint": "./Whisper_base_fine_tune_Quran/checkpoint-14800",
4
+ "epoch": 6.549247425402694,
5
  "eval_steps": 200,
6
+ "global_step": 18600,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
3503
  "eval_steps_per_second": 0.16,
3504
  "eval_wer": 11.566968836965806,
3505
  "step": 18400
3506
+ },
3507
+ {
3508
+ "epoch": 6.496435172960127,
3509
+ "grad_norm": 6578.0205078125,
3510
+ "learning_rate": 1.694496166129711e-08,
3511
+ "loss": 0.0012,
3512
+ "step": 18450
3513
+ },
3514
+ {
3515
+ "epoch": 6.514039257107649,
3516
+ "grad_norm": 19422.87109375,
3517
+ "learning_rate": 7.53133041307974e-09,
3518
+ "loss": 0.001,
3519
+ "step": 18500
3520
+ },
3521
+ {
3522
+ "epoch": 6.5316433412551715,
3523
+ "grad_norm": 14675.833984375,
3524
+ "learning_rate": 1.8828680551918888e-09,
3525
+ "loss": 0.0013,
3526
+ "step": 18550
3527
+ },
3528
+ {
3529
+ "epoch": 6.549247425402694,
3530
+ "grad_norm": 26447.1796875,
3531
+ "learning_rate": 0.0,
3532
+ "loss": 0.0012,
3533
+ "step": 18600
3534
+ },
3535
+ {
3536
+ "epoch": 6.549247425402694,
3537
+ "eval_cer": 3.793663662027795,
3538
+ "eval_loss": 0.012004045769572258,
3539
+ "eval_runtime": 1511.039,
3540
+ "eval_samples_per_second": 2.559,
3541
+ "eval_steps_per_second": 0.16,
3542
+ "eval_wer": 11.577990246052957,
3543
+ "step": 18600
3544
  }
3545
  ],
3546
  "logging_steps": 50,
 
3555
  "should_evaluate": false,
3556
  "should_log": false,
3557
  "should_save": true,
3558
+ "should_training_stop": true
3559
  },
3560
  "attributes": {}
3561
  }
3562
  },
3563
+ "total_flos": 7.7209339428864e+19,
3564
  "train_batch_size": 16,
3565
  "trial_name": null,
3566
  "trial_params": null