yenpolin committed on
Commit
2475c6c
·
1 Parent(s): 716fb7c

End of training

Browse files
all_results.json CHANGED
@@ -3,13 +3,13 @@
3
  "eval_loss": NaN,
4
  "eval_mean_acc": 0.0,
5
  "eval_median_acc": 0.0,
6
- "eval_runtime": 17.3158,
7
  "eval_samples": 18477,
8
- "eval_samples_per_second": 1067.062,
9
- "eval_steps_per_second": 1.444,
10
  "train_loss": 0.0,
11
- "train_runtime": 127.9233,
12
  "train_samples": 100000,
13
- "train_samples_per_second": 781.718,
14
- "train_steps_per_second": 2.447
15
  }
 
3
  "eval_loss": NaN,
4
  "eval_mean_acc": 0.0,
5
  "eval_median_acc": 0.0,
6
+ "eval_runtime": 16.7609,
7
  "eval_samples": 18477,
8
+ "eval_samples_per_second": 1102.386,
9
+ "eval_steps_per_second": 0.597,
10
  "train_loss": 0.0,
11
+ "train_runtime": 109.5006,
12
  "train_samples": 100000,
13
+ "train_samples_per_second": 913.237,
14
+ "train_steps_per_second": 0.895
15
  }
eval_results.json CHANGED
@@ -3,8 +3,8 @@
3
  "eval_loss": NaN,
4
  "eval_mean_acc": 0.0,
5
  "eval_median_acc": 0.0,
6
- "eval_runtime": 17.3158,
7
  "eval_samples": 18477,
8
- "eval_samples_per_second": 1067.062,
9
- "eval_steps_per_second": 1.444
10
  }
 
3
  "eval_loss": NaN,
4
  "eval_mean_acc": 0.0,
5
  "eval_median_acc": 0.0,
6
+ "eval_runtime": 16.7609,
7
  "eval_samples": 18477,
8
+ "eval_samples_per_second": 1102.386,
9
+ "eval_steps_per_second": 0.597
10
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 0.0,
4
- "train_runtime": 127.9233,
5
  "train_samples": 100000,
6
- "train_samples_per_second": 781.718,
7
- "train_steps_per_second": 2.447
8
  }
 
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 0.0,
4
+ "train_runtime": 109.5006,
5
  "train_samples": 100000,
6
+ "train_samples_per_second": 913.237,
7
+ "train_steps_per_second": 0.895
8
  }
trainer_state.json CHANGED
@@ -2,32 +2,22 @@
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
  "epoch": 1.0,
5
- "global_step": 313,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
- {
11
- "epoch": 0.51,
12
- "eval_loss": NaN,
13
- "eval_mean_acc": 0.0,
14
- "eval_median_acc": 0.0,
15
- "eval_runtime": 16.7694,
16
- "eval_samples_per_second": 1101.83,
17
- "eval_steps_per_second": 1.491,
18
- "step": 160
19
- },
20
  {
21
  "epoch": 1.0,
22
- "step": 313,
23
  "total_flos": 1.038017592e+16,
24
  "train_loss": 0.0,
25
- "train_runtime": 127.9233,
26
- "train_samples_per_second": 781.718,
27
- "train_steps_per_second": 2.447
28
  }
29
  ],
30
- "max_steps": 313,
31
  "num_train_epochs": 1,
32
  "total_flos": 1.038017592e+16,
33
  "trial_name": null,
 
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
  "epoch": 1.0,
5
+ "global_step": 98,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
 
 
 
 
 
 
 
 
 
 
10
  {
11
  "epoch": 1.0,
12
+ "step": 98,
13
  "total_flos": 1.038017592e+16,
14
  "train_loss": 0.0,
15
+ "train_runtime": 109.5006,
16
+ "train_samples_per_second": 913.237,
17
+ "train_steps_per_second": 0.895
18
  }
19
  ],
20
+ "max_steps": 98,
21
  "num_train_epochs": 1,
22
  "total_flos": 1.038017592e+16,
23
  "trial_name": null,