yenpolin committed on
Commit
303a5d9
·
1 Parent(s): 8d83978

End of training

Browse files
all_results.json CHANGED
@@ -3,13 +3,13 @@
3
  "eval_loss": NaN,
4
  "eval_mean_acc": 0.0,
5
  "eval_median_acc": 0.0,
6
- "eval_runtime": 16.7609,
7
  "eval_samples": 18477,
8
- "eval_samples_per_second": 1102.386,
9
- "eval_steps_per_second": 0.597,
10
  "train_loss": 0.0,
11
- "train_runtime": 109.5006,
12
  "train_samples": 100000,
13
- "train_samples_per_second": 913.237,
14
- "train_steps_per_second": 0.895
15
  }
 
3
  "eval_loss": NaN,
4
  "eval_mean_acc": 0.0,
5
  "eval_median_acc": 0.0,
6
+ "eval_runtime": 16.2793,
7
  "eval_samples": 18477,
8
+ "eval_samples_per_second": 1135.001,
9
+ "eval_steps_per_second": 0.614,
10
  "train_loss": 0.0,
11
+ "train_runtime": 124.2018,
12
  "train_samples": 100000,
13
+ "train_samples_per_second": 805.142,
14
+ "train_steps_per_second": 0.789
15
  }
eval_results.json CHANGED
@@ -3,8 +3,8 @@
3
  "eval_loss": NaN,
4
  "eval_mean_acc": 0.0,
5
  "eval_median_acc": 0.0,
6
- "eval_runtime": 16.7609,
7
  "eval_samples": 18477,
8
- "eval_samples_per_second": 1102.386,
9
- "eval_steps_per_second": 0.597
10
  }
 
3
  "eval_loss": NaN,
4
  "eval_mean_acc": 0.0,
5
  "eval_median_acc": 0.0,
6
+ "eval_runtime": 16.2793,
7
  "eval_samples": 18477,
8
+ "eval_samples_per_second": 1135.001,
9
+ "eval_steps_per_second": 0.614
10
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 0.0,
4
- "train_runtime": 109.5006,
5
  "train_samples": 100000,
6
- "train_samples_per_second": 913.237,
7
- "train_steps_per_second": 0.895
8
  }
 
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 0.0,
4
+ "train_runtime": 124.2018,
5
  "train_samples": 100000,
6
+ "train_samples_per_second": 805.142,
7
+ "train_steps_per_second": 0.789
8
  }
trainer_state.json CHANGED
@@ -7,14 +7,24 @@
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
 
 
 
 
 
 
 
 
 
 
10
  {
11
  "epoch": 1.0,
12
  "step": 98,
13
  "total_flos": 1.038017592e+16,
14
  "train_loss": 0.0,
15
- "train_runtime": 109.5006,
16
- "train_samples_per_second": 913.237,
17
- "train_steps_per_second": 0.895
18
  }
19
  ],
20
  "max_steps": 98,
 
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
+ {
11
+ "epoch": 0.51,
12
+ "eval_loss": NaN,
13
+ "eval_mean_acc": 0.0,
14
+ "eval_median_acc": 0.0,
15
+ "eval_runtime": 16.276,
16
+ "eval_samples_per_second": 1135.228,
17
+ "eval_steps_per_second": 0.614,
18
+ "step": 50
19
+ },
20
  {
21
  "epoch": 1.0,
22
  "step": 98,
23
  "total_flos": 1.038017592e+16,
24
  "train_loss": 0.0,
25
+ "train_runtime": 124.2018,
26
+ "train_samples_per_second": 805.142,
27
+ "train_steps_per_second": 0.789
28
  }
29
  ],
30
  "max_steps": 98,