sheepy928 committed on
Commit
331c4c0
1 Parent(s): dd0e661

Training in progress, step 100, checkpoint

Browse files
checkpoint-100/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7346ec1ae7c9b8c42ee468ae13423be6aa1c8975467ce0e77a27b489c7fe012
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82badac31c39aef875e8457adefd9fd641ee6da84e3f503212042d11a47d703c
3
  size 14244
checkpoint-100/trainer_state.json CHANGED
@@ -23,10 +23,14 @@
23
  {
24
  "epoch": 0.06,
25
  "eval_accuracy": 0.44479243019924036,
 
 
26
  "eval_loss": 1.065091609954834,
27
- "eval_runtime": 50.348,
28
- "eval_samples_per_second": 596.131,
29
- "eval_steps_per_second": 1.172,
 
 
30
  "step": 20
31
  },
32
  {
@@ -44,10 +48,14 @@
44
  {
45
  "epoch": 0.12,
46
  "eval_accuracy": 0.5033650962883988,
 
 
47
  "eval_loss": 1.0188277959823608,
48
- "eval_runtime": 49.614,
49
- "eval_samples_per_second": 604.95,
50
- "eval_steps_per_second": 1.189,
 
 
51
  "step": 40
52
  },
53
  {
@@ -65,10 +73,14 @@
65
  {
66
  "epoch": 0.18,
67
  "eval_accuracy": 0.5279203038581995,
 
 
68
  "eval_loss": 0.9871189594268799,
69
- "eval_runtime": 49.5201,
70
- "eval_samples_per_second": 606.098,
71
- "eval_steps_per_second": 1.191,
 
 
72
  "step": 60
73
  },
74
  {
@@ -86,10 +98,14 @@
86
  {
87
  "epoch": 0.24,
88
  "eval_accuracy": 0.5308189511561271,
 
 
89
  "eval_loss": 0.9888613224029541,
90
- "eval_runtime": 49.4469,
91
- "eval_samples_per_second": 606.994,
92
- "eval_steps_per_second": 1.193,
 
 
93
  "step": 80
94
  },
95
  {
@@ -107,18 +123,22 @@
107
  {
108
  "epoch": 0.3,
109
  "eval_accuracy": 0.5307856333710935,
 
 
110
  "eval_loss": 0.9762536883354187,
111
- "eval_runtime": 49.4804,
112
- "eval_samples_per_second": 606.583,
113
- "eval_steps_per_second": 1.192,
 
 
114
  "step": 100
115
  }
116
  ],
117
  "logging_steps": 10,
118
- "max_steps": 996,
119
- "num_train_epochs": 3,
120
  "save_steps": 100,
121
- "total_flos": 1.34714065158144e+16,
122
  "trial_name": null,
123
  "trial_params": null
124
  }
 
23
  {
24
  "epoch": 0.06,
25
  "eval_accuracy": 0.44479243019924036,
26
+ "eval_combined_score": 0.3403229798934559,
27
+ "eval_f1": 0.2738667532127967,
28
  "eval_loss": 1.065091609954834,
29
+ "eval_precision": 0.19784030596254612,
30
+ "eval_recall": 0.44479243019924036,
31
+ "eval_runtime": 49.6621,
32
+ "eval_samples_per_second": 604.364,
33
+ "eval_steps_per_second": 1.188,
34
  "step": 20
35
  },
36
  {
 
48
  {
49
  "epoch": 0.12,
50
  "eval_accuracy": 0.5033650962883988,
51
+ "eval_combined_score": 0.4633375988688383,
52
+ "eval_f1": 0.4137746858205889,
53
  "eval_loss": 1.0188277959823608,
54
+ "eval_precision": 0.43284551707796665,
55
+ "eval_recall": 0.5033650962883988,
56
+ "eval_runtime": 49.1985,
57
+ "eval_samples_per_second": 610.06,
58
+ "eval_steps_per_second": 1.199,
59
  "step": 40
60
  },
61
  {
 
73
  {
74
  "epoch": 0.18,
75
  "eval_accuracy": 0.5279203038581995,
76
+ "eval_combined_score": 0.48433586826626607,
77
+ "eval_f1": 0.4596383010419703,
78
  "eval_loss": 0.9871189594268799,
79
+ "eval_precision": 0.421864564306695,
80
+ "eval_recall": 0.5279203038581995,
81
+ "eval_runtime": 49.0237,
82
+ "eval_samples_per_second": 612.235,
83
+ "eval_steps_per_second": 1.204,
84
  "step": 60
85
  },
86
  {
 
98
  {
99
  "epoch": 0.24,
100
  "eval_accuracy": 0.5308189511561271,
101
+ "eval_combined_score": 0.4866197693698143,
102
+ "eval_f1": 0.46528335920671143,
103
  "eval_loss": 0.9888613224029541,
104
+ "eval_precision": 0.4195578159602916,
105
+ "eval_recall": 0.5308189511561271,
106
+ "eval_runtime": 49.518,
107
+ "eval_samples_per_second": 606.124,
108
+ "eval_steps_per_second": 1.191,
109
  "step": 80
110
  },
111
  {
 
123
  {
124
  "epoch": 0.3,
125
  "eval_accuracy": 0.5307856333710935,
126
+ "eval_combined_score": 0.48644275806230897,
127
+ "eval_f1": 0.4666072639999521,
128
  "eval_loss": 0.9762536883354187,
129
+ "eval_precision": 0.4175925015070968,
130
+ "eval_recall": 0.5307856333710935,
131
+ "eval_runtime": 49.4629,
132
+ "eval_samples_per_second": 606.798,
133
+ "eval_steps_per_second": 1.193,
134
  "step": 100
135
  }
136
  ],
137
  "logging_steps": 10,
138
+ "max_steps": 1660,
139
+ "num_train_epochs": 5,
140
  "save_steps": 100,
141
+ "total_flos": 1.34714069876736e+16,
142
  "trial_name": null,
143
  "trial_params": null
144
  }
checkpoint-100/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f1be80ebe52f6e43af0b8aa087e72fad77310d5998b6e0b8f66a6a1d53be7b7
3
  size 4536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae98e7de1b05a570517ae68653e3c31b639a52c739d05197601f467f38b01c66
3
  size 4536