itsLeen committed on
Commit
bf159ac
·
verified ·
1 Parent(s): 0c452e2

itsLeen/vit-large-ai-or-not

Browse files
README.md CHANGED
@@ -18,8 +18,8 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [google/vit-large-patch16-224](https://huggingface.co/google/vit-large-patch16-224) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.1124
22
- - Accuracy: 0.9635
23
 
24
  ## Model description
25
 
 
18
 
19
  This model is a fine-tuned version of [google/vit-large-patch16-224](https://huggingface.co/google/vit-large-patch16-224) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.1039
22
+ - Accuracy: 0.9581
23
 
24
  ## Model description
25
 
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 2.0,
3
+ "total_flos": 9.690147678529511e+18,
4
+ "train_loss": 0.16445749211268226,
5
+ "train_runtime": 2512.7977,
6
+ "train_samples_per_second": 14.078,
7
+ "train_steps_per_second": 0.88
8
+ }
runs/Oct22_19-27-07_a63007bb5933/events.out.tfevents.1729628208.a63007bb5933.577.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21e9e2aba44969d6bfb3e6e9a987c4ee5c4d60d5ce61c04b8e9d58c83952dab6
3
+ size 411
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 2.0,
3
+ "total_flos": 9.690147678529511e+18,
4
+ "train_loss": 0.16445749211268226,
5
+ "train_runtime": 2512.7977,
6
+ "train_samples_per_second": 14.078,
7
+ "train_steps_per_second": 0.88
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,218 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.10391458868980408,
3
+ "best_model_checkpoint": "vit-large-ai-or-not/checkpoint-2000",
4
+ "epoch": 2.0,
5
+ "eval_steps": 200,
6
+ "global_step": 2212,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.18083182640144665,
13
+ "grad_norm": 1.507786750793457,
14
+ "learning_rate": 0.00018191681735985535,
15
+ "loss": 0.3925,
16
+ "step": 200
17
+ },
18
+ {
19
+ "epoch": 0.18083182640144665,
20
+ "eval_accuracy": 0.878625134264232,
21
+ "eval_loss": 0.40452271699905396,
22
+ "eval_runtime": 14.0535,
23
+ "eval_samples_per_second": 66.247,
24
+ "eval_steps_per_second": 8.325,
25
+ "step": 200
26
+ },
27
+ {
28
+ "epoch": 0.3616636528028933,
29
+ "grad_norm": 3.166074514389038,
30
+ "learning_rate": 0.00016383363471971068,
31
+ "loss": 0.2803,
32
+ "step": 400
33
+ },
34
+ {
35
+ "epoch": 0.3616636528028933,
36
+ "eval_accuracy": 0.9044038668098818,
37
+ "eval_loss": 0.2385927140712738,
38
+ "eval_runtime": 13.6284,
39
+ "eval_samples_per_second": 68.313,
40
+ "eval_steps_per_second": 8.585,
41
+ "step": 400
42
+ },
43
+ {
44
+ "epoch": 0.5424954792043399,
45
+ "grad_norm": 3.2524709701538086,
46
+ "learning_rate": 0.00014575045207956602,
47
+ "loss": 0.2235,
48
+ "step": 600
49
+ },
50
+ {
51
+ "epoch": 0.5424954792043399,
52
+ "eval_accuracy": 0.9172932330827067,
53
+ "eval_loss": 0.1893242746591568,
54
+ "eval_runtime": 13.8787,
55
+ "eval_samples_per_second": 67.081,
56
+ "eval_steps_per_second": 8.43,
57
+ "step": 600
58
+ },
59
+ {
60
+ "epoch": 0.7233273056057866,
61
+ "grad_norm": 0.6501625776290894,
62
+ "learning_rate": 0.00012766726943942136,
63
+ "loss": 0.217,
64
+ "step": 800
65
+ },
66
+ {
67
+ "epoch": 0.7233273056057866,
68
+ "eval_accuracy": 0.9398496240601504,
69
+ "eval_loss": 0.15967358648777008,
70
+ "eval_runtime": 15.6768,
71
+ "eval_samples_per_second": 59.387,
72
+ "eval_steps_per_second": 7.463,
73
+ "step": 800
74
+ },
75
+ {
76
+ "epoch": 0.9041591320072333,
77
+ "grad_norm": 0.8514215350151062,
78
+ "learning_rate": 0.00010958408679927667,
79
+ "loss": 0.1865,
80
+ "step": 1000
81
+ },
82
+ {
83
+ "epoch": 0.9041591320072333,
84
+ "eval_accuracy": 0.9419978517722879,
85
+ "eval_loss": 0.14128026366233826,
86
+ "eval_runtime": 14.4065,
87
+ "eval_samples_per_second": 64.624,
88
+ "eval_steps_per_second": 8.121,
89
+ "step": 1000
90
+ },
91
+ {
92
+ "epoch": 1.0849909584086799,
93
+ "grad_norm": 0.2293129414319992,
94
+ "learning_rate": 9.150090415913202e-05,
95
+ "loss": 0.1309,
96
+ "step": 1200
97
+ },
98
+ {
99
+ "epoch": 1.0849909584086799,
100
+ "eval_accuracy": 0.9516648764769066,
101
+ "eval_loss": 0.1473875343799591,
102
+ "eval_runtime": 14.0786,
103
+ "eval_samples_per_second": 66.129,
104
+ "eval_steps_per_second": 8.31,
105
+ "step": 1200
106
+ },
107
+ {
108
+ "epoch": 1.2658227848101267,
109
+ "grad_norm": 4.756102561950684,
110
+ "learning_rate": 7.341772151898734e-05,
111
+ "loss": 0.1008,
112
+ "step": 1400
113
+ },
114
+ {
115
+ "epoch": 1.2658227848101267,
116
+ "eval_accuracy": 0.9419978517722879,
117
+ "eval_loss": 0.19141799211502075,
118
+ "eval_runtime": 13.9995,
119
+ "eval_samples_per_second": 66.502,
120
+ "eval_steps_per_second": 8.357,
121
+ "step": 1400
122
+ },
123
+ {
124
+ "epoch": 1.4466546112115732,
125
+ "grad_norm": 0.034902941435575485,
126
+ "learning_rate": 5.533453887884268e-05,
127
+ "loss": 0.0793,
128
+ "step": 1600
129
+ },
130
+ {
131
+ "epoch": 1.4466546112115732,
132
+ "eval_accuracy": 0.9441460794844253,
133
+ "eval_loss": 0.15568311512470245,
134
+ "eval_runtime": 14.1017,
135
+ "eval_samples_per_second": 66.021,
136
+ "eval_steps_per_second": 8.297,
137
+ "step": 1600
138
+ },
139
+ {
140
+ "epoch": 1.6274864376130198,
141
+ "grad_norm": 1.2290639877319336,
142
+ "learning_rate": 3.725135623869802e-05,
143
+ "loss": 0.0804,
144
+ "step": 1800
145
+ },
146
+ {
147
+ "epoch": 1.6274864376130198,
148
+ "eval_accuracy": 0.9312567132116004,
149
+ "eval_loss": 0.23011024296283722,
150
+ "eval_runtime": 13.8445,
151
+ "eval_samples_per_second": 67.247,
152
+ "eval_steps_per_second": 8.451,
153
+ "step": 1800
154
+ },
155
+ {
156
+ "epoch": 1.8083182640144666,
157
+ "grad_norm": 0.08316856622695923,
158
+ "learning_rate": 1.9168173598553345e-05,
159
+ "loss": 0.0814,
160
+ "step": 2000
161
+ },
162
+ {
163
+ "epoch": 1.8083182640144666,
164
+ "eval_accuracy": 0.958109559613319,
165
+ "eval_loss": 0.10391458868980408,
166
+ "eval_runtime": 14.1201,
167
+ "eval_samples_per_second": 65.935,
168
+ "eval_steps_per_second": 8.286,
169
+ "step": 2000
170
+ },
171
+ {
172
+ "epoch": 1.9891500904159132,
173
+ "grad_norm": 0.11144193261861801,
174
+ "learning_rate": 1.08499095840868e-06,
175
+ "loss": 0.0446,
176
+ "step": 2200
177
+ },
178
+ {
179
+ "epoch": 1.9891500904159132,
180
+ "eval_accuracy": 0.9634801288936627,
181
+ "eval_loss": 0.1123916506767273,
182
+ "eval_runtime": 14.6416,
183
+ "eval_samples_per_second": 63.586,
184
+ "eval_steps_per_second": 7.991,
185
+ "step": 2200
186
+ },
187
+ {
188
+ "epoch": 2.0,
189
+ "step": 2212,
190
+ "total_flos": 9.690147678529511e+18,
191
+ "train_loss": 0.16445749211268226,
192
+ "train_runtime": 2512.7977,
193
+ "train_samples_per_second": 14.078,
194
+ "train_steps_per_second": 0.88
195
+ }
196
+ ],
197
+ "logging_steps": 200,
198
+ "max_steps": 2212,
199
+ "num_input_tokens_seen": 0,
200
+ "num_train_epochs": 2,
201
+ "save_steps": 200,
202
+ "stateful_callbacks": {
203
+ "TrainerControl": {
204
+ "args": {
205
+ "should_epoch_stop": false,
206
+ "should_evaluate": false,
207
+ "should_log": false,
208
+ "should_save": true,
209
+ "should_training_stop": true
210
+ },
211
+ "attributes": {}
212
+ }
213
+ },
214
+ "total_flos": 9.690147678529511e+18,
215
+ "train_batch_size": 16,
216
+ "trial_name": null,
217
+ "trial_params": null
218
+ }