jayanthspratap committed on
Commit
ee25917
1 Parent(s): b4f0906

End of training

Browse files
README.md CHANGED
@@ -32,7 +32,7 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [microsoft/resnet-50](https://huggingface.co/microsoft/resnet-50) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.6800
36
  - Accuracy: 0.9310
37
 
38
  ## Model description
 
32
 
33
  This model is a fine-tuned version of [microsoft/resnet-50](https://huggingface.co/microsoft/resnet-50) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.6922
36
  - Accuracy: 0.9310
37
 
38
  ## Model description
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.655172413793103,
3
+ "eval_accuracy": 0.9310344827586207,
4
+ "eval_loss": 0.6921818852424622,
5
+ "eval_runtime": 0.1602,
6
+ "eval_samples_per_second": 181.05,
7
+ "eval_steps_per_second": 49.945,
8
+ "total_flos": 2.321029594662912e+16,
9
+ "train_loss": 0.6887211867741176,
10
+ "train_runtime": 19.8811,
11
+ "train_samples_per_second": 56.838,
12
+ "train_steps_per_second": 3.521
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.655172413793103,
3
+ "eval_accuracy": 0.9310344827586207,
4
+ "eval_loss": 0.6921818852424622,
5
+ "eval_runtime": 0.1602,
6
+ "eval_samples_per_second": 181.05,
7
+ "eval_steps_per_second": 49.945
8
+ }
runs/Aug12_22-57-31_EMIMDGXA100GPU1/events.out.tfevents.1723517875.EMIMDGXA100GPU1.76048.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99229167e41d39d56d3b61b3af676ede75ecb5f9afafca9b7bd1ac9ae620110c
3
+ size 405
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.655172413793103,
3
+ "total_flos": 2.321029594662912e+16,
4
+ "train_loss": 0.6887211867741176,
5
+ "train_runtime": 19.8811,
6
+ "train_samples_per_second": 56.838,
7
+ "train_steps_per_second": 3.521
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,181 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9310344827586207,
3
+ "best_model_checkpoint": "resnet-50/checkpoint-7",
4
+ "epoch": 9.655172413793103,
5
+ "eval_steps": 500,
6
+ "global_step": 70,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.9655172413793104,
13
+ "eval_accuracy": 0.9310344827586207,
14
+ "eval_loss": 0.6921818852424622,
15
+ "eval_runtime": 0.1674,
16
+ "eval_samples_per_second": 173.228,
17
+ "eval_steps_per_second": 47.787,
18
+ "step": 7
19
+ },
20
+ {
21
+ "epoch": 1.3793103448275863,
22
+ "grad_norm": 2.6714026927948,
23
+ "learning_rate": 4.761904761904762e-06,
24
+ "loss": 0.6927,
25
+ "step": 10
26
+ },
27
+ {
28
+ "epoch": 1.9310344827586206,
29
+ "eval_accuracy": 0.9310344827586207,
30
+ "eval_loss": 0.6895474791526794,
31
+ "eval_runtime": 0.1422,
32
+ "eval_samples_per_second": 203.982,
33
+ "eval_steps_per_second": 56.271,
34
+ "step": 14
35
+ },
36
+ {
37
+ "epoch": 2.7586206896551726,
38
+ "grad_norm": 1.4340662956237793,
39
+ "learning_rate": 3.968253968253968e-06,
40
+ "loss": 0.6916,
41
+ "step": 20
42
+ },
43
+ {
44
+ "epoch": 2.896551724137931,
45
+ "eval_accuracy": 0.9310344827586207,
46
+ "eval_loss": 0.6877713203430176,
47
+ "eval_runtime": 0.1339,
48
+ "eval_samples_per_second": 216.634,
49
+ "eval_steps_per_second": 59.761,
50
+ "step": 21
51
+ },
52
+ {
53
+ "epoch": 4.0,
54
+ "eval_accuracy": 0.9310344827586207,
55
+ "eval_loss": 0.6853156089782715,
56
+ "eval_runtime": 0.15,
57
+ "eval_samples_per_second": 193.285,
58
+ "eval_steps_per_second": 53.32,
59
+ "step": 29
60
+ },
61
+ {
62
+ "epoch": 4.137931034482759,
63
+ "grad_norm": 0.846211314201355,
64
+ "learning_rate": 3.1746031746031746e-06,
65
+ "loss": 0.6899,
66
+ "step": 30
67
+ },
68
+ {
69
+ "epoch": 4.9655172413793105,
70
+ "eval_accuracy": 0.9310344827586207,
71
+ "eval_loss": 0.6838722825050354,
72
+ "eval_runtime": 0.1539,
73
+ "eval_samples_per_second": 188.443,
74
+ "eval_steps_per_second": 51.984,
75
+ "step": 36
76
+ },
77
+ {
78
+ "epoch": 5.517241379310345,
79
+ "grad_norm": 0.7562207579612732,
80
+ "learning_rate": 2.380952380952381e-06,
81
+ "loss": 0.6878,
82
+ "step": 40
83
+ },
84
+ {
85
+ "epoch": 5.931034482758621,
86
+ "eval_accuracy": 0.9310344827586207,
87
+ "eval_loss": 0.6810795068740845,
88
+ "eval_runtime": 0.1817,
89
+ "eval_samples_per_second": 159.574,
90
+ "eval_steps_per_second": 44.02,
91
+ "step": 43
92
+ },
93
+ {
94
+ "epoch": 6.896551724137931,
95
+ "grad_norm": 1.3402385711669922,
96
+ "learning_rate": 1.5873015873015873e-06,
97
+ "loss": 0.6868,
98
+ "step": 50
99
+ },
100
+ {
101
+ "epoch": 6.896551724137931,
102
+ "eval_accuracy": 0.9310344827586207,
103
+ "eval_loss": 0.6826210618019104,
104
+ "eval_runtime": 0.1474,
105
+ "eval_samples_per_second": 196.8,
106
+ "eval_steps_per_second": 54.29,
107
+ "step": 50
108
+ },
109
+ {
110
+ "epoch": 8.0,
111
+ "eval_accuracy": 0.9310344827586207,
112
+ "eval_loss": 0.6804185509681702,
113
+ "eval_runtime": 0.1782,
114
+ "eval_samples_per_second": 162.726,
115
+ "eval_steps_per_second": 44.89,
116
+ "step": 58
117
+ },
118
+ {
119
+ "epoch": 8.275862068965518,
120
+ "grad_norm": 1.5807445049285889,
121
+ "learning_rate": 7.936507936507937e-07,
122
+ "loss": 0.6864,
123
+ "step": 60
124
+ },
125
+ {
126
+ "epoch": 8.96551724137931,
127
+ "eval_accuracy": 0.9310344827586207,
128
+ "eval_loss": 0.6801003217697144,
129
+ "eval_runtime": 0.1994,
130
+ "eval_samples_per_second": 145.402,
131
+ "eval_steps_per_second": 40.111,
132
+ "step": 65
133
+ },
134
+ {
135
+ "epoch": 9.655172413793103,
136
+ "grad_norm": 0.9159764051437378,
137
+ "learning_rate": 0.0,
138
+ "loss": 0.686,
139
+ "step": 70
140
+ },
141
+ {
142
+ "epoch": 9.655172413793103,
143
+ "eval_accuracy": 0.9310344827586207,
144
+ "eval_loss": 0.6800179481506348,
145
+ "eval_runtime": 0.1551,
146
+ "eval_samples_per_second": 186.997,
147
+ "eval_steps_per_second": 51.585,
148
+ "step": 70
149
+ },
150
+ {
151
+ "epoch": 9.655172413793103,
152
+ "step": 70,
153
+ "total_flos": 2.321029594662912e+16,
154
+ "train_loss": 0.6887211867741176,
155
+ "train_runtime": 19.8811,
156
+ "train_samples_per_second": 56.838,
157
+ "train_steps_per_second": 3.521
158
+ }
159
+ ],
160
+ "logging_steps": 10,
161
+ "max_steps": 70,
162
+ "num_input_tokens_seen": 0,
163
+ "num_train_epochs": 10,
164
+ "save_steps": 500,
165
+ "stateful_callbacks": {
166
+ "TrainerControl": {
167
+ "args": {
168
+ "should_epoch_stop": false,
169
+ "should_evaluate": false,
170
+ "should_log": false,
171
+ "should_save": true,
172
+ "should_training_stop": true
173
+ },
174
+ "attributes": {}
175
+ }
176
+ },
177
+ "total_flos": 2.321029594662912e+16,
178
+ "train_batch_size": 4,
179
+ "trial_name": null,
180
+ "trial_params": null
181
+ }