polejowska
commited on
Commit
•
d4be0bc
1
Parent(s):
cd66a5f
End of training
Browse files- trainer_state.json +90 -20
trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"best_metric": 1.
|
3 |
-
"best_model_checkpoint": "detr-r50-cd45rb-8ah-6l-gelu-corrected\\checkpoint-
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -275,31 +275,101 @@
|
|
275 |
},
|
276 |
{
|
277 |
"epoch": 20.0,
|
278 |
-
"learning_rate":
|
279 |
-
"loss": 2.
|
280 |
"step": 92120
|
281 |
},
|
282 |
{
|
283 |
"epoch": 20.0,
|
284 |
-
"eval_loss": 1.
|
285 |
-
"eval_runtime":
|
286 |
-
"eval_samples_per_second": 8.
|
287 |
-
"eval_steps_per_second": 1.
|
288 |
"step": 92120
|
289 |
},
|
290 |
{
|
291 |
-
"epoch":
|
292 |
-
"
|
293 |
-
"
|
294 |
-
"
|
295 |
-
|
296 |
-
|
297 |
-
"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
298 |
}
|
299 |
],
|
300 |
-
"max_steps":
|
301 |
-
"num_train_epochs":
|
302 |
-
"total_flos":
|
303 |
"trial_name": null,
|
304 |
"trial_params": null
|
305 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 1.5861479043960571,
|
3 |
+
"best_model_checkpoint": "detr-r50-cd45rb-8ah-6l-gelu-corrected\\checkpoint-115150",
|
4 |
+
"epoch": 25.0,
|
5 |
+
"global_step": 115150,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
275 |
},
|
276 |
{
|
277 |
"epoch": 20.0,
|
278 |
+
"learning_rate": 2.0037342596613115e-06,
|
279 |
+
"loss": 2.0206,
|
280 |
"step": 92120
|
281 |
},
|
282 |
{
|
283 |
"epoch": 20.0,
|
284 |
+
"eval_loss": 1.6168476343154907,
|
285 |
+
"eval_runtime": 207.1893,
|
286 |
+
"eval_samples_per_second": 8.596,
|
287 |
+
"eval_steps_per_second": 1.076,
|
288 |
"step": 92120
|
289 |
},
|
290 |
{
|
291 |
+
"epoch": 21.0,
|
292 |
+
"learning_rate": 1.6039947894051239e-06,
|
293 |
+
"loss": 2.026,
|
294 |
+
"step": 96726
|
295 |
+
},
|
296 |
+
{
|
297 |
+
"epoch": 21.0,
|
298 |
+
"eval_loss": 1.6022319793701172,
|
299 |
+
"eval_runtime": 206.9802,
|
300 |
+
"eval_samples_per_second": 8.605,
|
301 |
+
"eval_steps_per_second": 1.077,
|
302 |
+
"step": 96726
|
303 |
+
},
|
304 |
+
{
|
305 |
+
"epoch": 22.0,
|
306 |
+
"learning_rate": 1.2041684759009988e-06,
|
307 |
+
"loss": 2.0109,
|
308 |
+
"step": 101332
|
309 |
+
},
|
310 |
+
{
|
311 |
+
"epoch": 22.0,
|
312 |
+
"eval_loss": 1.5995537042617798,
|
313 |
+
"eval_runtime": 206.8836,
|
314 |
+
"eval_samples_per_second": 8.609,
|
315 |
+
"eval_steps_per_second": 1.078,
|
316 |
+
"step": 101332
|
317 |
+
},
|
318 |
+
{
|
319 |
+
"epoch": 23.0,
|
320 |
+
"learning_rate": 8.042553191489362e-07,
|
321 |
+
"loss": 2.0133,
|
322 |
+
"step": 105938
|
323 |
+
},
|
324 |
+
{
|
325 |
+
"epoch": 23.0,
|
326 |
+
"eval_loss": 1.5983381271362305,
|
327 |
+
"eval_runtime": 206.4758,
|
328 |
+
"eval_samples_per_second": 8.626,
|
329 |
+
"eval_steps_per_second": 1.08,
|
330 |
+
"step": 105938
|
331 |
+
},
|
332 |
+
{
|
333 |
+
"epoch": 24.0,
|
334 |
+
"learning_rate": 4.043421623968737e-07,
|
335 |
+
"loss": 2.0081,
|
336 |
+
"step": 110544
|
337 |
+
},
|
338 |
+
{
|
339 |
+
"epoch": 24.0,
|
340 |
+
"eval_loss": 1.5887646675109863,
|
341 |
+
"eval_runtime": 203.9191,
|
342 |
+
"eval_samples_per_second": 8.734,
|
343 |
+
"eval_steps_per_second": 1.094,
|
344 |
+
"step": 110544
|
345 |
+
},
|
346 |
+
{
|
347 |
+
"epoch": 25.0,
|
348 |
+
"learning_rate": 4.515848892748589e-09,
|
349 |
+
"loss": 1.9975,
|
350 |
+
"step": 115150
|
351 |
+
},
|
352 |
+
{
|
353 |
+
"epoch": 25.0,
|
354 |
+
"eval_loss": 1.5861479043960571,
|
355 |
+
"eval_runtime": 204.8681,
|
356 |
+
"eval_samples_per_second": 8.693,
|
357 |
+
"eval_steps_per_second": 1.089,
|
358 |
+
"step": 115150
|
359 |
+
},
|
360 |
+
{
|
361 |
+
"epoch": 25.0,
|
362 |
+
"step": 115150,
|
363 |
+
"total_flos": 2.2008141195206407e+20,
|
364 |
+
"train_loss": 0.4830571452317629,
|
365 |
+
"train_runtime": 17891.958,
|
366 |
+
"train_samples_per_second": 25.739,
|
367 |
+
"train_steps_per_second": 6.436
|
368 |
}
|
369 |
],
|
370 |
+
"max_steps": 115150,
|
371 |
+
"num_train_epochs": 25,
|
372 |
+
"total_flos": 2.2008141195206407e+20,
|
373 |
"trial_name": null,
|
374 |
"trial_params": null
|
375 |
}
|