|
{ |
|
"best_metric": 0.24191519618034363, |
|
"best_model_checkpoint": "/workspace/training_output/perspectives-vit-large-patch16-224-in21k-v3/checkpoint-9210", |
|
"epoch": 5.0, |
|
"eval_steps": 500, |
|
"global_step": 15350, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.16, |
|
"learning_rate": 1.93485342019544e-05, |
|
"loss": 0.9017, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"learning_rate": 1.8697068403908796e-05, |
|
"loss": 0.5698, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"learning_rate": 1.8045602605863193e-05, |
|
"loss": 0.4974, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"learning_rate": 1.7394136807817594e-05, |
|
"loss": 0.4646, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.81, |
|
"learning_rate": 1.6742671009771988e-05, |
|
"loss": 0.4538, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"learning_rate": 1.6091205211726385e-05, |
|
"loss": 0.4353, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.8811721273650208, |
|
"eval_loss": 0.33953866362571716, |
|
"eval_runtime": 349.0715, |
|
"eval_samples_per_second": 12.416, |
|
"eval_steps_per_second": 1.553, |
|
"step": 3070 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"learning_rate": 1.5439739413680782e-05, |
|
"loss": 0.3613, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 1.3, |
|
"learning_rate": 1.478827361563518e-05, |
|
"loss": 0.3571, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 1.47, |
|
"learning_rate": 1.4136807817589578e-05, |
|
"loss": 0.3861, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 1.63, |
|
"learning_rate": 1.3485342019543975e-05, |
|
"loss": 0.3657, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 1.79, |
|
"learning_rate": 1.2833876221498372e-05, |
|
"loss": 0.3615, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 1.95, |
|
"learning_rate": 1.2182410423452771e-05, |
|
"loss": 0.3415, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9192431933548685, |
|
"eval_loss": 0.25435712933540344, |
|
"eval_runtime": 357.646, |
|
"eval_samples_per_second": 12.118, |
|
"eval_steps_per_second": 1.515, |
|
"step": 6140 |
|
}, |
|
{ |
|
"epoch": 2.12, |
|
"learning_rate": 1.1530944625407168e-05, |
|
"loss": 0.3178, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 2.28, |
|
"learning_rate": 1.0879478827361565e-05, |
|
"loss": 0.2954, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 2.44, |
|
"learning_rate": 1.0228013029315963e-05, |
|
"loss": 0.3127, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 2.61, |
|
"learning_rate": 9.576547231270358e-06, |
|
"loss": 0.3116, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"learning_rate": 8.925081433224755e-06, |
|
"loss": 0.2747, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 2.93, |
|
"learning_rate": 8.273615635179154e-06, |
|
"loss": 0.2689, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.92455006922012, |
|
"eval_loss": 0.24191519618034363, |
|
"eval_runtime": 319.492, |
|
"eval_samples_per_second": 13.565, |
|
"eval_steps_per_second": 1.696, |
|
"step": 9210 |
|
}, |
|
{ |
|
"epoch": 3.09, |
|
"learning_rate": 7.622149837133551e-06, |
|
"loss": 0.2727, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 3.26, |
|
"learning_rate": 6.9706840390879485e-06, |
|
"loss": 0.2362, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 3.42, |
|
"learning_rate": 6.319218241042345e-06, |
|
"loss": 0.2617, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 3.58, |
|
"learning_rate": 5.667752442996744e-06, |
|
"loss": 0.2437, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 3.75, |
|
"learning_rate": 5.016286644951141e-06, |
|
"loss": 0.2494, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 3.91, |
|
"learning_rate": 4.364820846905538e-06, |
|
"loss": 0.2525, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9192431933548685, |
|
"eval_loss": 0.29525890946388245, |
|
"eval_runtime": 322.9797, |
|
"eval_samples_per_second": 13.419, |
|
"eval_steps_per_second": 1.678, |
|
"step": 12280 |
|
}, |
|
{ |
|
"epoch": 4.07, |
|
"learning_rate": 3.7133550488599353e-06, |
|
"loss": 0.2265, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 4.23, |
|
"learning_rate": 3.061889250814333e-06, |
|
"loss": 0.204, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 4.4, |
|
"learning_rate": 2.4104234527687296e-06, |
|
"loss": 0.2261, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 4.56, |
|
"learning_rate": 1.7589576547231272e-06, |
|
"loss": 0.2152, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 4.72, |
|
"learning_rate": 1.1074918566775244e-06, |
|
"loss": 0.1766, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 4.89, |
|
"learning_rate": 4.5602605863192187e-07, |
|
"loss": 0.1977, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9356252884171666, |
|
"eval_loss": 0.24443966150283813, |
|
"eval_runtime": 321.057, |
|
"eval_samples_per_second": 13.499, |
|
"eval_steps_per_second": 1.688, |
|
"step": 15350 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"step": 15350, |
|
"total_flos": 3.363363283622308e+19, |
|
"train_loss": 0.3319820684874097, |
|
"train_runtime": 13677.2564, |
|
"train_samples_per_second": 8.977, |
|
"train_steps_per_second": 1.122 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 15350, |
|
"num_train_epochs": 5, |
|
"save_steps": 500, |
|
"total_flos": 3.363363283622308e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|