|
{ |
|
"best_metric": 1.2710014581680298, |
|
"best_model_checkpoint": "/content/pubmedbert-fulltext-cord19/checkpoint-5000", |
|
"epoch": 3.0, |
|
"global_step": 56250, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.27, |
|
"learning_rate": 2.4970000000000003e-05, |
|
"loss": 1.7985, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_accuracy": 0.7176016320015706, |
|
"eval_loss": 1.2710014581680298, |
|
"eval_runtime": 289.9232, |
|
"eval_samples_per_second": 86.23, |
|
"eval_steps_per_second": 5.391, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.53, |
|
"learning_rate": 4.9965e-05, |
|
"loss": 1.7542, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 0.53, |
|
"eval_accuracy": 0.7069832712721614, |
|
"eval_loss": 1.3359251022338867, |
|
"eval_runtime": 290.2058, |
|
"eval_samples_per_second": 86.146, |
|
"eval_steps_per_second": 5.386, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"learning_rate": 4.460432432432432e-05, |
|
"loss": 1.7462, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_accuracy": 0.7034289815931059, |
|
"eval_loss": 1.3488777875900269, |
|
"eval_runtime": 290.0812, |
|
"eval_samples_per_second": 86.183, |
|
"eval_steps_per_second": 5.388, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 1.07, |
|
"learning_rate": 3.9202162162162166e-05, |
|
"loss": 1.8371, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 1.07, |
|
"eval_accuracy": 0.6891450706903661, |
|
"eval_loss": 1.436103105545044, |
|
"eval_runtime": 289.9321, |
|
"eval_samples_per_second": 86.227, |
|
"eval_steps_per_second": 5.391, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 1.33, |
|
"learning_rate": 3.379675675675676e-05, |
|
"loss": 1.7102, |
|
"step": 25000 |
|
}, |
|
{ |
|
"epoch": 1.33, |
|
"eval_accuracy": 0.7039453286069087, |
|
"eval_loss": 1.3501886129379272, |
|
"eval_runtime": 289.995, |
|
"eval_samples_per_second": 86.208, |
|
"eval_steps_per_second": 5.39, |
|
"step": 25000 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"learning_rate": 2.8393513513513515e-05, |
|
"loss": 1.6596, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"eval_accuracy": 0.70652987764824, |
|
"eval_loss": 1.334069013595581, |
|
"eval_runtime": 290.2224, |
|
"eval_samples_per_second": 86.141, |
|
"eval_steps_per_second": 5.386, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 1.87, |
|
"learning_rate": 2.2990270270270274e-05, |
|
"loss": 1.6265, |
|
"step": 35000 |
|
}, |
|
{ |
|
"epoch": 1.87, |
|
"eval_accuracy": 0.708723656830319, |
|
"eval_loss": 1.322791576385498, |
|
"eval_runtime": 291.0022, |
|
"eval_samples_per_second": 85.91, |
|
"eval_steps_per_second": 5.371, |
|
"step": 35000 |
|
}, |
|
{ |
|
"epoch": 2.13, |
|
"learning_rate": 1.7584864864864868e-05, |
|
"loss": 1.605, |
|
"step": 40000 |
|
}, |
|
{ |
|
"epoch": 2.13, |
|
"eval_accuracy": 0.7099296658889697, |
|
"eval_loss": 1.307939052581787, |
|
"eval_runtime": 290.1974, |
|
"eval_samples_per_second": 86.148, |
|
"eval_steps_per_second": 5.386, |
|
"step": 40000 |
|
}, |
|
{ |
|
"epoch": 2.4, |
|
"learning_rate": 1.2181621621621623e-05, |
|
"loss": 1.5731, |
|
"step": 45000 |
|
}, |
|
{ |
|
"epoch": 2.4, |
|
"eval_accuracy": 0.7121370440536863, |
|
"eval_loss": 1.2985501289367676, |
|
"eval_runtime": 290.9835, |
|
"eval_samples_per_second": 85.916, |
|
"eval_steps_per_second": 5.371, |
|
"step": 45000 |
|
}, |
|
{ |
|
"epoch": 2.67, |
|
"learning_rate": 6.778378378378379e-06, |
|
"loss": 1.5602, |
|
"step": 50000 |
|
}, |
|
{ |
|
"epoch": 2.67, |
|
"eval_accuracy": 0.7135782251340592, |
|
"eval_loss": 1.2928680181503296, |
|
"eval_runtime": 290.2984, |
|
"eval_samples_per_second": 86.118, |
|
"eval_steps_per_second": 5.384, |
|
"step": 50000 |
|
}, |
|
{ |
|
"epoch": 2.93, |
|
"learning_rate": 1.3762162162162162e-06, |
|
"loss": 1.5447, |
|
"step": 55000 |
|
}, |
|
{ |
|
"epoch": 2.93, |
|
"eval_accuracy": 0.7142735090199965, |
|
"eval_loss": 1.2874841690063477, |
|
"eval_runtime": 290.4326, |
|
"eval_samples_per_second": 86.078, |
|
"eval_steps_per_second": 5.382, |
|
"step": 55000 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"step": 56250, |
|
"total_flos": 1.156661775e+17, |
|
"train_loss": 1.6709515473090277, |
|
"train_runtime": 32029.5992, |
|
"train_samples_per_second": 28.099, |
|
"train_steps_per_second": 1.756 |
|
} |
|
], |
|
"max_steps": 56250, |
|
"num_train_epochs": 3, |
|
"total_flos": 1.156661775e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|