|
{ |
|
"best_metric": 0.981159271079996, |
|
"best_model_checkpoint": "./output//42_roberta-large_nace_5__5e-6_0.01_0.06_07-21-22_10-40/checkpoint-12000", |
|
"epoch": 4.418262150220913, |
|
"global_step": 12000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.74, |
|
"learning_rate": 4.535840188014101e-06, |
|
"loss": 0.1726, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_accuracy": 0.9712155725823152, |
|
"eval_f1": 0.9751469526657729, |
|
"eval_loss": 0.08084136247634888, |
|
"eval_roc_auc": 0.9750559610355007, |
|
"eval_runtime": 143.2301, |
|
"eval_samples_per_second": 33.715, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 1.47, |
|
"learning_rate": 3.7524481002741874e-06, |
|
"loss": 0.0668, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 1.47, |
|
"eval_accuracy": 0.9726651480637813, |
|
"eval_f1": 0.9771228359439407, |
|
"eval_loss": 0.08218056708574295, |
|
"eval_roc_auc": 0.9770191055094254, |
|
"eval_runtime": 143.2878, |
|
"eval_samples_per_second": 33.701, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 2.21, |
|
"learning_rate": 2.969056012534274e-06, |
|
"loss": 0.0501, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 2.21, |
|
"eval_accuracy": 0.9749430523917996, |
|
"eval_f1": 0.9794069192751236, |
|
"eval_loss": 0.07129524648189545, |
|
"eval_roc_auc": 0.9792922833616305, |
|
"eval_runtime": 143.1874, |
|
"eval_samples_per_second": 33.725, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 2.95, |
|
"learning_rate": 2.18566392479436e-06, |
|
"loss": 0.0377, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 2.95, |
|
"eval_accuracy": 0.9757713812383516, |
|
"eval_f1": 0.9797813080255828, |
|
"eval_loss": 0.08654613047838211, |
|
"eval_roc_auc": 0.9797172685997191, |
|
"eval_runtime": 143.3834, |
|
"eval_samples_per_second": 33.679, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 3.68, |
|
"learning_rate": 1.4022718370544457e-06, |
|
"loss": 0.0254, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 3.68, |
|
"eval_accuracy": 0.9743218057568854, |
|
"eval_f1": 0.9794111591517397, |
|
"eval_loss": 0.09397488832473755, |
|
"eval_roc_auc": 0.979291082596074, |
|
"eval_runtime": 143.2996, |
|
"eval_samples_per_second": 33.699, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 4.42, |
|
"learning_rate": 6.18879749314532e-07, |
|
"loss": 0.0196, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 4.42, |
|
"eval_accuracy": 0.9763926278732656, |
|
"eval_f1": 0.981159271079996, |
|
"eval_loss": 0.09825791418552399, |
|
"eval_roc_auc": 0.981051940958186, |
|
"eval_runtime": 143.2702, |
|
"eval_samples_per_second": 33.706, |
|
"step": 12000 |
|
} |
|
], |
|
"max_steps": 13580, |
|
"num_train_epochs": 5, |
|
"total_flos": 6.9866971594752e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|