|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 10.0, |
|
"global_step": 1100, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 9e-05, |
|
"loss": 0.2594, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.951993141877411, |
|
"eval_f1": 0.9531642040702537, |
|
"eval_loss": 0.14524979889392853, |
|
"eval_precision": 0.9671852899575671, |
|
"eval_recall": 0.9395438307227261, |
|
"eval_roc_auc": 0.9525100105994584, |
|
"eval_runtime": 4.6691, |
|
"eval_samples_per_second": 1498.989, |
|
"eval_steps_per_second": 5.997, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 8e-05, |
|
"loss": 0.0966, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9644234890698671, |
|
"eval_f1": 0.9655839668279198, |
|
"eval_loss": 0.1103191077709198, |
|
"eval_precision": 0.971357063403782, |
|
"eval_recall": 0.9598790876614455, |
|
"eval_roc_auc": 0.9646121628783418, |
|
"eval_runtime": 4.725, |
|
"eval_samples_per_second": 1481.272, |
|
"eval_steps_per_second": 5.926, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 7e-05, |
|
"loss": 0.0499, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9639948564080583, |
|
"eval_f1": 0.9652796913750344, |
|
"eval_loss": 0.11932428181171417, |
|
"eval_precision": 0.967946946670351, |
|
"eval_recall": 0.962627095355867, |
|
"eval_roc_auc": 0.9640516429160287, |
|
"eval_runtime": 4.7987, |
|
"eval_samples_per_second": 1458.529, |
|
"eval_steps_per_second": 5.835, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 6e-05, |
|
"loss": 0.0251, |
|
"step": 440 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.962280325760823, |
|
"eval_f1": 0.9639639639639641, |
|
"eval_loss": 0.12893760204315186, |
|
"eval_precision": 0.9576891781936534, |
|
"eval_recall": 0.9703215169002474, |
|
"eval_roc_auc": 0.9619464727358379, |
|
"eval_runtime": 4.816, |
|
"eval_samples_per_second": 1453.283, |
|
"eval_steps_per_second": 5.814, |
|
"step": 440 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 5e-05, |
|
"loss": 0.0132, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9659951421631662, |
|
"eval_f1": 0.9673435784851812, |
|
"eval_loss": 0.1495329588651657, |
|
"eval_precision": 0.9660180871471636, |
|
"eval_recall": 0.9686727122835944, |
|
"eval_roc_auc": 0.9658839751894163, |
|
"eval_runtime": 4.8435, |
|
"eval_samples_per_second": 1445.041, |
|
"eval_steps_per_second": 5.781, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 4e-05, |
|
"loss": 0.0086, |
|
"step": 660 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.9684240605800829, |
|
"eval_f1": 0.9692071896335517, |
|
"eval_loss": 0.1759045422077179, |
|
"eval_precision": 0.9830412662521198, |
|
"eval_recall": 0.9557570761198131, |
|
"eval_roc_auc": 0.968949966631335, |
|
"eval_runtime": 4.8741, |
|
"eval_samples_per_second": 1435.957, |
|
"eval_steps_per_second": 5.745, |
|
"step": 660 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0054, |
|
"step": 770 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.9699957136733819, |
|
"eval_f1": 0.9709141274238227, |
|
"eval_loss": 0.15680807828903198, |
|
"eval_precision": 0.9787768779670483, |
|
"eval_recall": 0.9631766968947513, |
|
"eval_roc_auc": 0.9702788246378518, |
|
"eval_runtime": 4.886, |
|
"eval_samples_per_second": 1432.464, |
|
"eval_steps_per_second": 5.731, |
|
"step": 770 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0023, |
|
"step": 880 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9707101014430632, |
|
"eval_f1": 0.9717280375120674, |
|
"eval_loss": 0.17754127085208893, |
|
"eval_precision": 0.9753599114064231, |
|
"eval_recall": 0.9681231107447101, |
|
"eval_roc_auc": 0.9708175077533074, |
|
"eval_runtime": 4.8851, |
|
"eval_samples_per_second": 1432.728, |
|
"eval_steps_per_second": 5.732, |
|
"step": 880 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0023, |
|
"step": 990 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.9709958565509359, |
|
"eval_f1": 0.9718953343486086, |
|
"eval_loss": 0.17516092956066132, |
|
"eval_precision": 0.9793526785714286, |
|
"eval_recall": 0.964550700741962, |
|
"eval_roc_auc": 0.9712634456090762, |
|
"eval_runtime": 4.8624, |
|
"eval_samples_per_second": 1439.42, |
|
"eval_steps_per_second": 5.759, |
|
"step": 990 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 0.0, |
|
"loss": 0.0011, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.9712816116588084, |
|
"eval_f1": 0.9722260605223159, |
|
"eval_loss": 0.1769445687532425, |
|
"eval_precision": 0.9777654252362423, |
|
"eval_recall": 0.9667491068974993, |
|
"eval_roc_auc": 0.9714697915439877, |
|
"eval_runtime": 4.9001, |
|
"eval_samples_per_second": 1428.327, |
|
"eval_steps_per_second": 5.714, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 1100, |
|
"total_flos": 1.854013711589376e+16, |
|
"train_loss": 0.04638458222828128, |
|
"train_runtime": 631.2261, |
|
"train_samples_per_second": 443.454, |
|
"train_steps_per_second": 1.743 |
|
} |
|
], |
|
"max_steps": 1100, |
|
"num_train_epochs": 10, |
|
"total_flos": 1.854013711589376e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|