|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 10.0, |
|
"global_step": 220, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 9.090909090909092e-05, |
|
"loss": 0.6837, |
|
"step": 22 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.5897435897435898, |
|
"eval_f1": 0.6666666666666666, |
|
"eval_loss": 0.6039571166038513, |
|
"eval_precision": 0.5161290322580645, |
|
"eval_recall": 0.9411764705882353, |
|
"eval_roc_auc": 0.6296791443850267, |
|
"eval_runtime": 0.069, |
|
"eval_samples_per_second": 565.227, |
|
"eval_steps_per_second": 43.479, |
|
"step": 22 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 8.090909090909092e-05, |
|
"loss": 0.3852, |
|
"step": 44 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_f1": 0.9189189189189189, |
|
"eval_loss": 0.28810474276542664, |
|
"eval_precision": 0.85, |
|
"eval_recall": 1.0, |
|
"eval_roc_auc": 0.9318181818181819, |
|
"eval_runtime": 0.064, |
|
"eval_samples_per_second": 609.374, |
|
"eval_steps_per_second": 46.875, |
|
"step": 44 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 7.090909090909092e-05, |
|
"loss": 0.2148, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_f1": 0.9189189189189189, |
|
"eval_loss": 0.38069406151771545, |
|
"eval_precision": 0.85, |
|
"eval_recall": 1.0, |
|
"eval_roc_auc": 0.9318181818181819, |
|
"eval_runtime": 0.065, |
|
"eval_samples_per_second": 600.004, |
|
"eval_steps_per_second": 46.154, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 6.090909090909091e-05, |
|
"loss": 0.0701, |
|
"step": 88 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8717948717948718, |
|
"eval_f1": 0.8717948717948718, |
|
"eval_loss": 0.4933823347091675, |
|
"eval_precision": 0.7727272727272727, |
|
"eval_recall": 1.0, |
|
"eval_roc_auc": 0.8863636363636364, |
|
"eval_runtime": 0.071, |
|
"eval_samples_per_second": 549.297, |
|
"eval_steps_per_second": 42.254, |
|
"step": 88 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 5.090909090909091e-05, |
|
"loss": 0.0164, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.8974358974358975, |
|
"eval_f1": 0.8947368421052632, |
|
"eval_loss": 0.4892081320285797, |
|
"eval_precision": 0.8095238095238095, |
|
"eval_recall": 1.0, |
|
"eval_roc_auc": 0.9090909090909091, |
|
"eval_runtime": 0.064, |
|
"eval_samples_per_second": 609.381, |
|
"eval_steps_per_second": 46.875, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 4.0909090909090915e-05, |
|
"loss": 0.0039, |
|
"step": 132 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.8974358974358975, |
|
"eval_f1": 0.8947368421052632, |
|
"eval_loss": 0.49288177490234375, |
|
"eval_precision": 0.8095238095238095, |
|
"eval_recall": 1.0, |
|
"eval_roc_auc": 0.9090909090909091, |
|
"eval_runtime": 0.058, |
|
"eval_samples_per_second": 672.418, |
|
"eval_steps_per_second": 51.724, |
|
"step": 132 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 3.090909090909091e-05, |
|
"loss": 0.0012, |
|
"step": 154 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_f1": 0.9189189189189189, |
|
"eval_loss": 0.4065372943878174, |
|
"eval_precision": 0.85, |
|
"eval_recall": 1.0, |
|
"eval_roc_auc": 0.9318181818181819, |
|
"eval_runtime": 0.063, |
|
"eval_samples_per_second": 619.043, |
|
"eval_steps_per_second": 47.619, |
|
"step": 154 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 2.090909090909091e-05, |
|
"loss": 0.0008, |
|
"step": 176 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_f1": 0.9189189189189189, |
|
"eval_loss": 0.48369330167770386, |
|
"eval_precision": 0.85, |
|
"eval_recall": 1.0, |
|
"eval_roc_auc": 0.9318181818181819, |
|
"eval_runtime": 0.059, |
|
"eval_samples_per_second": 661.03, |
|
"eval_steps_per_second": 50.848, |
|
"step": 176 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 1.0909090909090909e-05, |
|
"loss": 0.0007, |
|
"step": 198 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_f1": 0.9189189189189189, |
|
"eval_loss": 0.4999829828739166, |
|
"eval_precision": 0.85, |
|
"eval_recall": 1.0, |
|
"eval_roc_auc": 0.9318181818181819, |
|
"eval_runtime": 0.061, |
|
"eval_samples_per_second": 639.321, |
|
"eval_steps_per_second": 49.179, |
|
"step": 198 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 9.09090909090909e-07, |
|
"loss": 0.0006, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_f1": 0.9189189189189189, |
|
"eval_loss": 0.5037449598312378, |
|
"eval_precision": 0.85, |
|
"eval_recall": 1.0, |
|
"eval_roc_auc": 0.9318181818181819, |
|
"eval_runtime": 0.058, |
|
"eval_samples_per_second": 672.418, |
|
"eval_steps_per_second": 51.724, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 220, |
|
"total_flos": 197738122089864.0, |
|
"train_loss": 0.1377350079192018, |
|
"train_runtime": 17.676, |
|
"train_samples_per_second": 194.048, |
|
"train_steps_per_second": 12.446 |
|
} |
|
], |
|
"max_steps": 220, |
|
"num_train_epochs": 10, |
|
"total_flos": 197738122089864.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|