{ "best_metric": null, "best_model_checkpoint": null, "epoch": 10.0, "global_step": 5510, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 8.101633393829401e-06, "loss": 0.6213, "step": 551 }, { "epoch": 1.0, "eval_accuracy": 0.6627921055817896, "eval_f1": 0.6499937162247078, "eval_loss": 0.5820437073707581, "eval_precision": 0.6816025303110174, "eval_recall": 0.6211866442469373, "eval_roc_auc": 0.6631323846234687, "eval_runtime": 28.6308, "eval_samples_per_second": 288.465, "eval_steps_per_second": 6.427, "step": 551 }, { "epoch": 2.0, "learning_rate": 7.203266787658802e-06, "loss": 0.5585, "step": 1102 }, { "epoch": 2.0, "eval_accuracy": 0.6689671873108124, "eval_f1": 0.5894894894894895, "eval_loss": 0.5801684856414795, "eval_precision": 0.7861433720464558, "eval_recall": 0.47153495075666585, "eval_roc_auc": 0.670581928503333, "eval_runtime": 28.9285, "eval_samples_per_second": 285.497, "eval_steps_per_second": 6.361, "step": 1102 }, { "epoch": 3.0, "learning_rate": 6.304900181488204e-06, "loss": 0.5109, "step": 1653 }, { "epoch": 3.0, "eval_accuracy": 0.6885821528030028, "eval_f1": 0.6392706872370266, "eval_loss": 0.5686787962913513, "eval_precision": 0.7681159420289855, "eval_recall": 0.5474417487388902, "eval_roc_auc": 0.689736499369445, "eval_runtime": 28.9515, "eval_samples_per_second": 285.27, "eval_steps_per_second": 6.355, "step": 1653 }, { "epoch": 4.0, "learning_rate": 5.404900181488204e-06, "loss": 0.4645, "step": 2204 }, { "epoch": 4.0, "eval_accuracy": 0.6972999152439763, "eval_f1": 0.6525847693162868, "eval_loss": 0.5875381827354431, "eval_precision": 0.7741510056050115, "eval_recall": 0.5640163343742494, "eval_roc_auc": 0.6983900031246246, "eval_runtime": 29.0279, "eval_samples_per_second": 284.519, "eval_steps_per_second": 6.339, "step": 2204 }, { "epoch": 5.0, "learning_rate": 4.504900181488204e-06, "loss": 0.4161, "step": 2755 }, { "epoch": 5.0, "eval_accuracy": 0.709650078702022, "eval_f1": 0.6926429120738272, "eval_loss": 0.5819324254989624, "eval_precision": 0.7425116790327013, "eval_recall": 0.6490511650252222, "eval_roc_auc": 0.7101456997001111, "eval_runtime": 29.0292, "eval_samples_per_second": 284.506, "eval_steps_per_second": 6.338, "step": 2755 }, { "epoch": 6.0, "learning_rate": 3.6049001814882032e-06, "loss": 0.3756, "step": 3306 }, { "epoch": 6.0, "eval_accuracy": 0.705775517617145, "eval_f1": 0.6843335931410757, "eval_loss": 0.6318923234939575, "eval_precision": 0.7451202263083451, "eval_recall": 0.6327167907758828, "eval_roc_auc": 0.7063730438254414, "eval_runtime": 29.1411, "eval_samples_per_second": 283.414, "eval_steps_per_second": 6.314, "step": 3306 }, { "epoch": 7.0, "learning_rate": 2.706533575317604e-06, "loss": 0.3451, "step": 3857 }, { "epoch": 7.0, "eval_accuracy": 0.7025063567017799, "eval_f1": 0.6842308186608405, "eval_loss": 0.6542169451713562, "eval_precision": 0.7357656163626313, "eval_recall": 0.6394427095844343, "eval_roc_auc": 0.7030221360422172, "eval_runtime": 29.0336, "eval_samples_per_second": 284.464, "eval_steps_per_second": 6.337, "step": 3857 }, { "epoch": 8.0, "learning_rate": 1.8065335753176044e-06, "loss": 0.3144, "step": 4408 }, { "epoch": 8.0, "eval_accuracy": 0.701658796464463, "eval_f1": 0.6680140123955807, "eval_loss": 0.7204051613807678, "eval_precision": 0.7606627799938631, "eval_recall": 0.5954840259428297, "eval_roc_auc": 0.7025271692214148, "eval_runtime": 29.0414, "eval_samples_per_second": 284.387, "eval_steps_per_second": 6.336, "step": 4408 }, { "epoch": 9.0, "learning_rate": 9.065335753176044e-07, "loss": 0.2978, "step": 4959 }, { "epoch": 9.0, "eval_accuracy": 0.7032328369051943, "eval_f1": 0.6755790866975514, "eval_loss": 0.7168041467666626, "eval_precision": 0.7523584905660378, "eval_recall": 0.6130194571222676, "eval_roc_auc": 0.7039706660611338, "eval_runtime": 29.0774, "eval_samples_per_second": 284.035, "eval_steps_per_second": 6.328, "step": 4959 }, { "epoch": 10.0, "learning_rate": 6.533575317604356e-09, "loss": 0.2757, "step": 5510 }, { "epoch": 10.0, "eval_accuracy": 0.7019009565322678, "eval_f1": 0.6654891304347826, "eval_loss": 0.7599468231201172, "eval_precision": 0.7660306537378793, "eval_recall": 0.5882776843622388, "eval_roc_auc": 0.7028302484311194, "eval_runtime": 29.101, "eval_samples_per_second": 283.804, "eval_steps_per_second": 6.323, "step": 5510 }, { "epoch": 10.0, "step": 5510, "total_flos": 6.51831328548864e+16, "train_loss": 0.4179859999087242, "train_runtime": 3050.636, "train_samples_per_second": 81.209, "train_steps_per_second": 1.806 } ], "max_steps": 5510, "num_train_epochs": 10, "total_flos": 6.51831328548864e+16, "trial_name": null, "trial_params": null }