{ "best_metric": 0.06356040388345718, "best_model_checkpoint": "autotrain-as4wo-k82ez/checkpoint-48324", "epoch": 3.0, "eval_steps": 500, "global_step": 48324, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.05, "learning_rate": 8.286778398510241e-06, "loss": 0.4813, "step": 805 }, { "epoch": 0.1, "learning_rate": 1.6614938961307676e-05, "loss": 0.3538, "step": 1610 }, { "epoch": 0.15, "learning_rate": 2.4932753983033314e-05, "loss": 0.2967, "step": 2415 }, { "epoch": 0.2, "learning_rate": 3.3260914545830745e-05, "loss": 0.2605, "step": 3220 }, { "epoch": 0.25, "learning_rate": 4.1589075108628184e-05, "loss": 0.2491, "step": 4025 }, { "epoch": 0.3, "learning_rate": 4.9917235671425615e-05, "loss": 0.2294, "step": 4830 }, { "epoch": 0.35, "learning_rate": 4.908486813363685e-05, "loss": 0.218, "step": 5635 }, { "epoch": 0.4, "learning_rate": 4.815938929893541e-05, "loss": 0.1886, "step": 6440 }, { "epoch": 0.45, "learning_rate": 4.723391046423398e-05, "loss": 0.1842, "step": 7245 }, { "epoch": 0.5, "learning_rate": 4.630843162953255e-05, "loss": 0.1583, "step": 8050 }, { "epoch": 0.55, "learning_rate": 4.5384102457979815e-05, "loss": 0.1594, "step": 8855 }, { "epoch": 0.6, "learning_rate": 4.4458623623278384e-05, "loss": 0.1576, "step": 9660 }, { "epoch": 0.65, "learning_rate": 4.353544411487435e-05, "loss": 0.1407, "step": 10465 }, { "epoch": 0.7, "learning_rate": 4.260996528017291e-05, "loss": 0.1376, "step": 11270 }, { "epoch": 0.75, "learning_rate": 4.168448644547148e-05, "loss": 0.1427, "step": 12075 }, { "epoch": 0.8, "learning_rate": 4.0760157273918745e-05, "loss": 0.138, "step": 12880 }, { "epoch": 0.85, "learning_rate": 3.983467843921731e-05, "loss": 0.1268, "step": 13685 }, { "epoch": 0.9, "learning_rate": 3.8909199604515875e-05, "loss": 0.1335, "step": 14490 }, { "epoch": 0.95, "learning_rate": 3.798487043296314e-05, "loss": 0.1231, "step": 15295 }, { "epoch": 1.0, "learning_rate": 3.705939159826171e-05, "loss": 0.1248, "step": 16100 }, { "epoch": 1.0, "eval_accuracy": 0.9748882542835858, "eval_auc": 0.9954070396202473, "eval_f1": 0.9635372064722586, "eval_loss": 0.11125129461288452, "eval_precision": 0.9544602196624699, "eval_recall": 0.9727884965416819, "eval_runtime": 44.32, "eval_samples_per_second": 726.896, "eval_steps_per_second": 45.442, "step": 16108 }, { "epoch": 1.05, "learning_rate": 3.613391276356028e-05, "loss": 0.1071, "step": 16905 }, { "epoch": 1.1, "learning_rate": 3.520843392885885e-05, "loss": 0.0985, "step": 17710 }, { "epoch": 1.15, "learning_rate": 3.4282955094157416e-05, "loss": 0.095, "step": 18515 }, { "epoch": 1.2, "learning_rate": 3.3357476259455985e-05, "loss": 0.085, "step": 19320 }, { "epoch": 1.25, "learning_rate": 3.2431997424754554e-05, "loss": 0.0904, "step": 20125 }, { "epoch": 1.3, "learning_rate": 3.1506518590053115e-05, "loss": 0.0808, "step": 20930 }, { "epoch": 1.35, "learning_rate": 3.0581039755351684e-05, "loss": 0.0917, "step": 21735 }, { "epoch": 1.4, "learning_rate": 2.965556092065025e-05, "loss": 0.0812, "step": 22540 }, { "epoch": 1.45, "learning_rate": 2.8732381412246213e-05, "loss": 0.0861, "step": 23345 }, { "epoch": 1.5, "learning_rate": 2.780690257754478e-05, "loss": 0.0733, "step": 24150 }, { "epoch": 1.55, "learning_rate": 2.6882573405992045e-05, "loss": 0.088, "step": 24955 }, { "epoch": 1.6, "learning_rate": 2.5957094571290614e-05, "loss": 0.0745, "step": 25760 }, { "epoch": 1.65, "learning_rate": 2.5031615736589182e-05, "loss": 0.0751, "step": 26565 }, { "epoch": 1.7, "learning_rate": 2.4106136901887748e-05, "loss": 0.0661, "step": 27370 }, { "epoch": 1.75, "learning_rate": 2.3180658067186313e-05, "loss": 0.0659, "step": 28175 }, { "epoch": 1.8, "learning_rate": 2.225517923248488e-05, "loss": 0.0648, "step": 28980 }, { "epoch": 1.85, "learning_rate": 2.132970039778345e-05, "loss": 0.0687, "step": 29785 }, { "epoch": 1.9, "learning_rate": 2.0406520889379414e-05, "loss": 0.0596, "step": 30590 }, { "epoch": 1.95, "learning_rate": 1.948104205467798e-05, "loss": 0.0649, "step": 31395 }, { "epoch": 2.0, "learning_rate": 1.8556712883125246e-05, "loss": 0.0625, "step": 32200 }, { "epoch": 2.0, "eval_accuracy": 0.9843245592252297, "eval_auc": 0.9981209244728939, "eval_f1": 0.9769016146000092, "eval_loss": 0.06887876242399216, "eval_precision": 0.9819770114942529, "eval_recall": 0.9718784128139789, "eval_runtime": 44.3879, "eval_samples_per_second": 725.783, "eval_steps_per_second": 45.373, "step": 32216 }, { "epoch": 2.05, "learning_rate": 1.763238371157251e-05, "loss": 0.0398, "step": 33005 }, { "epoch": 2.1, "learning_rate": 1.6706904876871077e-05, "loss": 0.0423, "step": 33810 }, { "epoch": 2.15, "learning_rate": 1.5781426042169646e-05, "loss": 0.0447, "step": 34615 }, { "epoch": 2.2, "learning_rate": 1.4855947207468213e-05, "loss": 0.0369, "step": 35420 }, { "epoch": 2.25, "learning_rate": 1.393046837276678e-05, "loss": 0.0356, "step": 36225 }, { "epoch": 2.3, "learning_rate": 1.3006139201214046e-05, "loss": 0.0461, "step": 37030 }, { "epoch": 2.35, "learning_rate": 1.2080660366512613e-05, "loss": 0.0331, "step": 37835 }, { "epoch": 2.4, "learning_rate": 1.1156331194959878e-05, "loss": 0.0393, "step": 38640 }, { "epoch": 2.45, "learning_rate": 1.0230852360258445e-05, "loss": 0.0338, "step": 39445 }, { "epoch": 2.5, "learning_rate": 9.305373525557012e-06, "loss": 0.0393, "step": 40250 }, { "epoch": 2.55, "learning_rate": 8.37989469085558e-06, "loss": 0.0342, "step": 41055 }, { "epoch": 2.6, "learning_rate": 7.4544158561541465e-06, "loss": 0.0342, "step": 41860 }, { "epoch": 2.65, "learning_rate": 6.530086684601412e-06, "loss": 0.0351, "step": 42665 }, { "epoch": 2.7, "learning_rate": 5.6057575130486766e-06, "loss": 0.0337, "step": 43470 }, { "epoch": 2.75, "learning_rate": 4.680278678347244e-06, "loss": 0.0343, "step": 44275 }, { "epoch": 2.8, "learning_rate": 3.7547998436458122e-06, "loss": 0.0348, "step": 45080 }, { "epoch": 2.85, "learning_rate": 2.829321008944379e-06, "loss": 0.0317, "step": 45885 }, { "epoch": 2.9, "learning_rate": 1.903842174242947e-06, "loss": 0.029, "step": 46690 }, { "epoch": 2.95, "learning_rate": 9.806626658389092e-07, "loss": 0.0402, "step": 47495 }, { "epoch": 3.0, "learning_rate": 5.518383113747672e-08, "loss": 0.0304, "step": 48300 }, { "epoch": 3.0, "eval_accuracy": 0.9876148497640924, "eval_auc": 0.998944462787882, "eval_f1": 0.9819203407494677, "eval_loss": 0.06356040388345718, "eval_precision": 0.977799837559787, "eval_recall": 0.9860757189661449, "eval_runtime": 44.4481, "eval_samples_per_second": 724.8, "eval_steps_per_second": 45.311, "step": 48324 } ], "logging_steps": 805, "max_steps": 48324, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 500, "total_flos": 1.2802510444207104e+16, "train_batch_size": 8, "trial_name": null, "trial_params": null }