{ "best_metric": 0.40153906255014676, "best_model_checkpoint": "/home2/s5432073/language-tech-project/results/ltp-roberta-large-defaultltp-roberta-large-default-0/checkpoint-1200", "epoch": 8.284023668639053, "global_step": 1400, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.18, "learning_rate": 9.28348909657321e-06, "loss": 0.4442, "step": 200 }, { "epoch": 1.18, "eval_f1": 0.14004634931160595, "eval_f1_all": [ 0.11111111111111112, 0.19823008849557522, 0.0, 0.0, 0.5077262693156732, 0.0, 0.015037593984962407, 0.0, 0.7197452229299364, 0.6306954436450838, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.5973799126637556, 0.015625, 0.0, 0.005376344086021506 ], "eval_loss": 0.3573361933231354, "eval_runtime": 3.7892, "eval_samples_per_second": 500.363, "eval_steps_per_second": 15.834, "step": 200 }, { "epoch": 2.37, "learning_rate": 8.037383177570094e-06, "loss": 0.3303, "step": 400 }, { "epoch": 2.37, "eval_f1": 0.26419617591690636, "eval_f1_all": [ 0.43804034582132567, 0.31333333333333335, 0.0, 0.0, 0.616, 0.03592814371257485, 0.3128491620111732, 0.0, 0.7331058020477816, 0.5398601398601399, 0.16580310880829016, 0.391025641025641, 0.0, 0.0, 0.13119533527696794, 0.0, 0.6373056994818653, 0.6169154228855722, 0.02643171806167401, 0.32612966601178783 ], "eval_loss": 0.32742321491241455, "eval_runtime": 3.2193, "eval_samples_per_second": 588.954, "eval_steps_per_second": 18.638, "step": 400 }, { "epoch": 3.55, "learning_rate": 6.791277258566978e-06, "loss": 0.2955, "step": 600 }, { "epoch": 3.55, "eval_f1": 0.33856925982901875, "eval_f1_all": [ 0.5025125628140703, 0.5899632802937577, 0.0, 0.07407407407407407, 0.6084275436793423, 0.0588235294117647, 0.3567567567567568, 0.0, 0.7440944881889764, 0.6120481927710844, 0.3916666666666666, 0.49431818181818177, 0.0, 0.015625, 0.5071868583162218, 0.06382978723404255, 0.6857597454256166, 0.6403940886699507, 0.10526315789473682, 0.3206412825651303 ], "eval_loss": 0.31045234203338623, "eval_runtime": 3.1516, "eval_samples_per_second": 601.599, "eval_steps_per_second": 19.038, "step": 600 }, { "epoch": 4.73, "learning_rate": 5.545171339563863e-06, "loss": 0.275, "step": 800 }, { "epoch": 4.73, "eval_f1": 0.35946421270983664, "eval_f1_all": [ 0.5432692307692307, 0.5728770595690748, 0.055944055944055944, 0.125, 0.6434782608695652, 0.11891891891891894, 0.33513513513513515, 0.0, 0.7636594663278272, 0.638655462184874, 0.41071428571428564, 0.5251396648044693, 0.0, 0.015503875968992248, 0.5346733668341709, 0.07017543859649122, 0.657762938230384, 0.6666666666666667, 0.11244979919678717, 0.39926062846580407 ], "eval_loss": 0.3056282103061676, "eval_runtime": 3.1101, "eval_samples_per_second": 609.632, "eval_steps_per_second": 19.292, "step": 800 }, { "epoch": 5.92, "learning_rate": 4.299065420560748e-06, "loss": 0.2582, "step": 1000 }, { "epoch": 5.92, "eval_f1": 0.3779236416443889, "eval_f1_all": [ 0.5119617224880383, 0.5549872122762148, 0.09523809523809525, 0.24793388429752064, 0.6457739791073124, 0.10112359550561797, 0.31351351351351353, 0.0, 0.7588785046728972, 0.6312056737588652, 0.44999999999999996, 0.5300546448087431, 0.0, 0.015384615384615385, 0.5868995633187772, 0.17857142857142858, 0.6494401378122309, 0.7022222222222223, 0.12851405622489961, 0.45676998368678634 ], "eval_loss": 0.30811235308647156, "eval_runtime": 3.5499, "eval_samples_per_second": 534.102, "eval_steps_per_second": 16.902, "step": 1000 }, { "epoch": 7.1, "learning_rate": 3.0529595015576325e-06, "loss": 0.2446, "step": 1200 }, { "epoch": 7.1, "eval_f1": 0.40153906255014676, "eval_f1_all": [ 0.5172413793103449, 0.5871121718377088, 0.12, 0.3759398496240602, 0.630952380952381, 0.17258883248730966, 0.3768115942028986, 0.0, 0.7563683866753755, 0.6462513199577613, 0.4758064516129032, 0.5527369826435248, 0.0, 0.015037593984962405, 0.5758683729433272, 0.21203438395415472, 0.6746794871794872, 0.7136563876651982, 0.17777777777777778, 0.44991789819376027 ], "eval_loss": 0.30632713437080383, "eval_runtime": 3.2144, "eval_samples_per_second": 589.85, "eval_steps_per_second": 18.666, "step": 1200 }, { "epoch": 8.28, "learning_rate": 1.8068535825545173e-06, "loss": 0.2344, "step": 1400 }, { "epoch": 8.28, "eval_f1": 0.39818355623683893, "eval_f1_all": [ 0.5059665871121718, 0.6030267753201397, 0.13071895424836602, 0.3609022556390977, 0.6425073457394711, 0.17616580310880828, 0.3827751196172249, 0.0, 0.7609942638623327, 0.6363636363636364, 0.4672131147540983, 0.5517241379310345, 0.0, 0.015151515151515152, 0.5907099035933392, 0.14012738853503187, 0.7006960556844547, 0.7053571428571428, 0.1484375, 0.4448336252189142 ], "eval_loss": 0.30558517575263977, "eval_runtime": 3.0733, "eval_samples_per_second": 616.921, "eval_steps_per_second": 19.523, "step": 1400 } ], "max_steps": 1690, "num_train_epochs": 10, "total_flos": 7696217086325736.0, "trial_name": null, "trial_params": null }