File size: 5,713 Bytes
b32141a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 10.0,
"global_step": 1100,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"learning_rate": 9e-05,
"loss": 0.2594,
"step": 110
},
{
"epoch": 1.0,
"eval_accuracy": 0.951993141877411,
"eval_f1": 0.9531642040702537,
"eval_loss": 0.14524979889392853,
"eval_precision": 0.9671852899575671,
"eval_recall": 0.9395438307227261,
"eval_roc_auc": 0.9525100105994584,
"eval_runtime": 4.6691,
"eval_samples_per_second": 1498.989,
"eval_steps_per_second": 5.997,
"step": 110
},
{
"epoch": 2.0,
"learning_rate": 8e-05,
"loss": 0.0966,
"step": 220
},
{
"epoch": 2.0,
"eval_accuracy": 0.9644234890698671,
"eval_f1": 0.9655839668279198,
"eval_loss": 0.1103191077709198,
"eval_precision": 0.971357063403782,
"eval_recall": 0.9598790876614455,
"eval_roc_auc": 0.9646121628783418,
"eval_runtime": 4.725,
"eval_samples_per_second": 1481.272,
"eval_steps_per_second": 5.926,
"step": 220
},
{
"epoch": 3.0,
"learning_rate": 7e-05,
"loss": 0.0499,
"step": 330
},
{
"epoch": 3.0,
"eval_accuracy": 0.9639948564080583,
"eval_f1": 0.9652796913750344,
"eval_loss": 0.11932428181171417,
"eval_precision": 0.967946946670351,
"eval_recall": 0.962627095355867,
"eval_roc_auc": 0.9640516429160287,
"eval_runtime": 4.7987,
"eval_samples_per_second": 1458.529,
"eval_steps_per_second": 5.835,
"step": 330
},
{
"epoch": 4.0,
"learning_rate": 6e-05,
"loss": 0.0251,
"step": 440
},
{
"epoch": 4.0,
"eval_accuracy": 0.962280325760823,
"eval_f1": 0.9639639639639641,
"eval_loss": 0.12893760204315186,
"eval_precision": 0.9576891781936534,
"eval_recall": 0.9703215169002474,
"eval_roc_auc": 0.9619464727358379,
"eval_runtime": 4.816,
"eval_samples_per_second": 1453.283,
"eval_steps_per_second": 5.814,
"step": 440
},
{
"epoch": 5.0,
"learning_rate": 5e-05,
"loss": 0.0132,
"step": 550
},
{
"epoch": 5.0,
"eval_accuracy": 0.9659951421631662,
"eval_f1": 0.9673435784851812,
"eval_loss": 0.1495329588651657,
"eval_precision": 0.9660180871471636,
"eval_recall": 0.9686727122835944,
"eval_roc_auc": 0.9658839751894163,
"eval_runtime": 4.8435,
"eval_samples_per_second": 1445.041,
"eval_steps_per_second": 5.781,
"step": 550
},
{
"epoch": 6.0,
"learning_rate": 4e-05,
"loss": 0.0086,
"step": 660
},
{
"epoch": 6.0,
"eval_accuracy": 0.9684240605800829,
"eval_f1": 0.9692071896335517,
"eval_loss": 0.1759045422077179,
"eval_precision": 0.9830412662521198,
"eval_recall": 0.9557570761198131,
"eval_roc_auc": 0.968949966631335,
"eval_runtime": 4.8741,
"eval_samples_per_second": 1435.957,
"eval_steps_per_second": 5.745,
"step": 660
},
{
"epoch": 7.0,
"learning_rate": 3e-05,
"loss": 0.0054,
"step": 770
},
{
"epoch": 7.0,
"eval_accuracy": 0.9699957136733819,
"eval_f1": 0.9709141274238227,
"eval_loss": 0.15680807828903198,
"eval_precision": 0.9787768779670483,
"eval_recall": 0.9631766968947513,
"eval_roc_auc": 0.9702788246378518,
"eval_runtime": 4.886,
"eval_samples_per_second": 1432.464,
"eval_steps_per_second": 5.731,
"step": 770
},
{
"epoch": 8.0,
"learning_rate": 2e-05,
"loss": 0.0023,
"step": 880
},
{
"epoch": 8.0,
"eval_accuracy": 0.9707101014430632,
"eval_f1": 0.9717280375120674,
"eval_loss": 0.17754127085208893,
"eval_precision": 0.9753599114064231,
"eval_recall": 0.9681231107447101,
"eval_roc_auc": 0.9708175077533074,
"eval_runtime": 4.8851,
"eval_samples_per_second": 1432.728,
"eval_steps_per_second": 5.732,
"step": 880
},
{
"epoch": 9.0,
"learning_rate": 1e-05,
"loss": 0.0023,
"step": 990
},
{
"epoch": 9.0,
"eval_accuracy": 0.9709958565509359,
"eval_f1": 0.9718953343486086,
"eval_loss": 0.17516092956066132,
"eval_precision": 0.9793526785714286,
"eval_recall": 0.964550700741962,
"eval_roc_auc": 0.9712634456090762,
"eval_runtime": 4.8624,
"eval_samples_per_second": 1439.42,
"eval_steps_per_second": 5.759,
"step": 990
},
{
"epoch": 10.0,
"learning_rate": 0.0,
"loss": 0.0011,
"step": 1100
},
{
"epoch": 10.0,
"eval_accuracy": 0.9712816116588084,
"eval_f1": 0.9722260605223159,
"eval_loss": 0.1769445687532425,
"eval_precision": 0.9777654252362423,
"eval_recall": 0.9667491068974993,
"eval_roc_auc": 0.9714697915439877,
"eval_runtime": 4.9001,
"eval_samples_per_second": 1428.327,
"eval_steps_per_second": 5.714,
"step": 1100
},
{
"epoch": 10.0,
"step": 1100,
"total_flos": 1.854013711589376e+16,
"train_loss": 0.04638458222828128,
"train_runtime": 631.2261,
"train_samples_per_second": 443.454,
"train_steps_per_second": 1.743
}
],
"max_steps": 1100,
"num_train_epochs": 10,
"total_flos": 1.854013711589376e+16,
"trial_name": null,
"trial_params": null
}
|