***** Eval results ***** 2021-12-13 21:36:24.587572epoch = 1.0 eval_HasAns_exact = 78.35122965015587 eval_HasAns_f1 = 85.13968688137153 eval_HasAns_total = 5774 eval_NoAns_exact = 82.26532732940768 eval_NoAns_f1 = 82.26532732940768 eval_NoAns_total = 5774 eval_best_exact = 83.36508486317977 eval_best_exact_thresh = -4.265625 eval_best_f1 = 86.50049020991854 eval_best_f1_thresh = -3.76171875 eval_exact = 80.30827848978178 eval_f1 = 83.70250710538936 eval_runtime = 116.2823 eval_samples_per_second = 119.743 eval_steps_per_second = 0.937 eval_total = 11548 ***** Eval results ***** 2021-12-13 23:54:17.975036epoch = 2.0 eval_HasAns_exact = 81.65916175961205 eval_HasAns_f1 = 87.7141782584969 eval_HasAns_total = 5774 eval_NoAns_exact = 79.14790439903014 eval_NoAns_f1 = 79.14790439903014 eval_NoAns_total = 5774 eval_best_exact = 85.417388292345 eval_best_exact_thresh = -4.91015625 eval_best_f1 = 88.2525034462934 eval_best_f1_thresh = -4.91015625 eval_exact = 80.4035330793211 eval_f1 = 83.4310413287634 eval_runtime = 114.7091 eval_samples_per_second = 121.385 eval_steps_per_second = 0.95 eval_total = 11548 ***** Eval results ***** 2021-12-14 02:12:16.445998epoch = 3.0 eval_HasAns_exact = 82.40387945964669 eval_HasAns_f1 = 88.17376210385724 eval_HasAns_total = 5774 eval_NoAns_exact = 82.04018011776931 eval_NoAns_f1 = 82.04018011776931 eval_NoAns_total = 5774 eval_best_exact = 85.93695878074125 eval_best_exact_thresh = -5.8046875 eval_best_f1 = 88.652083582146 eval_best_f1_thresh = -4.640625 eval_exact = 82.222029788708 eval_f1 = 85.10697111081303 eval_runtime = 115.8495 eval_samples_per_second = 120.19 eval_steps_per_second = 0.941 eval_total = 11548 ***** Eval results ***** 2021-12-14 04:30:40.843577epoch = 4.0 eval_HasAns_exact = 82.92344994804296 eval_HasAns_f1 = 88.76361604970366 eval_HasAns_total = 5774 eval_NoAns_exact = 75.68410114305507 eval_NoAns_f1 = 75.68410114305507 eval_NoAns_total = 5774 eval_best_exact = 86.31797713889851 eval_best_exact_thresh = -7.69921875 eval_best_f1 = 89.0138490084362 eval_best_f1_thresh = -7.4140625 eval_exact = 79.30377554554902 eval_f1 = 82.22385859637924 eval_runtime = 116.6262 eval_samples_per_second = 119.39 eval_steps_per_second = 0.935 eval_total = 11548 ***** Eval results ***** 2021-12-14 06:49:11.744655epoch = 5.0 eval_HasAns_exact = 83.04468306200208 eval_HasAns_f1 = 88.60010543614725 eval_HasAns_total = 5774 eval_NoAns_exact = 84.48216141323172 eval_NoAns_f1 = 84.48216141323172 eval_NoAns_total = 5774 eval_best_exact = 87.20990647731209 eval_best_exact_thresh = -4.83984375 eval_best_f1 = 89.8436215977173 eval_best_f1_thresh = -4.83984375 eval_exact = 83.76342223761691 eval_f1 = 86.5411334246892 eval_runtime = 117.7564 eval_samples_per_second = 118.244 eval_steps_per_second = 0.926 eval_total = 11548 ***** Eval results ***** 2021-12-14 09:07:43.312763epoch = 6.0 eval_HasAns_exact = 83.46033945271908 eval_HasAns_f1 = 89.05328761170561 eval_HasAns_total = 5774 eval_NoAns_exact = 82.05749913404918 eval_NoAns_f1 = 82.05749913404918 eval_NoAns_total = 5774 eval_best_exact = 87.53030827848978 eval_best_exact_thresh = -6.7421875 eval_best_f1 = 90.18823628334343 eval_best_f1_thresh = -5.328125 eval_exact = 82.75891929338414 eval_f1 = 85.55539337287718 eval_runtime = 115.8934 eval_samples_per_second = 120.145 eval_steps_per_second = 0.941 eval_total = 11548 ***** Eval results ***** 2021-12-14 11:26:17.714938epoch = 7.0 eval_HasAns_exact = 83.47765846899897 eval_HasAns_f1 = 88.97497847186122 eval_HasAns_total = 5774 eval_NoAns_exact = 83.28714928992034 eval_NoAns_f1 = 83.28714928992034 eval_NoAns_total = 5774 eval_best_exact = 87.56494631104954 eval_best_exact_thresh = -5.70703125 eval_best_f1 = 90.1712271871601 eval_best_f1_thresh = -5.6875 eval_exact = 83.38240387945964 eval_f1 = 86.13106388089054 eval_runtime = 118.9527 eval_samples_per_second = 117.055 eval_steps_per_second = 0.916 eval_total = 11548 ***** Eval results ***** 2021-12-14 13:22:43.923006epoch = 6.0 eval_HasAns_exact = 83.46033945271908 eval_HasAns_f1 = 89.05328761170561 eval_HasAns_total = 5774 eval_NoAns_exact = 82.05749913404918 eval_NoAns_f1 = 82.05749913404918 eval_NoAns_total = 5774 eval_best_exact = 87.53030827848978 eval_best_exact_thresh = -6.7421875 eval_best_f1 = 90.18823628334343 eval_best_f1_thresh = -5.328125 eval_exact = 82.75891929338414 eval_f1 = 85.55539337287718 eval_runtime = 118.456 eval_samples_per_second = 117.546 eval_steps_per_second = 0.92 eval_total = 11548 ***** Eval results ***** 2021-12-14 15:41:40.429066epoch = 7.0 eval_HasAns_exact = 83.47765846899897 eval_HasAns_f1 = 88.97497847186122 eval_HasAns_total = 5774 eval_NoAns_exact = 83.28714928992034 eval_NoAns_f1 = 83.28714928992034 eval_NoAns_total = 5774 eval_best_exact = 87.56494631104954 eval_best_exact_thresh = -5.70703125 eval_best_f1 = 90.1712271871601 eval_best_f1_thresh = -5.6875 eval_exact = 83.38240387945964 eval_f1 = 86.13106388089054 eval_runtime = 116.1628 eval_samples_per_second = 119.866 eval_steps_per_second = 0.938 eval_total = 11548 ***** Eval results ***** 2021-12-14 18:00:18.739183epoch = 8.0 eval_HasAns_exact = 83.80671977831659 eval_HasAns_f1 = 89.25279748539205 eval_HasAns_total = 5774 eval_NoAns_exact = 82.35192241080706 eval_NoAns_f1 = 82.35192241080706 eval_NoAns_total = 5774 eval_best_exact = 87.7641149982681 eval_best_exact_thresh = -5.828125 eval_best_f1 = 90.35660938760992 eval_best_f1_thresh = -5.828125 eval_exact = 83.07932109456183 eval_f1 = 85.8023599480993 eval_runtime = 114.8772 eval_samples_per_second = 121.208 eval_steps_per_second = 0.949 eval_total = 11548 ***** Eval results ***** 2021-12-14 20:19:11.241603epoch = 9.0 eval_HasAns_exact = 83.70280568063734 eval_HasAns_f1 = 89.21377471775827 eval_HasAns_total = 5774 eval_NoAns_exact = 82.38656044336682 eval_NoAns_f1 = 82.38656044336682 eval_NoAns_total = 5774 eval_best_exact = 87.85936958780741 eval_best_exact_thresh = -6.28515625 eval_best_f1 = 90.4998967568238 eval_best_f1_thresh = -5.98046875 eval_exact = 83.04468306200208 eval_f1 = 85.80016758056232 eval_runtime = 114.8108 eval_samples_per_second = 121.278 eval_steps_per_second = 0.949 eval_total = 11548 ***** Eval results ***** 2021-12-14 22:37:47.534128epoch = 10.0 eval_HasAns_exact = 83.65084863179771 eval_HasAns_f1 = 89.1463632488054 eval_HasAns_total = 5774 eval_NoAns_exact = 82.99272601316245 eval_NoAns_f1 = 82.99272601316245 eval_NoAns_total = 5774 eval_best_exact = 87.81607204710772 eval_best_exact_thresh = -6.37890625 eval_best_f1 = 90.44887200606756 eval_best_f1_thresh = -6.046875 eval_exact = 83.32178732248008 eval_f1 = 86.0695446309837 eval_runtime = 116.3261 eval_samples_per_second = 119.698 eval_steps_per_second = 0.937 eval_total = 11548