File size: 6,706 Bytes
c311cbf |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 |
***** Eval results ***** 2021-12-13 21:36:24.587572epoch = 1.0 eval_HasAns_exact = 78.35122965015587 eval_HasAns_f1 = 85.13968688137153 eval_HasAns_total = 5774 eval_NoAns_exact = 82.26532732940768 eval_NoAns_f1 = 82.26532732940768 eval_NoAns_total = 5774 eval_best_exact = 83.36508486317977 eval_best_exact_thresh = -4.265625 eval_best_f1 = 86.50049020991854 eval_best_f1_thresh = -3.76171875 eval_exact = 80.30827848978178 eval_f1 = 83.70250710538936 eval_runtime = 116.2823 eval_samples_per_second = 119.743 eval_steps_per_second = 0.937 eval_total = 11548 ***** Eval results ***** 2021-12-13 23:54:17.975036epoch = 2.0 eval_HasAns_exact = 81.65916175961205 eval_HasAns_f1 = 87.7141782584969 eval_HasAns_total = 5774 eval_NoAns_exact = 79.14790439903014 eval_NoAns_f1 = 79.14790439903014 eval_NoAns_total = 5774 eval_best_exact = 85.417388292345 eval_best_exact_thresh = -4.91015625 eval_best_f1 = 88.2525034462934 eval_best_f1_thresh = -4.91015625 eval_exact = 80.4035330793211 eval_f1 = 83.4310413287634 eval_runtime = 114.7091 eval_samples_per_second = 121.385 eval_steps_per_second = 0.95 eval_total = 11548 ***** Eval results ***** 2021-12-14 02:12:16.445998epoch = 3.0 eval_HasAns_exact = 82.40387945964669 eval_HasAns_f1 = 88.17376210385724 eval_HasAns_total = 5774 eval_NoAns_exact = 82.04018011776931 eval_NoAns_f1 = 82.04018011776931 eval_NoAns_total = 5774 eval_best_exact = 85.93695878074125 eval_best_exact_thresh = -5.8046875 eval_best_f1 = 88.652083582146 eval_best_f1_thresh = -4.640625 eval_exact = 82.222029788708 eval_f1 = 85.10697111081303 eval_runtime = 115.8495 eval_samples_per_second = 120.19 eval_steps_per_second = 0.941 eval_total = 11548 ***** Eval results ***** 2021-12-14 04:30:40.843577epoch = 4.0 eval_HasAns_exact = 82.92344994804296 eval_HasAns_f1 = 88.76361604970366 eval_HasAns_total = 5774 eval_NoAns_exact = 75.68410114305507 eval_NoAns_f1 = 75.68410114305507 eval_NoAns_total = 5774 eval_best_exact = 86.31797713889851 eval_best_exact_thresh = -7.69921875 eval_best_f1 = 89.0138490084362 eval_best_f1_thresh = -7.4140625 eval_exact = 79.30377554554902 eval_f1 = 82.22385859637924 eval_runtime = 116.6262 eval_samples_per_second = 119.39 eval_steps_per_second = 0.935 eval_total = 11548 ***** Eval results ***** 2021-12-14 06:49:11.744655epoch = 5.0 eval_HasAns_exact = 83.04468306200208 eval_HasAns_f1 = 88.60010543614725 eval_HasAns_total = 5774 eval_NoAns_exact = 84.48216141323172 eval_NoAns_f1 = 84.48216141323172 eval_NoAns_total = 5774 eval_best_exact = 87.20990647731209 eval_best_exact_thresh = -4.83984375 eval_best_f1 = 89.8436215977173 eval_best_f1_thresh = -4.83984375 eval_exact = 83.76342223761691 eval_f1 = 86.5411334246892 eval_runtime = 117.7564 eval_samples_per_second = 118.244 eval_steps_per_second = 0.926 eval_total = 11548 ***** Eval results ***** 2021-12-14 09:07:43.312763epoch = 6.0 eval_HasAns_exact = 83.46033945271908 eval_HasAns_f1 = 89.05328761170561 eval_HasAns_total = 5774 eval_NoAns_exact = 82.05749913404918 eval_NoAns_f1 = 82.05749913404918 eval_NoAns_total = 5774 eval_best_exact = 87.53030827848978 eval_best_exact_thresh = -6.7421875 eval_best_f1 = 90.18823628334343 eval_best_f1_thresh = -5.328125 eval_exact = 82.75891929338414 eval_f1 = 85.55539337287718 eval_runtime = 115.8934 eval_samples_per_second = 120.145 eval_steps_per_second = 0.941 eval_total = 11548 ***** Eval results ***** 2021-12-14 11:26:17.714938epoch = 7.0 eval_HasAns_exact = 83.47765846899897 eval_HasAns_f1 = 88.97497847186122 eval_HasAns_total = 5774 eval_NoAns_exact = 83.28714928992034 eval_NoAns_f1 = 83.28714928992034 eval_NoAns_total = 5774 eval_best_exact = 87.56494631104954 eval_best_exact_thresh = -5.70703125 eval_best_f1 = 90.1712271871601 eval_best_f1_thresh = -5.6875 eval_exact = 83.38240387945964 eval_f1 = 86.13106388089054 eval_runtime = 118.9527 eval_samples_per_second = 117.055 eval_steps_per_second = 0.916 eval_total = 11548 ***** Eval results ***** 2021-12-14 13:22:43.923006epoch = 6.0 eval_HasAns_exact = 83.46033945271908 eval_HasAns_f1 = 89.05328761170561 eval_HasAns_total = 5774 eval_NoAns_exact = 82.05749913404918 eval_NoAns_f1 = 82.05749913404918 eval_NoAns_total = 5774 eval_best_exact = 87.53030827848978 eval_best_exact_thresh = -6.7421875 eval_best_f1 = 90.18823628334343 eval_best_f1_thresh = -5.328125 eval_exact = 82.75891929338414 eval_f1 = 85.55539337287718 eval_runtime = 118.456 eval_samples_per_second = 117.546 eval_steps_per_second = 0.92 eval_total = 11548 ***** Eval results ***** 2021-12-14 15:41:40.429066epoch = 7.0 eval_HasAns_exact = 83.47765846899897 eval_HasAns_f1 = 88.97497847186122 eval_HasAns_total = 5774 eval_NoAns_exact = 83.28714928992034 eval_NoAns_f1 = 83.28714928992034 eval_NoAns_total = 5774 eval_best_exact = 87.56494631104954 eval_best_exact_thresh = -5.70703125 eval_best_f1 = 90.1712271871601 eval_best_f1_thresh = -5.6875 eval_exact = 83.38240387945964 eval_f1 = 86.13106388089054 eval_runtime = 116.1628 eval_samples_per_second = 119.866 eval_steps_per_second = 0.938 eval_total = 11548 ***** Eval results ***** 2021-12-14 18:00:18.739183epoch = 8.0 eval_HasAns_exact = 83.80671977831659 eval_HasAns_f1 = 89.25279748539205 eval_HasAns_total = 5774 eval_NoAns_exact = 82.35192241080706 eval_NoAns_f1 = 82.35192241080706 eval_NoAns_total = 5774 eval_best_exact = 87.7641149982681 eval_best_exact_thresh = -5.828125 eval_best_f1 = 90.35660938760992 eval_best_f1_thresh = -5.828125 eval_exact = 83.07932109456183 eval_f1 = 85.8023599480993 eval_runtime = 114.8772 eval_samples_per_second = 121.208 eval_steps_per_second = 0.949 eval_total = 11548 ***** Eval results ***** 2021-12-14 20:19:11.241603epoch = 9.0 eval_HasAns_exact = 83.70280568063734 eval_HasAns_f1 = 89.21377471775827 eval_HasAns_total = 5774 eval_NoAns_exact = 82.38656044336682 eval_NoAns_f1 = 82.38656044336682 eval_NoAns_total = 5774 eval_best_exact = 87.85936958780741 eval_best_exact_thresh = -6.28515625 eval_best_f1 = 90.4998967568238 eval_best_f1_thresh = -5.98046875 eval_exact = 83.04468306200208 eval_f1 = 85.80016758056232 eval_runtime = 114.8108 eval_samples_per_second = 121.278 eval_steps_per_second = 0.949 eval_total = 11548 ***** Eval results ***** 2021-12-14 22:37:47.534128epoch = 10.0 eval_HasAns_exact = 83.65084863179771 eval_HasAns_f1 = 89.1463632488054 eval_HasAns_total = 5774 eval_NoAns_exact = 82.99272601316245 eval_NoAns_f1 = 82.99272601316245 eval_NoAns_total = 5774 eval_best_exact = 87.81607204710772 eval_best_exact_thresh = -6.37890625 eval_best_f1 = 90.44887200606756 eval_best_f1_thresh = -6.046875 eval_exact = 83.32178732248008 eval_f1 = 86.0695446309837 eval_runtime = 116.3261 eval_samples_per_second = 119.698 eval_steps_per_second = 0.937 eval_total = 11548 |