File size: 7,514 Bytes
54ca777 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 | {
"best_metric": 0.21624045073986053,
"best_model_checkpoint": "/hpcwork/vg380347/NER/EduGBERT/checkpoint-550",
"epoch": 7.446808510638298,
"eval_steps": 50,
"global_step": 1050,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.35,
"eval_f1": 0.5815712900096993,
"eval_loss": 0.3045153319835663,
"eval_precision": 0.5216332212040367,
"eval_recall": 0.6570718877849211,
"eval_runtime": 7.1562,
"eval_samples_per_second": 629.381,
"eval_steps_per_second": 5.031,
"step": 50
},
{
"epoch": 0.71,
"eval_f1": 0.6822522225880804,
"eval_loss": 0.25079214572906494,
"eval_precision": 0.6210286536386525,
"eval_recall": 0.7568673290473408,
"eval_runtime": 7.2954,
"eval_samples_per_second": 617.376,
"eval_steps_per_second": 4.935,
"step": 100
},
{
"epoch": 1.06,
"eval_f1": 0.7016087182148418,
"eval_loss": 0.24814821779727936,
"eval_precision": 0.6308912739150724,
"eval_recall": 0.7901811805961426,
"eval_runtime": 7.1783,
"eval_samples_per_second": 627.45,
"eval_steps_per_second": 5.015,
"step": 150
},
{
"epoch": 1.42,
"eval_f1": 0.7199271355149306,
"eval_loss": 0.2445540428161621,
"eval_precision": 0.6488800281458895,
"eval_recall": 0.8084453535943893,
"eval_runtime": 7.1384,
"eval_samples_per_second": 630.95,
"eval_steps_per_second": 5.043,
"step": 200
},
{
"epoch": 1.77,
"eval_f1": 0.722252082773448,
"eval_loss": 0.22964715957641602,
"eval_precision": 0.6685323383084577,
"eval_recall": 0.7853594389246055,
"eval_runtime": 7.434,
"eval_samples_per_second": 605.866,
"eval_steps_per_second": 4.843,
"step": 250
},
{
"epoch": 2.13,
"eval_f1": 0.7319960997353392,
"eval_loss": 0.21758420765399933,
"eval_precision": 0.6993611924407772,
"eval_recall": 0.7678258328462887,
"eval_runtime": 7.1469,
"eval_samples_per_second": 630.207,
"eval_steps_per_second": 5.037,
"step": 300
},
{
"epoch": 2.48,
"eval_f1": 0.7406113537117905,
"eval_loss": 0.22185301780700684,
"eval_precision": 0.6854868797413257,
"eval_recall": 0.8053769725306839,
"eval_runtime": 7.1574,
"eval_samples_per_second": 629.281,
"eval_steps_per_second": 5.03,
"step": 350
},
{
"epoch": 2.84,
"eval_f1": 0.7412340309866812,
"eval_loss": 0.2164618819952011,
"eval_precision": 0.6928353658536586,
"eval_recall": 0.7969023962594973,
"eval_runtime": 7.1409,
"eval_samples_per_second": 630.735,
"eval_steps_per_second": 5.041,
"step": 400
},
{
"epoch": 3.19,
"eval_f1": 0.7499483221938952,
"eval_loss": 0.2220638245344162,
"eval_precision": 0.7096101186595384,
"eval_recall": 0.7951490356516657,
"eval_runtime": 7.4483,
"eval_samples_per_second": 604.703,
"eval_steps_per_second": 4.833,
"step": 450
},
{
"epoch": 3.55,
"learning_rate": 4.822695035460993e-06,
"loss": 0.2581,
"step": 500
},
{
"epoch": 3.55,
"eval_f1": 0.7439247452312516,
"eval_loss": 0.2487693727016449,
"eval_precision": 0.6727315689981096,
"eval_recall": 0.8319696084161309,
"eval_runtime": 7.1497,
"eval_samples_per_second": 629.957,
"eval_steps_per_second": 5.035,
"step": 500
},
{
"epoch": 3.9,
"eval_f1": 0.7555155958226711,
"eval_loss": 0.21624045073986053,
"eval_precision": 0.717268548916612,
"eval_recall": 0.7980713033313852,
"eval_runtime": 7.1536,
"eval_samples_per_second": 629.612,
"eval_steps_per_second": 5.032,
"step": 550
},
{
"epoch": 4.26,
"eval_f1": 0.7588671611598112,
"eval_loss": 0.23951853811740875,
"eval_precision": 0.7046080641121963,
"eval_recall": 0.8221800116890707,
"eval_runtime": 7.0397,
"eval_samples_per_second": 639.8,
"eval_steps_per_second": 5.114,
"step": 600
},
{
"epoch": 4.61,
"eval_f1": 0.7562726374711887,
"eval_loss": 0.24661774933338165,
"eval_precision": 0.688406665867402,
"eval_recall": 0.8389830508474576,
"eval_runtime": 7.1388,
"eval_samples_per_second": 630.916,
"eval_steps_per_second": 5.043,
"step": 650
},
{
"epoch": 4.96,
"eval_f1": 0.7577822311289245,
"eval_loss": 0.24025806784629822,
"eval_precision": 0.6980063992124046,
"eval_recall": 0.8287551139684395,
"eval_runtime": 7.1329,
"eval_samples_per_second": 631.441,
"eval_steps_per_second": 5.047,
"step": 700
},
{
"epoch": 5.32,
"eval_f1": 0.7517815517815518,
"eval_loss": 0.261866956949234,
"eval_precision": 0.6907355280871375,
"eval_recall": 0.8246639392168322,
"eval_runtime": 7.3254,
"eval_samples_per_second": 614.846,
"eval_steps_per_second": 4.914,
"step": 750
},
{
"epoch": 5.67,
"eval_f1": 0.7615306467998646,
"eval_loss": 0.2429821491241455,
"eval_precision": 0.7097588688296932,
"eval_recall": 0.8214494447691408,
"eval_runtime": 7.1352,
"eval_samples_per_second": 631.236,
"eval_steps_per_second": 5.045,
"step": 800
},
{
"epoch": 6.03,
"eval_f1": 0.7594460131773565,
"eval_loss": 0.24021703004837036,
"eval_precision": 0.7033623910336239,
"eval_recall": 0.8252483927527762,
"eval_runtime": 7.155,
"eval_samples_per_second": 629.489,
"eval_steps_per_second": 5.031,
"step": 850
},
{
"epoch": 6.38,
"eval_f1": 0.7594716019580233,
"eval_loss": 0.25845229625701904,
"eval_precision": 0.70182178708638,
"eval_recall": 0.8274400935125658,
"eval_runtime": 7.1743,
"eval_samples_per_second": 627.796,
"eval_steps_per_second": 5.018,
"step": 900
},
{
"epoch": 6.74,
"eval_f1": 0.7634940255459416,
"eval_loss": 0.2463415563106537,
"eval_precision": 0.7202643171806168,
"eval_recall": 0.8122443015780245,
"eval_runtime": 7.1315,
"eval_samples_per_second": 631.568,
"eval_steps_per_second": 5.048,
"step": 950
},
{
"epoch": 7.09,
"learning_rate": 4.645390070921986e-06,
"loss": 0.1517,
"step": 1000
},
{
"epoch": 7.09,
"eval_f1": 0.7641669494401085,
"eval_loss": 0.25761693716049194,
"eval_precision": 0.7134710429603346,
"eval_recall": 0.8226183518410286,
"eval_runtime": 7.1379,
"eval_samples_per_second": 630.995,
"eval_steps_per_second": 5.043,
"step": 1000
},
{
"epoch": 7.45,
"eval_f1": 0.7703476197124111,
"eval_loss": 0.2536332607269287,
"eval_precision": 0.7375033413525796,
"eval_recall": 0.8062536528345996,
"eval_runtime": 7.1375,
"eval_samples_per_second": 631.035,
"eval_steps_per_second": 5.044,
"step": 1050
}
],
"logging_steps": 500,
"max_steps": 14100,
"num_train_epochs": 100,
"save_steps": 50,
"total_flos": 6.408198647855674e+16,
"trial_name": null,
"trial_params": null
}
|