Training in progress, epoch 1
Browse files- config.json +440 -440
- model.safetensors +1 -1
- training_args.bin +1 -1
config.json
CHANGED
|
@@ -21,451 +21,451 @@
|
|
| 21 |
"hidden_activation": "gelu",
|
| 22 |
"hidden_size": 768,
|
| 23 |
"id2label": {
|
| 24 |
-
"0":
|
| 25 |
-
"1":
|
| 26 |
-
"10":
|
| 27 |
-
"100":
|
| 28 |
-
"101":
|
| 29 |
-
"102":
|
| 30 |
-
"103":
|
| 31 |
-
"104":
|
| 32 |
-
"105":
|
| 33 |
-
"106":
|
| 34 |
-
"107":
|
| 35 |
-
"108":
|
| 36 |
-
"109":
|
| 37 |
-
"11":
|
| 38 |
-
"110":
|
| 39 |
-
"111":
|
| 40 |
-
"112":
|
| 41 |
-
"113":
|
| 42 |
-
"114":
|
| 43 |
-
"115":
|
| 44 |
-
"116":
|
| 45 |
-
"117":
|
| 46 |
-
"118":
|
| 47 |
-
"119":
|
| 48 |
-
"12":
|
| 49 |
-
"120":
|
| 50 |
-
"121":
|
| 51 |
-
"122":
|
| 52 |
-
"123":
|
| 53 |
-
"124":
|
| 54 |
-
"125":
|
| 55 |
-
"126":
|
| 56 |
-
"127":
|
| 57 |
-
"128":
|
| 58 |
-
"129":
|
| 59 |
-
"13":
|
| 60 |
-
"130":
|
| 61 |
-
"131":
|
| 62 |
-
"132":
|
| 63 |
-
"133":
|
| 64 |
-
"134":
|
| 65 |
-
"135":
|
| 66 |
-
"136":
|
| 67 |
-
"137":
|
| 68 |
-
"138":
|
| 69 |
-
"139":
|
| 70 |
-
"14":
|
| 71 |
-
"140":
|
| 72 |
-
"141":
|
| 73 |
-
"142":
|
| 74 |
-
"143":
|
| 75 |
-
"144":
|
| 76 |
-
"145":
|
| 77 |
-
"146":
|
| 78 |
-
"147":
|
| 79 |
-
"148":
|
| 80 |
-
"149":
|
| 81 |
-
"15":
|
| 82 |
-
"150":
|
| 83 |
-
"151":
|
| 84 |
-
"152":
|
| 85 |
-
"153":
|
| 86 |
-
"154":
|
| 87 |
-
"155":
|
| 88 |
-
"156":
|
| 89 |
-
"157":
|
| 90 |
-
"158":
|
| 91 |
-
"159":
|
| 92 |
-
"16":
|
| 93 |
-
"160":
|
| 94 |
-
"161":
|
| 95 |
-
"162":
|
| 96 |
-
"163":
|
| 97 |
-
"164":
|
| 98 |
-
"165":
|
| 99 |
-
"166":
|
| 100 |
-
"167":
|
| 101 |
-
"168":
|
| 102 |
-
"169":
|
| 103 |
-
"17":
|
| 104 |
-
"170":
|
| 105 |
-
"171":
|
| 106 |
-
"172":
|
| 107 |
-
"173":
|
| 108 |
-
"174":
|
| 109 |
-
"175":
|
| 110 |
-
"176":
|
| 111 |
-
"177":
|
| 112 |
-
"178":
|
| 113 |
-
"179":
|
| 114 |
-
"18":
|
| 115 |
-
"180":
|
| 116 |
-
"181":
|
| 117 |
-
"182":
|
| 118 |
-
"183":
|
| 119 |
-
"184":
|
| 120 |
-
"185":
|
| 121 |
-
"186":
|
| 122 |
-
"187":
|
| 123 |
-
"188":
|
| 124 |
-
"189":
|
| 125 |
-
"19":
|
| 126 |
-
"190":
|
| 127 |
-
"191":
|
| 128 |
-
"192":
|
| 129 |
-
"193":
|
| 130 |
-
"194":
|
| 131 |
-
"195":
|
| 132 |
-
"196":
|
| 133 |
-
"197":
|
| 134 |
-
"198":
|
| 135 |
-
"199":
|
| 136 |
-
"2":
|
| 137 |
-
"20":
|
| 138 |
-
"200":
|
| 139 |
-
"201":
|
| 140 |
-
"202":
|
| 141 |
-
"203":
|
| 142 |
-
"204":
|
| 143 |
-
"205":
|
| 144 |
-
"206":
|
| 145 |
-
"207":
|
| 146 |
-
"208":
|
| 147 |
-
"209":
|
| 148 |
-
"21":
|
| 149 |
-
"210":
|
| 150 |
-
"211":
|
| 151 |
-
"212":
|
| 152 |
-
"213":
|
| 153 |
-
"214":
|
| 154 |
-
"215":
|
| 155 |
-
"216":
|
| 156 |
-
"217":
|
| 157 |
-
"218":
|
| 158 |
-
"219":
|
| 159 |
-
"22":
|
| 160 |
-
"220":
|
| 161 |
-
"221":
|
| 162 |
-
"222":
|
| 163 |
-
"223":
|
| 164 |
-
"224":
|
| 165 |
-
"225":
|
| 166 |
-
"226":
|
| 167 |
-
"227":
|
| 168 |
-
"228":
|
| 169 |
-
"229":
|
| 170 |
-
"23":
|
| 171 |
-
"230":
|
| 172 |
-
"231":
|
| 173 |
-
"232":
|
| 174 |
-
"233":
|
| 175 |
-
"234":
|
| 176 |
-
"235":
|
| 177 |
-
"236":
|
| 178 |
-
"237":
|
| 179 |
-
"238":
|
| 180 |
-
"239":
|
| 181 |
-
"24":
|
| 182 |
-
"240":
|
| 183 |
-
"241":
|
| 184 |
-
"242":
|
| 185 |
-
"243":
|
| 186 |
-
"244":
|
| 187 |
-
"245":
|
| 188 |
-
"246":
|
| 189 |
-
"247":
|
| 190 |
-
"248":
|
| 191 |
-
"249":
|
| 192 |
-
"25":
|
| 193 |
-
"250":
|
| 194 |
-
"251":
|
| 195 |
-
"252":
|
| 196 |
-
"253":
|
| 197 |
-
"254":
|
| 198 |
-
"255":
|
| 199 |
-
"256":
|
| 200 |
-
"257":
|
| 201 |
-
"258":
|
| 202 |
-
"259":
|
| 203 |
-
"26":
|
| 204 |
-
"260":
|
| 205 |
-
"261":
|
| 206 |
-
"262":
|
| 207 |
-
"263":
|
| 208 |
-
"264":
|
| 209 |
-
"265":
|
| 210 |
-
"266":
|
| 211 |
-
"267":
|
| 212 |
-
"268":
|
| 213 |
-
"269":
|
| 214 |
-
"27":
|
| 215 |
-
"270":
|
| 216 |
-
"271":
|
| 217 |
-
"272":
|
| 218 |
-
"273":
|
| 219 |
-
"274":
|
| 220 |
-
"275":
|
| 221 |
-
"276":
|
| 222 |
-
"277":
|
| 223 |
-
"278":
|
| 224 |
-
"279":
|
| 225 |
-
"28":
|
| 226 |
-
"280":
|
| 227 |
-
"281":
|
| 228 |
-
"282":
|
| 229 |
-
"283":
|
| 230 |
-
"284":
|
| 231 |
-
"29":
|
| 232 |
-
"3":
|
| 233 |
-
"30":
|
| 234 |
-
"31":
|
| 235 |
-
"32":
|
| 236 |
-
"33":
|
| 237 |
-
"34":
|
| 238 |
-
"35":
|
| 239 |
-
"36":
|
| 240 |
-
"37":
|
| 241 |
-
"38":
|
| 242 |
-
"39":
|
| 243 |
-
"4":
|
| 244 |
-
"40":
|
| 245 |
-
"41":
|
| 246 |
-
"42":
|
| 247 |
-
"43":
|
| 248 |
-
"44":
|
| 249 |
-
"45":
|
| 250 |
-
"46":
|
| 251 |
-
"47":
|
| 252 |
-
"48":
|
| 253 |
-
"49":
|
| 254 |
-
"5":
|
| 255 |
-
"50":
|
| 256 |
-
"51":
|
| 257 |
-
"52":
|
| 258 |
-
"53":
|
| 259 |
-
"54":
|
| 260 |
-
"55":
|
| 261 |
-
"56":
|
| 262 |
-
"57":
|
| 263 |
-
"58":
|
| 264 |
-
"59":
|
| 265 |
-
"6":
|
| 266 |
-
"60":
|
| 267 |
-
"61":
|
| 268 |
-
"62":
|
| 269 |
-
"63":
|
| 270 |
-
"64":
|
| 271 |
-
"65":
|
| 272 |
-
"66":
|
| 273 |
-
"67":
|
| 274 |
-
"68":
|
| 275 |
-
"69":
|
| 276 |
-
"7":
|
| 277 |
-
"70":
|
| 278 |
-
"71":
|
| 279 |
-
"72":
|
| 280 |
-
"73":
|
| 281 |
-
"74":
|
| 282 |
-
"75":
|
| 283 |
-
"76":
|
| 284 |
-
"77":
|
| 285 |
-
"78":
|
| 286 |
-
"79":
|
| 287 |
-
"8":
|
| 288 |
-
"80":
|
| 289 |
-
"81":
|
| 290 |
-
"82":
|
| 291 |
-
"83":
|
| 292 |
-
"84":
|
| 293 |
-
"85":
|
| 294 |
-
"86":
|
| 295 |
-
"87":
|
| 296 |
-
"88":
|
| 297 |
-
"89":
|
| 298 |
-
"9":
|
| 299 |
-
"90":
|
| 300 |
-
"91":
|
| 301 |
-
"92":
|
| 302 |
-
"93":
|
| 303 |
-
"94":
|
| 304 |
-
"95":
|
| 305 |
-
"96":
|
| 306 |
-
"97":
|
| 307 |
-
"98":
|
| 308 |
-
"99":
|
| 309 |
},
|
| 310 |
"initializer_cutoff_factor": 2.0,
|
| 311 |
"initializer_range": 0.02,
|
| 312 |
"intermediate_size": 1152,
|
| 313 |
"label2id": {
|
| 314 |
-
"
|
| 315 |
-
"
|
| 316 |
-
"
|
| 317 |
-
"
|
| 318 |
-
"
|
| 319 |
-
"
|
| 320 |
-
"
|
| 321 |
-
"
|
| 322 |
-
"
|
| 323 |
-
"
|
| 324 |
-
"
|
| 325 |
-
"
|
| 326 |
-
"
|
| 327 |
-
"
|
| 328 |
-
"
|
| 329 |
-
"
|
| 330 |
-
"
|
| 331 |
-
"
|
| 332 |
-
"
|
| 333 |
-
"
|
| 334 |
-
"
|
| 335 |
-
"
|
| 336 |
-
"
|
| 337 |
-
"
|
| 338 |
-
"
|
| 339 |
-
"
|
| 340 |
-
"
|
| 341 |
-
"
|
| 342 |
-
"
|
| 343 |
-
"
|
| 344 |
-
"
|
| 345 |
-
"
|
| 346 |
-
"
|
| 347 |
-
"
|
| 348 |
-
"
|
| 349 |
-
"
|
| 350 |
-
"
|
| 351 |
-
"
|
| 352 |
-
"
|
| 353 |
-
"
|
| 354 |
-
"
|
| 355 |
-
"
|
| 356 |
-
"
|
| 357 |
-
"
|
| 358 |
-
"
|
| 359 |
-
"
|
| 360 |
-
"
|
| 361 |
-
"
|
| 362 |
-
"
|
| 363 |
-
"
|
| 364 |
-
"
|
| 365 |
-
"
|
| 366 |
-
"
|
| 367 |
-
"
|
| 368 |
-
"
|
| 369 |
-
"
|
| 370 |
-
"
|
| 371 |
-
"
|
| 372 |
-
"
|
| 373 |
-
"
|
| 374 |
-
"
|
| 375 |
-
"
|
| 376 |
-
"
|
| 377 |
-
"
|
| 378 |
-
"
|
| 379 |
-
"
|
| 380 |
-
"
|
| 381 |
-
"
|
| 382 |
-
"
|
| 383 |
-
"
|
| 384 |
-
"
|
| 385 |
-
"
|
| 386 |
-
"
|
| 387 |
-
"
|
| 388 |
-
"
|
| 389 |
-
"
|
| 390 |
-
"
|
| 391 |
-
"
|
| 392 |
-
"
|
| 393 |
-
"
|
| 394 |
-
"
|
| 395 |
-
"
|
| 396 |
-
"
|
| 397 |
-
"
|
| 398 |
-
"
|
| 399 |
-
"
|
| 400 |
-
"
|
| 401 |
-
"
|
| 402 |
-
"
|
| 403 |
-
"
|
| 404 |
-
"
|
| 405 |
-
"
|
| 406 |
-
"
|
| 407 |
-
"
|
| 408 |
-
"
|
| 409 |
-
"
|
| 410 |
-
"
|
| 411 |
-
"
|
| 412 |
-
"
|
| 413 |
-
"
|
| 414 |
-
"
|
| 415 |
-
"
|
| 416 |
-
"
|
| 417 |
-
"
|
| 418 |
-
"
|
| 419 |
-
"
|
| 420 |
-
"
|
| 421 |
-
"
|
| 422 |
-
"
|
| 423 |
-
"
|
| 424 |
-
"
|
| 425 |
-
"
|
| 426 |
-
"
|
| 427 |
-
"
|
| 428 |
-
"
|
| 429 |
-
"
|
| 430 |
-
"
|
| 431 |
-
"
|
| 432 |
-
"
|
| 433 |
-
"
|
| 434 |
-
"
|
| 435 |
-
"
|
| 436 |
-
"
|
| 437 |
-
"
|
| 438 |
-
"
|
| 439 |
-
"
|
| 440 |
-
"
|
| 441 |
-
"
|
| 442 |
-
"
|
| 443 |
-
"
|
| 444 |
-
"
|
| 445 |
-
"
|
| 446 |
-
"
|
| 447 |
-
"
|
| 448 |
-
"
|
| 449 |
-
"
|
| 450 |
-
"
|
| 451 |
-
"
|
| 452 |
-
"
|
| 453 |
-
"
|
| 454 |
-
"
|
| 455 |
-
"
|
| 456 |
-
"
|
| 457 |
-
"
|
| 458 |
-
"
|
| 459 |
-
"
|
| 460 |
-
"
|
| 461 |
-
"
|
| 462 |
-
"
|
| 463 |
-
"
|
| 464 |
-
"
|
| 465 |
-
"
|
| 466 |
-
"
|
| 467 |
-
"
|
| 468 |
-
"
|
| 469 |
},
|
| 470 |
"layer_norm_eps": 1e-05,
|
| 471 |
"local_attention": 128,
|
|
|
|
| 21 |
"hidden_activation": "gelu",
|
| 22 |
"hidden_size": 768,
|
| 23 |
"id2label": {
|
| 24 |
+
"0": 7,
|
| 25 |
+
"1": 17,
|
| 26 |
+
"10": 58,
|
| 27 |
+
"100": 231,
|
| 28 |
+
"101": 232,
|
| 29 |
+
"102": 233,
|
| 30 |
+
"103": 234,
|
| 31 |
+
"104": 235,
|
| 32 |
+
"105": 236,
|
| 33 |
+
"106": 237,
|
| 34 |
+
"107": 238,
|
| 35 |
+
"108": 239,
|
| 36 |
+
"109": 240,
|
| 37 |
+
"11": 64,
|
| 38 |
+
"110": 241,
|
| 39 |
+
"111": 242,
|
| 40 |
+
"112": 243,
|
| 41 |
+
"113": 244,
|
| 42 |
+
"114": 245,
|
| 43 |
+
"115": 246,
|
| 44 |
+
"116": 247,
|
| 45 |
+
"117": 248,
|
| 46 |
+
"118": 249,
|
| 47 |
+
"119": 250,
|
| 48 |
+
"12": 67,
|
| 49 |
+
"120": 251,
|
| 50 |
+
"121": 252,
|
| 51 |
+
"122": 253,
|
| 52 |
+
"123": 254,
|
| 53 |
+
"124": 255,
|
| 54 |
+
"125": 256,
|
| 55 |
+
"126": 257,
|
| 56 |
+
"127": 258,
|
| 57 |
+
"128": 259,
|
| 58 |
+
"129": 260,
|
| 59 |
+
"13": 83,
|
| 60 |
+
"130": 261,
|
| 61 |
+
"131": 262,
|
| 62 |
+
"132": 263,
|
| 63 |
+
"133": 264,
|
| 64 |
+
"134": 265,
|
| 65 |
+
"135": 266,
|
| 66 |
+
"136": 267,
|
| 67 |
+
"137": 268,
|
| 68 |
+
"138": 269,
|
| 69 |
+
"139": 270,
|
| 70 |
+
"14": 91,
|
| 71 |
+
"140": 271,
|
| 72 |
+
"141": 272,
|
| 73 |
+
"142": 273,
|
| 74 |
+
"143": 274,
|
| 75 |
+
"144": 275,
|
| 76 |
+
"145": 276,
|
| 77 |
+
"146": 277,
|
| 78 |
+
"147": 278,
|
| 79 |
+
"148": 279,
|
| 80 |
+
"149": 280,
|
| 81 |
+
"15": 100,
|
| 82 |
+
"150": 281,
|
| 83 |
+
"151": 282,
|
| 84 |
+
"152": 283,
|
| 85 |
+
"153": 284,
|
| 86 |
+
"154": 154,
|
| 87 |
+
"155": 155,
|
| 88 |
+
"156": 156,
|
| 89 |
+
"157": 157,
|
| 90 |
+
"158": 158,
|
| 91 |
+
"159": 159,
|
| 92 |
+
"16": 102,
|
| 93 |
+
"160": 160,
|
| 94 |
+
"161": 161,
|
| 95 |
+
"162": 162,
|
| 96 |
+
"163": 163,
|
| 97 |
+
"164": 164,
|
| 98 |
+
"165": 165,
|
| 99 |
+
"166": 166,
|
| 100 |
+
"167": 167,
|
| 101 |
+
"168": 168,
|
| 102 |
+
"169": 169,
|
| 103 |
+
"17": 126,
|
| 104 |
+
"170": 170,
|
| 105 |
+
"171": 171,
|
| 106 |
+
"172": 172,
|
| 107 |
+
"173": 173,
|
| 108 |
+
"174": 174,
|
| 109 |
+
"175": 175,
|
| 110 |
+
"176": 176,
|
| 111 |
+
"177": 177,
|
| 112 |
+
"178": 178,
|
| 113 |
+
"179": 179,
|
| 114 |
+
"18": 127,
|
| 115 |
+
"180": 180,
|
| 116 |
+
"181": 181,
|
| 117 |
+
"182": 182,
|
| 118 |
+
"183": 183,
|
| 119 |
+
"184": 184,
|
| 120 |
+
"185": 185,
|
| 121 |
+
"186": 186,
|
| 122 |
+
"187": 187,
|
| 123 |
+
"188": 188,
|
| 124 |
+
"189": 189,
|
| 125 |
+
"19": 128,
|
| 126 |
+
"190": 190,
|
| 127 |
+
"191": 191,
|
| 128 |
+
"192": 192,
|
| 129 |
+
"193": 193,
|
| 130 |
+
"194": 194,
|
| 131 |
+
"195": 195,
|
| 132 |
+
"196": 196,
|
| 133 |
+
"197": 197,
|
| 134 |
+
"198": 198,
|
| 135 |
+
"199": 199,
|
| 136 |
+
"2": 31,
|
| 137 |
+
"20": 131,
|
| 138 |
+
"200": 200,
|
| 139 |
+
"201": 201,
|
| 140 |
+
"202": 202,
|
| 141 |
+
"203": 203,
|
| 142 |
+
"204": 204,
|
| 143 |
+
"205": 205,
|
| 144 |
+
"206": 206,
|
| 145 |
+
"207": 207,
|
| 146 |
+
"208": 208,
|
| 147 |
+
"209": 209,
|
| 148 |
+
"21": 135,
|
| 149 |
+
"210": 210,
|
| 150 |
+
"211": 211,
|
| 151 |
+
"212": 212,
|
| 152 |
+
"213": 213,
|
| 153 |
+
"214": 214,
|
| 154 |
+
"215": 215,
|
| 155 |
+
"216": 216,
|
| 156 |
+
"217": 217,
|
| 157 |
+
"218": 218,
|
| 158 |
+
"219": 219,
|
| 159 |
+
"22": 138,
|
| 160 |
+
"220": 220,
|
| 161 |
+
"221": 221,
|
| 162 |
+
"222": 222,
|
| 163 |
+
"223": 223,
|
| 164 |
+
"224": 224,
|
| 165 |
+
"225": 225,
|
| 166 |
+
"226": 226,
|
| 167 |
+
"227": 227,
|
| 168 |
+
"228": 228,
|
| 169 |
+
"229": 229,
|
| 170 |
+
"23": 153,
|
| 171 |
+
"230": 230,
|
| 172 |
+
"231": 231,
|
| 173 |
+
"232": 232,
|
| 174 |
+
"233": 233,
|
| 175 |
+
"234": 234,
|
| 176 |
+
"235": 235,
|
| 177 |
+
"236": 236,
|
| 178 |
+
"237": 237,
|
| 179 |
+
"238": 238,
|
| 180 |
+
"239": 239,
|
| 181 |
+
"24": 154,
|
| 182 |
+
"240": 240,
|
| 183 |
+
"241": 241,
|
| 184 |
+
"242": 242,
|
| 185 |
+
"243": 243,
|
| 186 |
+
"244": 244,
|
| 187 |
+
"245": 245,
|
| 188 |
+
"246": 246,
|
| 189 |
+
"247": 247,
|
| 190 |
+
"248": 248,
|
| 191 |
+
"249": 249,
|
| 192 |
+
"25": 155,
|
| 193 |
+
"250": 250,
|
| 194 |
+
"251": 251,
|
| 195 |
+
"252": 252,
|
| 196 |
+
"253": 253,
|
| 197 |
+
"254": 254,
|
| 198 |
+
"255": 255,
|
| 199 |
+
"256": 256,
|
| 200 |
+
"257": 257,
|
| 201 |
+
"258": 258,
|
| 202 |
+
"259": 259,
|
| 203 |
+
"26": 156,
|
| 204 |
+
"260": 260,
|
| 205 |
+
"261": 261,
|
| 206 |
+
"262": 262,
|
| 207 |
+
"263": 263,
|
| 208 |
+
"264": 264,
|
| 209 |
+
"265": 265,
|
| 210 |
+
"266": 266,
|
| 211 |
+
"267": 267,
|
| 212 |
+
"268": 268,
|
| 213 |
+
"269": 269,
|
| 214 |
+
"27": 157,
|
| 215 |
+
"270": 270,
|
| 216 |
+
"271": 271,
|
| 217 |
+
"272": 272,
|
| 218 |
+
"273": 273,
|
| 219 |
+
"274": 274,
|
| 220 |
+
"275": 275,
|
| 221 |
+
"276": 276,
|
| 222 |
+
"277": 277,
|
| 223 |
+
"278": 278,
|
| 224 |
+
"279": 279,
|
| 225 |
+
"28": 158,
|
| 226 |
+
"280": 280,
|
| 227 |
+
"281": 281,
|
| 228 |
+
"282": 282,
|
| 229 |
+
"283": 283,
|
| 230 |
+
"284": 284,
|
| 231 |
+
"29": 159,
|
| 232 |
+
"3": 38,
|
| 233 |
+
"30": 160,
|
| 234 |
+
"31": 161,
|
| 235 |
+
"32": 162,
|
| 236 |
+
"33": 163,
|
| 237 |
+
"34": 164,
|
| 238 |
+
"35": 165,
|
| 239 |
+
"36": 166,
|
| 240 |
+
"37": 167,
|
| 241 |
+
"38": 168,
|
| 242 |
+
"39": 169,
|
| 243 |
+
"4": 39,
|
| 244 |
+
"40": 171,
|
| 245 |
+
"41": 172,
|
| 246 |
+
"42": 173,
|
| 247 |
+
"43": 174,
|
| 248 |
+
"44": 175,
|
| 249 |
+
"45": 176,
|
| 250 |
+
"46": 177,
|
| 251 |
+
"47": 178,
|
| 252 |
+
"48": 179,
|
| 253 |
+
"49": 180,
|
| 254 |
+
"5": 40,
|
| 255 |
+
"50": 181,
|
| 256 |
+
"51": 182,
|
| 257 |
+
"52": 183,
|
| 258 |
+
"53": 184,
|
| 259 |
+
"54": 185,
|
| 260 |
+
"55": 186,
|
| 261 |
+
"56": 187,
|
| 262 |
+
"57": 188,
|
| 263 |
+
"58": 189,
|
| 264 |
+
"59": 190,
|
| 265 |
+
"6": 43,
|
| 266 |
+
"60": 191,
|
| 267 |
+
"61": 192,
|
| 268 |
+
"62": 193,
|
| 269 |
+
"63": 194,
|
| 270 |
+
"64": 195,
|
| 271 |
+
"65": 196,
|
| 272 |
+
"66": 197,
|
| 273 |
+
"67": 198,
|
| 274 |
+
"68": 199,
|
| 275 |
+
"69": 200,
|
| 276 |
+
"7": 48,
|
| 277 |
+
"70": 201,
|
| 278 |
+
"71": 202,
|
| 279 |
+
"72": 203,
|
| 280 |
+
"73": 204,
|
| 281 |
+
"74": 205,
|
| 282 |
+
"75": 206,
|
| 283 |
+
"76": 207,
|
| 284 |
+
"77": 208,
|
| 285 |
+
"78": 209,
|
| 286 |
+
"79": 210,
|
| 287 |
+
"8": 53,
|
| 288 |
+
"80": 211,
|
| 289 |
+
"81": 212,
|
| 290 |
+
"82": 213,
|
| 291 |
+
"83": 214,
|
| 292 |
+
"84": 215,
|
| 293 |
+
"85": 216,
|
| 294 |
+
"86": 217,
|
| 295 |
+
"87": 218,
|
| 296 |
+
"88": 219,
|
| 297 |
+
"89": 220,
|
| 298 |
+
"9": 56,
|
| 299 |
+
"90": 221,
|
| 300 |
+
"91": 222,
|
| 301 |
+
"92": 223,
|
| 302 |
+
"93": 224,
|
| 303 |
+
"94": 225,
|
| 304 |
+
"95": 226,
|
| 305 |
+
"96": 227,
|
| 306 |
+
"97": 228,
|
| 307 |
+
"98": 229,
|
| 308 |
+
"99": 230
|
| 309 |
},
|
| 310 |
"initializer_cutoff_factor": 2.0,
|
| 311 |
"initializer_range": 0.02,
|
| 312 |
"intermediate_size": 1152,
|
| 313 |
"label2id": {
|
| 314 |
+
"7": "0",
|
| 315 |
+
"17": "1",
|
| 316 |
+
"31": "2",
|
| 317 |
+
"38": "3",
|
| 318 |
+
"39": "4",
|
| 319 |
+
"40": "5",
|
| 320 |
+
"43": "6",
|
| 321 |
+
"48": "7",
|
| 322 |
+
"53": "8",
|
| 323 |
+
"56": "9",
|
| 324 |
+
"58": "10",
|
| 325 |
+
"64": "11",
|
| 326 |
+
"67": "12",
|
| 327 |
+
"83": "13",
|
| 328 |
+
"91": "14",
|
| 329 |
+
"100": "15",
|
| 330 |
+
"102": "16",
|
| 331 |
+
"126": "17",
|
| 332 |
+
"127": "18",
|
| 333 |
+
"128": "19",
|
| 334 |
+
"131": "20",
|
| 335 |
+
"135": "21",
|
| 336 |
+
"138": "22",
|
| 337 |
+
"153": "23",
|
| 338 |
+
"154": "154",
|
| 339 |
+
"155": "155",
|
| 340 |
+
"156": "156",
|
| 341 |
+
"157": "157",
|
| 342 |
+
"158": "158",
|
| 343 |
+
"159": "159",
|
| 344 |
+
"160": "160",
|
| 345 |
+
"161": "161",
|
| 346 |
+
"162": "162",
|
| 347 |
+
"163": "163",
|
| 348 |
+
"164": "164",
|
| 349 |
+
"165": "165",
|
| 350 |
+
"166": "166",
|
| 351 |
+
"167": "167",
|
| 352 |
+
"168": "168",
|
| 353 |
+
"169": "169",
|
| 354 |
+
"170": "170",
|
| 355 |
+
"171": "171",
|
| 356 |
+
"172": "172",
|
| 357 |
+
"173": "173",
|
| 358 |
+
"174": "174",
|
| 359 |
+
"175": "175",
|
| 360 |
+
"176": "176",
|
| 361 |
+
"177": "177",
|
| 362 |
+
"178": "178",
|
| 363 |
+
"179": "179",
|
| 364 |
+
"180": "180",
|
| 365 |
+
"181": "181",
|
| 366 |
+
"182": "182",
|
| 367 |
+
"183": "183",
|
| 368 |
+
"184": "184",
|
| 369 |
+
"185": "185",
|
| 370 |
+
"186": "186",
|
| 371 |
+
"187": "187",
|
| 372 |
+
"188": "188",
|
| 373 |
+
"189": "189",
|
| 374 |
+
"190": "190",
|
| 375 |
+
"191": "191",
|
| 376 |
+
"192": "192",
|
| 377 |
+
"193": "193",
|
| 378 |
+
"194": "194",
|
| 379 |
+
"195": "195",
|
| 380 |
+
"196": "196",
|
| 381 |
+
"197": "197",
|
| 382 |
+
"198": "198",
|
| 383 |
+
"199": "199",
|
| 384 |
+
"200": "200",
|
| 385 |
+
"201": "201",
|
| 386 |
+
"202": "202",
|
| 387 |
+
"203": "203",
|
| 388 |
+
"204": "204",
|
| 389 |
+
"205": "205",
|
| 390 |
+
"206": "206",
|
| 391 |
+
"207": "207",
|
| 392 |
+
"208": "208",
|
| 393 |
+
"209": "209",
|
| 394 |
+
"210": "210",
|
| 395 |
+
"211": "211",
|
| 396 |
+
"212": "212",
|
| 397 |
+
"213": "213",
|
| 398 |
+
"214": "214",
|
| 399 |
+
"215": "215",
|
| 400 |
+
"216": "216",
|
| 401 |
+
"217": "217",
|
| 402 |
+
"218": "218",
|
| 403 |
+
"219": "219",
|
| 404 |
+
"220": "220",
|
| 405 |
+
"221": "221",
|
| 406 |
+
"222": "222",
|
| 407 |
+
"223": "223",
|
| 408 |
+
"224": "224",
|
| 409 |
+
"225": "225",
|
| 410 |
+
"226": "226",
|
| 411 |
+
"227": "227",
|
| 412 |
+
"228": "228",
|
| 413 |
+
"229": "229",
|
| 414 |
+
"230": "230",
|
| 415 |
+
"231": "231",
|
| 416 |
+
"232": "232",
|
| 417 |
+
"233": "233",
|
| 418 |
+
"234": "234",
|
| 419 |
+
"235": "235",
|
| 420 |
+
"236": "236",
|
| 421 |
+
"237": "237",
|
| 422 |
+
"238": "238",
|
| 423 |
+
"239": "239",
|
| 424 |
+
"240": "240",
|
| 425 |
+
"241": "241",
|
| 426 |
+
"242": "242",
|
| 427 |
+
"243": "243",
|
| 428 |
+
"244": "244",
|
| 429 |
+
"245": "245",
|
| 430 |
+
"246": "246",
|
| 431 |
+
"247": "247",
|
| 432 |
+
"248": "248",
|
| 433 |
+
"249": "249",
|
| 434 |
+
"250": "250",
|
| 435 |
+
"251": "251",
|
| 436 |
+
"252": "252",
|
| 437 |
+
"253": "253",
|
| 438 |
+
"254": "254",
|
| 439 |
+
"255": "255",
|
| 440 |
+
"256": "256",
|
| 441 |
+
"257": "257",
|
| 442 |
+
"258": "258",
|
| 443 |
+
"259": "259",
|
| 444 |
+
"260": "260",
|
| 445 |
+
"261": "261",
|
| 446 |
+
"262": "262",
|
| 447 |
+
"263": "263",
|
| 448 |
+
"264": "264",
|
| 449 |
+
"265": "265",
|
| 450 |
+
"266": "266",
|
| 451 |
+
"267": "267",
|
| 452 |
+
"268": "268",
|
| 453 |
+
"269": "269",
|
| 454 |
+
"270": "270",
|
| 455 |
+
"271": "271",
|
| 456 |
+
"272": "272",
|
| 457 |
+
"273": "273",
|
| 458 |
+
"274": "274",
|
| 459 |
+
"275": "275",
|
| 460 |
+
"276": "276",
|
| 461 |
+
"277": "277",
|
| 462 |
+
"278": "278",
|
| 463 |
+
"279": "279",
|
| 464 |
+
"280": "280",
|
| 465 |
+
"281": "281",
|
| 466 |
+
"282": "282",
|
| 467 |
+
"283": "283",
|
| 468 |
+
"284": "284"
|
| 469 |
},
|
| 470 |
"layer_norm_eps": 1e-05,
|
| 471 |
"local_attention": 128,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 599310308
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe6037a95b51ab55eca90629e34cd687da59993e01ed8b9f1cb15075868a4514
|
| 3 |
size 599310308
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5905
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ad0181d394bb3507dc8d789366400bf5358f02e775c63324094924065e12b79
|
| 3 |
size 5905
|