Upload 9 files
Browse files- models/ud_ewt_gum_pud_20250611/README.md +341 -0
- models/ud_ewt_gum_pud_20250611/added_tokens.json +3 -0
- models/ud_ewt_gum_pud_20250611/config.json +254 -0
- models/ud_ewt_gum_pud_20250611/model.safetensors +3 -0
- models/ud_ewt_gum_pud_20250611/special_tokens_map.json +15 -0
- models/ud_ewt_gum_pud_20250611/spm.model +3 -0
- models/ud_ewt_gum_pud_20250611/tokenizer.json +0 -0
- models/ud_ewt_gum_pud_20250611/tokenizer_config.json +60 -0
- models/ud_ewt_gum_pud_20250611/training_args.bin +3 -0
models/ud_ewt_gum_pud_20250611/README.md
ADDED
|
@@ -0,0 +1,341 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
## Test Results
|
| 2 |
+
|
| 3 |
+
```text
|
| 4 |
+
----- xpos classification report -----
|
| 5 |
+
precision recall f1-score support
|
| 6 |
+
|
| 7 |
+
$ 0.91 1.00 0.95 49
|
| 8 |
+
'' 1.00 0.99 0.99 228
|
| 9 |
+
, 0.97 0.99 0.98 2403
|
| 10 |
+
-LRB- 1.00 1.00 1.00 190
|
| 11 |
+
-RRB- 1.00 1.00 1.00 190
|
| 12 |
+
. 1.00 1.00 1.00 2860
|
| 13 |
+
: 0.89 0.76 0.82 245
|
| 14 |
+
ADD 0.93 0.83 0.88 84
|
| 15 |
+
AFX 0.00 0.00 0.00 4
|
| 16 |
+
CC 1.00 1.00 1.00 1644
|
| 17 |
+
CD 0.97 0.98 0.97 1164
|
| 18 |
+
DT 1.00 1.00 1.00 4862
|
| 19 |
+
EX 0.98 1.00 0.99 94
|
| 20 |
+
FW 0.75 0.18 0.30 49
|
| 21 |
+
HYPH 0.98 0.95 0.96 172
|
| 22 |
+
IN 0.99 0.99 0.99 6100
|
| 23 |
+
JJ 0.94 0.93 0.94 3612
|
| 24 |
+
JJR 0.88 0.94 0.91 120
|
| 25 |
+
JJS 0.96 0.92 0.94 128
|
| 26 |
+
LS 1.00 0.67 0.80 3
|
| 27 |
+
MD 1.00 1.00 1.00 572
|
| 28 |
+
NFP 0.95 0.98 0.96 91
|
| 29 |
+
NN 0.96 0.92 0.94 7636
|
| 30 |
+
NNP 0.87 0.94 0.90 4237
|
| 31 |
+
NNPS 0.67 0.84 0.75 160
|
| 32 |
+
NNS 0.99 0.97 0.98 2785
|
| 33 |
+
PDT 0.94 0.94 0.94 32
|
| 34 |
+
POS 0.99 0.99 0.99 168
|
| 35 |
+
PRP 1.00 1.00 1.00 1941
|
| 36 |
+
PRP$ 0.99 1.00 0.99 685
|
| 37 |
+
RB 0.94 0.94 0.94 2163
|
| 38 |
+
RBR 0.81 0.93 0.87 80
|
| 39 |
+
RBS 0.85 0.91 0.88 56
|
| 40 |
+
RP 0.82 0.87 0.85 182
|
| 41 |
+
SYM 0.68 0.64 0.66 42
|
| 42 |
+
TO 0.99 0.99 0.99 718
|
| 43 |
+
UH 0.90 0.95 0.92 99
|
| 44 |
+
VB 0.98 0.98 0.98 1765
|
| 45 |
+
VBD 0.99 0.99 0.99 1630
|
| 46 |
+
VBG 0.96 0.96 0.96 837
|
| 47 |
+
VBN 0.95 0.96 0.95 1217
|
| 48 |
+
VBP 0.98 0.97 0.98 1073
|
| 49 |
+
VBZ 0.99 1.00 1.00 1101
|
| 50 |
+
WDT 0.95 0.98 0.97 291
|
| 51 |
+
WP 0.98 0.98 0.98 170
|
| 52 |
+
WP$ 0.00 0.00 0.00 7
|
| 53 |
+
WRB 0.99 0.99 0.99 192
|
| 54 |
+
`` 0.99 1.00 0.99 227
|
| 55 |
+
|
| 56 |
+
accuracy 0.97 54358
|
| 57 |
+
macro avg 0.90 0.89 0.89 54358
|
| 58 |
+
weighted avg 0.97 0.97 0.97 54358
|
| 59 |
+
|
| 60 |
+
----- deprel classification report -----
|
| 61 |
+
precision recall f1-score support
|
| 62 |
+
|
| 63 |
+
acl 0.86 0.81 0.84 469
|
| 64 |
+
acl:relcl 0.92 0.93 0.92 497
|
| 65 |
+
advcl 0.85 0.85 0.85 794
|
| 66 |
+
advmod 0.93 0.92 0.93 2244
|
| 67 |
+
amod 0.94 0.93 0.94 3167
|
| 68 |
+
appos 0.63 0.78 0.70 405
|
| 69 |
+
aux 0.99 0.99 0.99 1165
|
| 70 |
+
aux:pass 0.96 0.97 0.96 499
|
| 71 |
+
case 0.98 0.99 0.98 5459
|
| 72 |
+
cc 0.99 0.99 0.99 1653
|
| 73 |
+
cc:preconj 0.90 0.87 0.88 30
|
| 74 |
+
ccomp 0.77 0.78 0.77 388
|
| 75 |
+
compound 0.85 0.85 0.85 2437
|
| 76 |
+
compound:prt 0.84 0.91 0.87 180
|
| 77 |
+
conj 0.93 0.95 0.94 1901
|
| 78 |
+
cop 0.93 0.97 0.95 961
|
| 79 |
+
csubj 0.63 0.61 0.62 59
|
| 80 |
+
csubj:pass 0.00 0.00 0.00 5
|
| 81 |
+
det 1.00 1.00 1.00 4643
|
| 82 |
+
det:predet 0.84 0.84 0.84 32
|
| 83 |
+
discourse 0.91 0.85 0.88 102
|
| 84 |
+
expl 0.85 0.96 0.90 142
|
| 85 |
+
fixed 0.86 0.77 0.81 190
|
| 86 |
+
flat 0.86 0.83 0.84 589
|
| 87 |
+
iobj 0.83 0.74 0.78 53
|
| 88 |
+
list 0.66 0.43 0.52 251
|
| 89 |
+
mark 0.93 0.97 0.95 1542
|
| 90 |
+
nmod 0.89 0.91 0.90 2373
|
| 91 |
+
nmod:npmod 0.33 0.02 0.03 62
|
| 92 |
+
nmod:poss 0.99 0.99 0.99 855
|
| 93 |
+
nmod:tmod 0.67 0.51 0.58 106
|
| 94 |
+
nsubj 0.97 0.96 0.96 3655
|
| 95 |
+
nsubj:pass 0.92 0.95 0.93 438
|
| 96 |
+
nummod 0.81 0.93 0.86 616
|
| 97 |
+
obj 0.97 0.97 0.97 2418
|
| 98 |
+
obl 0.92 0.89 0.90 2747
|
| 99 |
+
obl:npmod 0.54 0.53 0.54 73
|
| 100 |
+
obl:tmod 0.55 0.80 0.65 82
|
| 101 |
+
parataxis 0.71 0.47 0.57 271
|
| 102 |
+
punct 1.00 1.00 1.00 6547
|
| 103 |
+
root 0.95 0.94 0.95 3558
|
| 104 |
+
vocative 0.71 0.67 0.69 18
|
| 105 |
+
xcomp 0.87 0.87 0.87 682
|
| 106 |
+
|
| 107 |
+
accuracy 0.94 54358
|
| 108 |
+
macro avg 0.82 0.81 0.81 54358
|
| 109 |
+
weighted avg 0.94 0.94 0.94 54358
|
| 110 |
+
|
| 111 |
+
----- pos classification report -----
|
| 112 |
+
precision recall f1-score support
|
| 113 |
+
|
| 114 |
+
ADJ 0.94 0.93 0.94 3866
|
| 115 |
+
ADP 0.98 0.98 0.98 5528
|
| 116 |
+
ADV 0.93 0.90 0.91 2230
|
| 117 |
+
AUX 0.98 0.99 0.98 2640
|
| 118 |
+
CCONJ 1.00 1.00 1.00 1643
|
| 119 |
+
DET 0.99 0.99 0.99 4731
|
| 120 |
+
INTJ 0.90 0.93 0.91 101
|
| 121 |
+
NOUN 0.97 0.95 0.96 10146
|
| 122 |
+
NUM 0.97 0.98 0.98 1161
|
| 123 |
+
PART 0.96 0.99 0.97 1069
|
| 124 |
+
PRON 0.98 0.99 0.98 3400
|
| 125 |
+
PROPN 0.91 0.95 0.93 4585
|
| 126 |
+
PUNCT 1.00 1.00 1.00 6584
|
| 127 |
+
SCONJ 0.88 0.95 0.91 838
|
| 128 |
+
SYM 0.87 0.86 0.87 144
|
| 129 |
+
VERB 0.98 0.97 0.97 5555
|
| 130 |
+
X 0.85 0.60 0.70 137
|
| 131 |
+
|
| 132 |
+
accuracy 0.97 54358
|
| 133 |
+
macro avg 0.95 0.94 0.94 54358
|
| 134 |
+
weighted avg 0.97 0.97 0.97 54358
|
| 135 |
+
|
| 136 |
+
----- Case classification report -----
|
| 137 |
+
precision recall f1-score support
|
| 138 |
+
|
| 139 |
+
Acc 0.86 0.98 0.92 377
|
| 140 |
+
Nom 1.00 0.96 0.98 1554
|
| 141 |
+
X 1.00 1.00 1.00 52427
|
| 142 |
+
|
| 143 |
+
accuracy 1.00 54358
|
| 144 |
+
macro avg 0.95 0.98 0.97 54358
|
| 145 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 146 |
+
|
| 147 |
+
----- Definite classification report -----
|
| 148 |
+
precision recall f1-score support
|
| 149 |
+
|
| 150 |
+
Def 1.00 1.00 1.00 2947
|
| 151 |
+
Ind 1.00 1.00 1.00 1182
|
| 152 |
+
X 1.00 1.00 1.00 50229
|
| 153 |
+
|
| 154 |
+
accuracy 1.00 54358
|
| 155 |
+
macro avg 1.00 1.00 1.00 54358
|
| 156 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 157 |
+
|
| 158 |
+
----- Degree classification report -----
|
| 159 |
+
precision recall f1-score support
|
| 160 |
+
|
| 161 |
+
Cmp 0.84 0.96 0.89 160
|
| 162 |
+
Pos 0.93 0.94 0.94 3702
|
| 163 |
+
Sup 0.99 0.99 0.99 147
|
| 164 |
+
X 1.00 0.99 1.00 50349
|
| 165 |
+
|
| 166 |
+
accuracy 0.99 54358
|
| 167 |
+
macro avg 0.94 0.97 0.95 54358
|
| 168 |
+
weighted avg 0.99 0.99 0.99 54358
|
| 169 |
+
|
| 170 |
+
----- Foreign classification report -----
|
| 171 |
+
precision recall f1-score support
|
| 172 |
+
|
| 173 |
+
X 1.00 1.00 1.00 54309
|
| 174 |
+
Yes 0.55 0.24 0.34 49
|
| 175 |
+
|
| 176 |
+
accuracy 1.00 54358
|
| 177 |
+
macro avg 0.77 0.62 0.67 54358
|
| 178 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 179 |
+
|
| 180 |
+
----- Gender classification report -----
|
| 181 |
+
precision recall f1-score support
|
| 182 |
+
|
| 183 |
+
Fem 1.00 1.00 1.00 135
|
| 184 |
+
Masc 1.00 1.00 1.00 395
|
| 185 |
+
Neut 1.00 1.00 1.00 436
|
| 186 |
+
X 1.00 1.00 1.00 53392
|
| 187 |
+
|
| 188 |
+
accuracy 1.00 54358
|
| 189 |
+
macro avg 1.00 1.00 1.00 54358
|
| 190 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 191 |
+
|
| 192 |
+
----- Mood classification report -----
|
| 193 |
+
precision recall f1-score support
|
| 194 |
+
|
| 195 |
+
Imp 0.84 0.96 0.89 203
|
| 196 |
+
Ind 0.99 0.99 0.99 3804
|
| 197 |
+
X 1.00 1.00 1.00 50351
|
| 198 |
+
|
| 199 |
+
accuracy 1.00 54358
|
| 200 |
+
macro avg 0.94 0.98 0.96 54358
|
| 201 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 202 |
+
|
| 203 |
+
----- NumType classification report -----
|
| 204 |
+
precision recall f1-score support
|
| 205 |
+
|
| 206 |
+
Card 0.97 0.98 0.98 1164
|
| 207 |
+
Mult 1.00 0.64 0.78 14
|
| 208 |
+
Ord 0.93 0.87 0.90 111
|
| 209 |
+
X 1.00 1.00 1.00 53069
|
| 210 |
+
|
| 211 |
+
accuracy 1.00 54358
|
| 212 |
+
macro avg 0.98 0.87 0.91 54358
|
| 213 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 214 |
+
|
| 215 |
+
----- Number classification report -----
|
| 216 |
+
precision recall f1-score support
|
| 217 |
+
|
| 218 |
+
Plur 0.98 0.98 0.98 3639
|
| 219 |
+
Sing 0.98 0.98 0.98 15212
|
| 220 |
+
X 0.99 0.99 0.99 35507
|
| 221 |
+
|
| 222 |
+
accuracy 0.99 54358
|
| 223 |
+
macro avg 0.98 0.98 0.98 54358
|
| 224 |
+
weighted avg 0.99 0.99 0.99 54358
|
| 225 |
+
|
| 226 |
+
----- Person classification report -----
|
| 227 |
+
precision recall f1-score support
|
| 228 |
+
|
| 229 |
+
1 0.99 1.00 0.99 857
|
| 230 |
+
2 1.00 0.99 1.00 472
|
| 231 |
+
3 1.00 1.00 1.00 2772
|
| 232 |
+
X 1.00 1.00 1.00 50257
|
| 233 |
+
|
| 234 |
+
accuracy 1.00 54358
|
| 235 |
+
macro avg 1.00 1.00 1.00 54358
|
| 236 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 237 |
+
|
| 238 |
+
----- Polarity classification report -----
|
| 239 |
+
precision recall f1-score support
|
| 240 |
+
|
| 241 |
+
Neg 0.98 0.98 0.98 240
|
| 242 |
+
Pos 1.00 0.88 0.93 8
|
| 243 |
+
X 1.00 1.00 1.00 54110
|
| 244 |
+
|
| 245 |
+
accuracy 1.00 54358
|
| 246 |
+
macro avg 0.99 0.95 0.97 54358
|
| 247 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 248 |
+
|
| 249 |
+
----- PronType classification report -----
|
| 250 |
+
precision recall f1-score support
|
| 251 |
+
|
| 252 |
+
Art 1.00 1.00 1.00 4129
|
| 253 |
+
Dem 0.99 0.98 0.99 517
|
| 254 |
+
Int 0.98 0.93 0.95 307
|
| 255 |
+
Neg 0.96 0.99 0.98 82
|
| 256 |
+
Prs 1.00 1.00 1.00 2614
|
| 257 |
+
Rel 0.91 0.98 0.94 347
|
| 258 |
+
X 1.00 1.00 1.00 46362
|
| 259 |
+
|
| 260 |
+
accuracy 1.00 54358
|
| 261 |
+
macro avg 0.98 0.98 0.98 54358
|
| 262 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 263 |
+
|
| 264 |
+
----- Poss classification report -----
|
| 265 |
+
precision recall f1-score support
|
| 266 |
+
|
| 267 |
+
X 1.00 1.00 1.00 53671
|
| 268 |
+
Yes 1.00 0.99 1.00 687
|
| 269 |
+
|
| 270 |
+
accuracy 1.00 54358
|
| 271 |
+
macro avg 1.00 1.00 1.00 54358
|
| 272 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 273 |
+
|
| 274 |
+
----- Reflex classification report -----
|
| 275 |
+
precision recall f1-score support
|
| 276 |
+
|
| 277 |
+
X 1.00 1.00 1.00 54337
|
| 278 |
+
Yes 0.95 0.86 0.90 21
|
| 279 |
+
|
| 280 |
+
accuracy 1.00 54358
|
| 281 |
+
macro avg 0.97 0.93 0.95 54358
|
| 282 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 283 |
+
|
| 284 |
+
----- Tense classification report -----
|
| 285 |
+
precision recall f1-score support
|
| 286 |
+
|
| 287 |
+
Past 0.98 0.99 0.98 2847
|
| 288 |
+
Pres 0.97 0.99 0.98 2289
|
| 289 |
+
X 1.00 1.00 1.00 49222
|
| 290 |
+
|
| 291 |
+
accuracy 1.00 54358
|
| 292 |
+
macro avg 0.98 0.99 0.99 54358
|
| 293 |
+
weighted avg 1.00 1.00 1.00 54358
|
| 294 |
+
|
| 295 |
+
----- VerbForm classification report -----
|
| 296 |
+
precision recall f1-score support
|
| 297 |
+
|
| 298 |
+
Fin 0.99 0.99 0.99 4579
|
| 299 |
+
Ger 0.95 0.91 0.93 722
|
| 300 |
+
Inf 0.98 0.97 0.97 1562
|
| 301 |
+
Part 0.93 0.96 0.94 1332
|
| 302 |
+
X 1.00 1.00 1.00 46163
|
| 303 |
+
|
| 304 |
+
accuracy 0.99 54358
|
| 305 |
+
macro avg 0.97 0.97 0.97 54358
|
| 306 |
+
weighted avg 0.99 0.99 0.99 54358
|
| 307 |
+
```
|
| 308 |
+
|
| 309 |
+
## Training logs
|
| 310 |
+
|
| 311 |
+
```
|
| 312 |
+
$ python -m multi_head_trainer --data-path dataset/ud_ewt_gum_pud_20250611 --save-path models/ud_ewt_gum_pud_20250611 --from-base microsoft/deberta-v3-base --train -E 16 -A 17
|
| 313 |
+
{'loss': 231.4746, 'grad_norm': 106.06476593017578, 'learning_rate': 1.1363636363636366e-05, 'epoch': 0.91}
|
| 314 |
+
{'eval_loss': 7.66445255279541, 'eval_f1_macro': 0.3212549341453801, 'eval_xpos_accuracy': 0.453834308592547, 'eval_xpos_precision_macro': 0.0985374290046747, 'eval_xpos_recall_macro': 0.11212050248120882, 'eval_xpos_f1_macro': 0.08354665721491084, 'eval_xpos_precision_micro': 0.453834308592547, 'eval_xpos_recall_micro': 0.453834308592547, 'eval_xpos_f1_micro': 0.453834308592547, 'eval_deprel_accuracy': 0.31413612565445026, 'eval_deprel_precision_macro': 0.10606953018602618, 'eval_deprel_recall_macro': 0.07957130702428165, 'eval_deprel_f1_macro': 0.060603378111730576, 'eval_deprel_precision_micro': 0.31413612565445026, 'eval_deprel_recall_micro': 0.31413612565445026, 'eval_deprel_f1_micro': 0.31413612565445026, 'eval_pos_accuracy': 0.5520172466892516, 'eval_pos_precision_macro': 0.3360610744921144, 'eval_pos_recall_macro': 0.30288392927640373, 'eval_pos_f1_macro': 0.2832616828686859, 'eval_pos_precision_micro': 0.5520172466892516, 'eval_pos_recall_micro': 0.5520172466892516, 'eval_pos_f1_micro': 0.5520172466892516, 'eval_Case_accuracy': 0.9519556513704959, 'eval_Case_precision_macro': 0.6507193247281353, 'eval_Case_recall_macro': 0.3338043056538773, 'eval_Case_f1_macro': 0.32621944206972703, 'eval_Case_precision_micro': 0.9519556513704959, 'eval_Case_recall_micro': 0.9519556513704959, 'eval_Case_f1_micro': 0.9519556513704959, 'eval_Definite_accuracy': 0.9592546966430552, 'eval_Definite_precision_macro': 0.65276545400769, 'eval_Definite_recall_macro': 0.5302160169723852, 'eval_Definite_f1_macro': 0.5738090050016655, 'eval_Definite_precision_micro': 0.9592546966430552, 'eval_Definite_recall_micro': 0.9592546966430552, 'eval_Definite_f1_micro': 0.9592546966430552, 'eval_Degree_accuracy': 0.9233754234678164, 'eval_Degree_precision_macro': 0.23089363275113206, 'eval_Degree_recall_macro': 0.24996665110384847, 'eval_Degree_f1_macro': 0.24005188233598618, 'eval_Degree_precision_micro': 0.9233754234678164, 'eval_Degree_recall_micro': 0.9233754234678164, 'eval_Degree_f1_micro': 0.9233754234678164, 'eval_Foreign_accuracy': 0.9990452725592855, 'eval_Foreign_precision_macro': 0.49963034839663617, 'eval_Foreign_recall_macro': 0.4998921284595944, 'eval_Foreign_f1_macro': 0.49976120414734476, 'eval_Foreign_precision_micro': 0.9990452725592855, 'eval_Foreign_recall_micro': 0.9990452725592855, 'eval_Foreign_f1_micro': 0.9990452725592855, 'eval_Gender_accuracy': 0.9816137973514013, 'eval_Gender_precision_macro': 0.24545636570865292, 'eval_Gender_recall_macro': 0.24994510664993727, 'eval_Gender_f1_macro': 0.2476804003543509, 'eval_Gender_precision_micro': 0.9816137973514013, 'eval_Gender_recall_micro': 0.9816137973514013, 'eval_Gender_f1_micro': 0.9816137973514013, 'eval_Mood_accuracy': 0.9199876809362488, 'eval_Mood_precision_macro': 0.4279375286491957, 'eval_Mood_recall_macro': 0.33382044137322686, 'eval_Mood_f1_macro': 0.32056560960087205, 'eval_Mood_precision_micro': 0.9199876809362488, 'eval_Mood_recall_micro': 0.9199876809362488, 'eval_Mood_f1_micro': 0.9199876809362488, 'eval_NumType_accuracy': 0.9826609177702494, 'eval_NumType_precision_macro': 0.24571820226103563, 'eval_NumType_recall_macro': 0.24994516513129034, 'eval_NumType_f1_macro': 0.247813660158131, 'eval_NumType_precision_micro': 0.9826609177702494, 'eval_NumType_recall_micro': 0.9826609177702494, 'eval_NumType_f1_micro': 0.9826609177702494, 'eval_Number_accuracy': 0.785525100092393, 'eval_Number_precision_macro': 0.5001241663136943, 'eval_Number_recall_macro': 0.5252545809547717, 'eval_Number_f1_macro': 0.5119670612048098, 'eval_Number_precision_micro': 0.785525100092393, 'eval_Number_recall_micro': 0.785525100092393, 'eval_Number_f1_micro': 0.785525100092393, 'eval_Person_accuracy': 0.9086233446258084, 'eval_Person_precision_macro': 0.22720481779256385, 'eval_Person_recall_macro': 0.24994069806845137, 'eval_Person_f1_macro': 0.2380310780501186, 'eval_Person_precision_micro': 0.9086233446258084, 'eval_Person_recall_micro': 0.9086233446258084, 'eval_Person_f1_micro': 0.9086233446258084, 'eval_Polarity_accuracy': 0.993717277486911, 'eval_Polarity_precision_macro': 0.3313105176149257, 'eval_Polarity_recall_macro': 0.3332610334748345, 'eval_Polarity_f1_macro': 0.3322829131652661, 'eval_Polarity_precision_micro': 0.993717277486911, 'eval_Polarity_recall_micro': 0.993717277486911, 'eval_Polarity_f1_micro': 0.993717277486911, 'eval_PronType_accuracy': 0.8850015398829689, 'eval_PronType_precision_macro': 0.33913256786339513, 'eval_PronType_recall_macro': 0.22909293694986518, 'eval_PronType_f1_macro': 0.241420508051835, 'eval_PronType_precision_micro': 0.8850015398829689, 'eval_PronType_recall_micro': 0.8850015398829689, 'eval_PronType_f1_micro': 0.8850015398829689, 'eval_Poss_accuracy': 0.9857098860486603, 'eval_Poss_precision_macro': 0.49285494302433014, 'eval_Poss_recall_macro': 0.5, 'eval_Poss_f1_macro': 0.49640176189589924, 'eval_Poss_precision_micro': 0.9857098860486603, 'eval_Poss_recall_micro': 0.9857098860486603, 'eval_Poss_f1_micro': 0.9857098860486603, 'eval_Reflex_accuracy': 0.9989220819217739, 'eval_Reflex_precision_macro': 0.4995687397960755, 'eval_Reflex_recall_macro': 0.4998921151593613, 'eval_Reflex_f1_macro': 0.4997303751637008, 'eval_Reflex_precision_micro': 0.9989220819217739, 'eval_Reflex_recall_micro': 0.9989220819217739, 'eval_Reflex_f1_micro': 0.9989220819217739, 'eval_Tense_accuracy': 0.904896827841084, 'eval_Tense_precision_macro': 0.6349499804851996, 'eval_Tense_recall_macro': 0.3366113501331694, 'eval_Tense_f1_macro': 0.3231750317464975, 'eval_Tense_precision_micro': 0.904896827841084, 'eval_Tense_recall_micro': 0.904896827841084, 'eval_Tense_f1_micro': 0.904896827841084, 'eval_VerbForm_accuracy': 0.8587311364336311, 'eval_VerbForm_precision_macro': 0.3706041017094936, 'eval_VerbForm_recall_macro': 0.24373002742431563, 'eval_VerbForm_f1_macro': 0.25626716347530987, 'eval_VerbForm_precision_micro': 0.8587311364336311, 'eval_VerbForm_recall_micro': 0.8587311364336311, 'eval_VerbForm_f1_micro': 0.8587311364336311, 'eval_runtime': 255.7745, 'eval_samples_per_second': 9.356, 'eval_steps_per_second': 4.68, 'epoch': 0.91}
|
| 315 |
+
{'loss': 62.568, 'grad_norm': 29.363380432128906, 'learning_rate': 1.96969696969697e-05, 'epoch': 1.81}
|
| 316 |
+
{'eval_loss': 1.5485634803771973, 'eval_f1_macro': 0.7251004846978346, 'eval_xpos_accuracy': 0.89781336618417, 'eval_xpos_precision_macro': 0.4189080143475885, 'eval_xpos_recall_macro': 0.4183066111972118, 'eval_xpos_f1_macro': 0.4072079555660955, 'eval_xpos_precision_micro': 0.89781336618417, 'eval_xpos_recall_micro': 0.89781336618417, 'eval_xpos_f1_micro': 0.89781336618417, 'eval_deprel_accuracy': 0.7230674468740376, 'eval_deprel_precision_macro': 0.35091430802826373, 'eval_deprel_recall_macro': 0.35532092053616493, 'eval_deprel_f1_macro': 0.3339262047895113, 'eval_deprel_precision_micro': 0.7230674468740376, 'eval_deprel_recall_micro': 0.7230674468740376, 'eval_deprel_f1_micro': 0.7230674468740376, 'eval_pos_accuracy': 0.9451801663073607, 'eval_pos_precision_macro': 0.7746892031061138, 'eval_pos_recall_macro': 0.7688502419391033, 'eval_pos_f1_macro': 0.7697645179995556, 'eval_pos_precision_micro': 0.9451801663073607, 'eval_pos_recall_micro': 0.9451801663073607, 'eval_pos_f1_micro': 0.9451801663073607, 'eval_Case_accuracy': 0.9972282106559901, 'eval_Case_precision_macro': 0.9571153892911846, 'eval_Case_recall_macro': 0.9429939795485179, 'eval_Case_f1_macro': 0.949550690498813, 'eval_Case_precision_micro': 0.9972282106559901, 'eval_Case_recall_micro': 0.9972282106559901, 'eval_Case_f1_micro': 0.9972282106559901, 'eval_Definite_accuracy': 0.9987372959655066, 'eval_Definite_precision_macro': 0.9827523049499879, 'eval_Definite_recall_macro': 0.999135894777587, 'eval_Definite_f1_macro': 0.9907326490598157, 'eval_Definite_precision_micro': 0.9987372959655066, 'eval_Definite_recall_micro': 0.9987372959655066, 'eval_Definite_f1_micro': 0.9987372959655066, 'eval_Degree_accuracy': 0.9824453341546042, 'eval_Degree_precision_macro': 0.46380002110433677, 'eval_Degree_recall_macro': 0.47851253117946807, 'eval_Degree_f1_macro': 0.4709255268772733, 'eval_Degree_precision_micro': 0.9824453341546042, 'eval_Degree_recall_micro': 0.9824453341546042, 'eval_Degree_f1_micro': 0.9824453341546042, 'eval_Foreign_accuracy': 0.9992608561749307, 'eval_Foreign_precision_macro': 0.49963042808746533, 'eval_Foreign_recall_macro': 0.5, 'eval_Foreign_f1_macro': 0.49981514572678537, 'eval_Foreign_precision_micro': 0.9992608561749307, 'eval_Foreign_recall_micro': 0.9992608561749307, 'eval_Foreign_f1_micro': 0.9992608561749307, 'eval_Gender_accuracy': 0.9929473360024638, 'eval_Gender_precision_macro': 0.5572125445758415, 'eval_Gender_recall_macro': 0.592241580257665, 'eval_Gender_f1_macro': 0.564806228601335, 'eval_Gender_precision_micro': 0.9929473360024638, 'eval_Gender_recall_micro': 0.9929473360024638, 'eval_Gender_f1_micro': 0.9929473360024638, 'eval_Mood_accuracy': 0.9923621804742839, 'eval_Mood_precision_macro': 0.9376884536362167, 'eval_Mood_recall_macro': 0.8162174082599184, 'eval_Mood_f1_macro': 0.8589676618826433, 'eval_Mood_precision_micro': 0.9923621804742839, 'eval_Mood_recall_micro': 0.9923621804742839, 'eval_Mood_f1_micro': 0.9923621804742839, 'eval_NumType_accuracy': 0.9975977825685248, 'eval_NumType_precision_macro': 0.48635108994901743, 'eval_NumType_recall_macro': 0.4939682868411982, 'eval_NumType_f1_macro': 0.4901027311450764, 'eval_NumType_precision_micro': 0.9975977825685248, 'eval_NumType_recall_micro': 0.9975977825685248, 'eval_NumType_f1_micro': 0.9975977825685248, 'eval_Number_accuracy': 0.9815522020326455, 'eval_Number_precision_macro': 0.972467722373755, 'eval_Number_recall_macro': 0.978175648807779, 'eval_Number_f1_macro': 0.9752904200419685, 'eval_Number_precision_micro': 0.9815522020326455, 'eval_Number_recall_micro': 0.9815522020326455, 'eval_Number_f1_micro': 0.9815522020326455, 'eval_Person_accuracy': 0.993963658761934, 'eval_Person_precision_macro': 0.9728795173109788, 'eval_Person_recall_macro': 0.9849107219848866, 'eval_Person_f1_macro': 0.9783149962339074, 'eval_Person_precision_micro': 0.993963658761934, 'eval_Person_recall_micro': 0.993963658761934, 'eval_Person_f1_micro': 0.993963658761934, 'eval_Polarity_accuracy': 0.9987988912842624, 'eval_Polarity_precision_macro': 0.662169697933114, 'eval_Polarity_recall_macro': 0.6216009645191934, 'eval_Polarity_f1_macro': 0.6405287696477676, 'eval_Polarity_precision_micro': 0.9987988912842624, 'eval_Polarity_recall_micro': 0.9987988912842624, 'eval_Polarity_f1_micro': 0.9987988912842624, 'eval_PronType_accuracy': 0.9898675700646751, 'eval_PronType_precision_macro': 0.7853386383418702, 'eval_PronType_recall_macro': 0.7472930954508582, 'eval_PronType_f1_macro': 0.7595622886370467, 'eval_PronType_precision_micro': 0.9898675700646751, 'eval_PronType_recall_micro': 0.9898675700646751, 'eval_PronType_f1_micro': 0.9898675700646751, 'eval_Poss_accuracy': 0.9997844163843548, 'eval_Poss_precision_macro': 0.9925690021231423, 'eval_Poss_recall_macro': 0.999890645503968, 'eval_Poss_f1_macro': 0.9962020012641057, 'eval_Poss_precision_micro': 0.9997844163843548, 'eval_Poss_recall_micro': 0.9997844163843548, 'eval_Poss_f1_micro': 0.9997844163843548, 'eval_Reflex_accuracy': 0.9991376655374191, 'eval_Reflex_precision_macro': 0.49956883276870956, 'eval_Reflex_recall_macro': 0.5, 'eval_Reflex_f1_macro': 0.49978432339166873, 'eval_Reflex_precision_micro': 0.9991376655374191, 'eval_Reflex_recall_micro': 0.9991376655374191, 'eval_Reflex_f1_micro': 0.9991376655374191, 'eval_Tense_accuracy': 0.992608561749307, 'eval_Tense_precision_macro': 0.9656908580652658, 'eval_Tense_recall_macro': 0.9823099012061105, 'eval_Tense_f1_macro': 0.9737702990215137, 'eval_Tense_precision_micro': 0.992608561749307, 'eval_Tense_recall_micro': 0.992608561749307, 'eval_Tense_f1_micro': 0.992608561749307, 'eval_VerbForm_accuracy': 0.9823221435170927, 'eval_VerbForm_precision_macro': 0.8905976605259734, 'eval_VerbForm_recall_macro': 0.8984709989973482, 'eval_VerbForm_f1_macro': 0.8925563141761395, 'eval_VerbForm_precision_micro': 0.9823221435170927, 'eval_VerbForm_recall_micro': 0.9823221435170927, 'eval_VerbForm_f1_micro': 0.9823221435170927, 'eval_runtime': 185.7828, 'eval_samples_per_second': 12.881, 'eval_steps_per_second': 6.443, 'epoch': 1.81}
|
| 317 |
+
{'loss': 17.1872, 'grad_norm': 22.771862030029297, 'learning_rate': 1.8434343434343437e-05, 'epoch': 2.71}
|
| 318 |
+
{'eval_loss': 0.7269241809844971, 'eval_f1_macro': 0.8116491422564279, 'eval_xpos_accuracy': 0.9481983369263935, 'eval_xpos_precision_macro': 0.6600220806367743, 'eval_xpos_recall_macro': 0.6472446095465938, 'eval_xpos_f1_macro': 0.643066314297495, 'eval_xpos_precision_micro': 0.9481983369263935, 'eval_xpos_recall_micro': 0.9481983369263935, 'eval_xpos_f1_micro': 0.9481983369263935, 'eval_deprel_accuracy': 0.8582999692023406, 'eval_deprel_precision_macro': 0.5527845474769064, 'eval_deprel_recall_macro': 0.4976910116719008, 'eval_deprel_f1_macro': 0.497298056183901, 'eval_deprel_precision_micro': 0.8582999692023406, 'eval_deprel_recall_micro': 0.8582999692023406, 'eval_deprel_f1_micro': 0.8582999692023406, 'eval_pos_accuracy': 0.9637511549122266, 'eval_pos_precision_macro': 0.9553702427412276, 'eval_pos_recall_macro': 0.8711403830822372, 'eval_pos_f1_macro': 0.8894834785197641, 'eval_pos_precision_micro': 0.9637511549122266, 'eval_pos_recall_micro': 0.9637511549122266, 'eval_pos_f1_micro': 0.9637511549122266, 'eval_Case_accuracy': 0.9985833076686171, 'eval_Case_precision_macro': 0.9685013847425162, 'eval_Case_recall_macro': 0.984937981536758, 'eval_Case_f1_macro': 0.9763189308133121, 'eval_Case_precision_micro': 0.9985833076686171, 'eval_Case_recall_micro': 0.9985833076686171, 'eval_Case_f1_micro': 0.9985833076686171, 'eval_Definite_accuracy': 0.9996612257468432, 'eval_Definite_precision_macro': 0.9961863294639094, 'eval_Definite_recall_macro': 0.9994665060778813, 'eval_Definite_f1_macro': 0.9978179168508036, 'eval_Definite_precision_micro': 0.9996612257468432, 'eval_Definite_recall_micro': 0.9996612257468432, 'eval_Definite_f1_micro': 0.9996612257468432, 'eval_Degree_accuracy': 0.989344009855251, 'eval_Degree_precision_macro': 0.9479393707543897, 'eval_Degree_recall_macro': 0.9185496642416123, 'eval_Degree_f1_macro': 0.9323726006274098, 'eval_Degree_precision_micro': 0.989344009855251, 'eval_Degree_recall_micro': 0.989344009855251, 'eval_Degree_f1_micro': 0.989344009855251, 'eval_Foreign_accuracy': 0.9992608561749307, 'eval_Foreign_precision_macro': 0.49963042808746533, 'eval_Foreign_recall_macro': 0.5, 'eval_Foreign_f1_macro': 0.49981514572678537, 'eval_Foreign_precision_micro': 0.9992608561749307, 'eval_Foreign_recall_micro': 0.9992608561749307, 'eval_Foreign_f1_micro': 0.9992608561749307, 'eval_Gender_accuracy': 0.9968278410840776, 'eval_Gender_precision_macro': 0.9171126934911522, 'eval_Gender_recall_macro': 0.7532854765238975, 'eval_Gender_f1_macro': 0.738963645800478, 'eval_Gender_precision_micro': 0.9968278410840776, 'eval_Gender_recall_micro': 0.9968278410840776, 'eval_Gender_f1_micro': 0.9968278410840776, 'eval_Mood_accuracy': 0.995349553433939, 'eval_Mood_precision_macro': 0.9245176429183594, 'eval_Mood_recall_macro': 0.9346464147800998, 'eval_Mood_f1_macro': 0.929465756148751, 'eval_Mood_precision_micro': 0.995349553433939, 'eval_Mood_recall_micro': 0.995349553433939, 'eval_Mood_f1_micro': 0.995349553433939, 'eval_NumType_accuracy': 0.9976285802279027, 'eval_NumType_precision_macro': 0.6876960521215374, 'eval_NumType_recall_macro': 0.5195858118242055, 'eval_NumType_f1_macro': 0.5362370302327577, 'eval_NumType_precision_micro': 0.9976285802279027, 'eval_NumType_recall_micro': 0.9976285802279027, 'eval_NumType_f1_micro': 0.9976285802279027, 'eval_Number_accuracy': 0.9876193409300893, 'eval_Number_precision_macro': 0.9834029415301421, 'eval_Number_recall_macro': 0.9842909544463275, 'eval_Number_f1_macro': 0.9838431694065118, 'eval_Number_precision_micro': 0.9876193409300893, 'eval_Number_recall_micro': 0.9876193409300893, 'eval_Number_f1_micro': 0.9876193409300893, 'eval_Person_accuracy': 0.9989528795811519, 'eval_Person_precision_macro': 0.9939441883837415, 'eval_Person_recall_macro': 0.9942794271236972, 'eval_Person_f1_macro': 0.9940845658371668, 'eval_Person_precision_micro': 0.9989528795811519, 'eval_Person_recall_micro': 0.9989528795811519, 'eval_Person_f1_micro': 0.9989528795811519, 'eval_Polarity_accuracy': 0.9991068678780413, 'eval_Polarity_precision_macro': 0.6588328632206752, 'eval_Polarity_recall_macro': 0.6432019290383867, 'eval_Polarity_f1_macro': 0.6508198138030398, 'eval_Polarity_precision_micro': 0.9991068678780413, 'eval_Polarity_recall_micro': 0.9991068678780413, 'eval_Polarity_f1_micro': 0.9991068678780413, 'eval_PronType_accuracy': 0.9967354481059439, 'eval_PronType_precision_macro': 0.960512585663275, 'eval_PronType_recall_macro': 0.8944858082036587, 'eval_PronType_f1_macro': 0.9159045601961793, 'eval_PronType_precision_micro': 0.9967354481059439, 'eval_PronType_recall_micro': 0.9967354481059439, 'eval_PronType_f1_micro': 0.9967354481059439, 'eval_Poss_accuracy': 0.9998768093624885, 'eval_Poss_precision_macro': 0.9957264957264957, 'eval_Poss_recall_macro': 0.9999375117165532, 'eval_Poss_f1_macro': 0.9978228311589807, 'eval_Poss_precision_micro': 0.9998768093624885, 'eval_Poss_recall_micro': 0.9998768093624885, 'eval_Poss_f1_micro': 0.9998768093624885, 'eval_Reflex_accuracy': 0.9991376655374191, 'eval_Reflex_precision_macro': 0.49956883276870956, 'eval_Reflex_recall_macro': 0.5, 'eval_Reflex_f1_macro': 0.49978432339166873, 'eval_Reflex_precision_micro': 0.9991376655374191, 'eval_Reflex_recall_micro': 0.9991376655374191, 'eval_Reflex_f1_micro': 0.9991376655374191, 'eval_Tense_accuracy': 0.9952879581151832, 'eval_Tense_precision_macro': 0.9787871267745433, 'eval_Tense_recall_macro': 0.9864770652457818, 'eval_Tense_f1_macro': 0.9825904650648791, 'eval_Tense_precision_micro': 0.9952879581151832, 'eval_Tense_recall_micro': 0.9952879581151832, 'eval_Tense_f1_micro': 0.9952879581151832, 'eval_VerbForm_accuracy': 0.9902063443178318, 'eval_VerbForm_precision_macro': 0.9488646236993693, 'eval_VerbForm_recall_macro': 0.9397177219211919, 'eval_VerbForm_f1_macro': 0.943995956555818, 'eval_VerbForm_precision_micro': 0.9902063443178318, 'eval_VerbForm_recall_micro': 0.9902063443178318, 'eval_VerbForm_f1_micro': 0.9902063443178318, 'eval_runtime': 186.7334, 'eval_samples_per_second': 12.815, 'eval_steps_per_second': 6.41, 'epoch': 2.71}
|
| 319 |
+
{'loss': 9.388, 'grad_norm': 25.146930694580078, 'learning_rate': 1.7171717171717173e-05, 'epoch': 3.61}
|
| 320 |
+
{'eval_loss': 0.49747249484062195, 'eval_f1_macro': 0.8718377259092057, 'eval_xpos_accuracy': 0.960948567908839, 'eval_xpos_precision_macro': 0.8062329343755253, 'eval_xpos_recall_macro': 0.7627058644666792, 'eval_xpos_f1_macro': 0.7735844398201657, 'eval_xpos_precision_micro': 0.960948567908839, 'eval_xpos_recall_micro': 0.960948567908839, 'eval_xpos_f1_micro': 0.960948567908839, 'eval_deprel_accuracy': 0.8987064983061287, 'eval_deprel_precision_macro': 0.6649961928130208, 'eval_deprel_recall_macro': 0.6061168035600968, 'eval_deprel_f1_macro': 0.6145059768785477, 'eval_deprel_precision_micro': 0.8987064983061287, 'eval_deprel_recall_micro': 0.8987064983061287, 'eval_deprel_f1_micro': 0.8987064983061287, 'eval_pos_accuracy': 0.9664613489374807, 'eval_pos_precision_macro': 0.9574652805906176, 'eval_pos_recall_macro': 0.9091873832322055, 'eval_pos_f1_macro': 0.9269694027860854, 'eval_pos_precision_micro': 0.9664613489374807, 'eval_pos_recall_micro': 0.9664613489374807, 'eval_pos_f1_micro': 0.9664613489374807, 'eval_Case_accuracy': 0.9987064983061288, 'eval_Case_precision_macro': 0.9693431856757901, 'eval_Case_recall_macro': 0.9855059941290149, 'eval_Case_f1_macro': 0.977021476488875, 'eval_Case_precision_micro': 0.9987064983061288, 'eval_Case_recall_micro': 0.9987064983061288, 'eval_Case_f1_micro': 0.9987064983061288, 'eval_Definite_accuracy': 0.9999384046812442, 'eval_Definite_precision_macro': 0.9995662546085448, 'eval_Definite_recall_macro': 0.999977959246647, 'eval_Definite_f1_macro': 0.9997719653700766, 'eval_Definite_precision_micro': 0.9999384046812442, 'eval_Definite_recall_micro': 0.9999384046812442, 'eval_Definite_f1_micro': 0.9999384046812442, 'eval_Degree_accuracy': 0.9905759162303664, 'eval_Degree_precision_macro': 0.9404722911369776, 'eval_Degree_recall_macro': 0.9643513679469289, 'eval_Degree_f1_macro': 0.9518304351585247, 'eval_Degree_precision_micro': 0.9905759162303664, 'eval_Degree_recall_micro': 0.9905759162303664, 'eval_Degree_f1_micro': 0.9905759162303664, 'eval_Foreign_accuracy': 0.999445642131198, 'eval_Foreign_precision_macro': 0.9997227698373583, 'eval_Foreign_recall_macro': 0.625, 'eval_Foreign_f1_macro': 0.6998613464797412, 'eval_Foreign_precision_micro': 0.999445642131198, 'eval_Foreign_recall_micro': 0.999445642131198, 'eval_Foreign_f1_micro': 0.999445642131198, 'eval_Gender_accuracy': 0.9999384046812442, 'eval_Gender_precision_macro': 0.9979993409593748, 'eval_Gender_recall_macro': 0.9999843161856964, 'eval_Gender_f1_macro': 0.9989897828680285, 'eval_Gender_precision_micro': 0.9999384046812442, 'eval_Gender_recall_micro': 0.9999384046812442, 'eval_Gender_f1_micro': 0.9999384046812442, 'eval_Mood_accuracy': 0.9959655066214967, 'eval_Mood_precision_macro': 0.9293040431350059, 'eval_Mood_recall_macro': 0.9494028654198089, 'eval_Mood_f1_macro': 0.938936855522995, 'eval_Mood_precision_micro': 0.9959655066214967, 'eval_Mood_recall_micro': 0.9959655066214967, 'eval_Mood_f1_micro': 0.9959655066214967, 'eval_NumType_accuracy': 0.9982445334154604, 'eval_NumType_precision_macro': 0.6993009241429441, 'eval_NumType_recall_macro': 0.6305054622458915, 'eval_NumType_f1_macro': 0.6566138277103395, 'eval_NumType_precision_micro': 0.9982445334154604, 'eval_NumType_recall_micro': 0.9982445334154604, 'eval_NumType_f1_micro': 0.9982445334154604, 'eval_Number_accuracy': 0.988266091777025, 'eval_Number_precision_macro': 0.9850941695389235, 'eval_Number_recall_macro': 0.9857136154248215, 'eval_Number_f1_macro': 0.9853955679702847, 'eval_Number_precision_micro': 0.988266091777025, 'eval_Number_recall_micro': 0.988266091777025, 'eval_Number_f1_micro': 0.988266091777025, 'eval_Person_accuracy': 0.9993532491530643, 'eval_Person_precision_macro': 0.9959492274518652, 'eval_Person_recall_macro': 0.9975098186925492, 'eval_Person_f1_macro': 0.9967214484807434, 'eval_Person_precision_micro': 0.9993532491530643, 'eval_Person_recall_micro': 0.9993532491530643, 'eval_Person_f1_micro': 0.9993532491530643, 'eval_Polarity_accuracy': 0.9991992608561749, 'eval_Polarity_precision_macro': 0.6607795396004207, 'eval_Polarity_recall_macro': 0.6468158611932046, 'eval_Polarity_f1_macro': 0.6536410927097368, 'eval_Polarity_precision_micro': 0.9991992608561749, 'eval_Polarity_recall_micro': 0.9991992608561749, 'eval_Polarity_f1_micro': 0.9991992608561749, 'eval_PronType_accuracy': 0.99781336618417, 'eval_PronType_precision_macro': 0.9644844775814299, 'eval_PronType_recall_macro': 0.9638509473805712, 'eval_PronType_f1_macro': 0.9640893045253183, 'eval_PronType_precision_micro': 0.99781336618417, 'eval_PronType_recall_micro': 0.99781336618417, 'eval_PronType_f1_micro': 0.99781336618417, 'eval_Poss_accuracy': 0.9997536187249769, 'eval_Poss_precision_macro': 0.99458832399169, 'eval_Poss_recall_macro': 0.9966891310250018, 'eval_Poss_f1_macro': 0.9956364344952822, 'eval_Poss_precision_micro': 0.9997536187249769, 'eval_Poss_recall_micro': 0.9997536187249769, 'eval_Poss_f1_micro': 0.9997536187249769, 'eval_Reflex_accuracy': 0.9992608561749307, 'eval_Reflex_precision_macro': 0.9996303825540566, 'eval_Reflex_recall_macro': 0.5714285714285714, 'eval_Reflex_f1_macro': 0.6248151229432428, 'eval_Reflex_precision_micro': 0.9992608561749307, 'eval_Reflex_recall_micro': 0.9992608561749307, 'eval_Reflex_f1_micro': 0.9992608561749307, 'eval_Tense_accuracy': 0.9957191253464737, 'eval_Tense_precision_macro': 0.9794265610405795, 'eval_Tense_recall_macro': 0.9897261147614769, 'eval_Tense_f1_macro': 0.9845279675778684, 'eval_Tense_precision_micro': 0.9957191253464737, 'eval_Tense_recall_micro': 0.9957191253464737, 'eval_Tense_f1_micro': 0.9957191253464737, 'eval_VerbForm_accuracy': 0.9914690483523252, 'eval_VerbForm_precision_macro': 0.9504258537812117, 'eval_VerbForm_recall_macro': 0.9503359343965861, 'eval_VerbForm_f1_macro': 0.9501666185798474, 'eval_VerbForm_precision_micro': 0.9914690483523252, 'eval_VerbForm_recall_micro': 0.9914690483523252, 'eval_VerbForm_f1_micro': 0.9914690483523252, 'eval_runtime': 188.9191, 'eval_samples_per_second': 12.667, 'eval_steps_per_second': 6.336, 'epoch': 3.61}
|
| 321 |
+
{'loss': 6.5081, 'grad_norm': 21.06374740600586, 'learning_rate': 1.590909090909091e-05, 'epoch': 4.51}
|
| 322 |
+
{'eval_loss': 0.408866822719574, 'eval_f1_macro': 0.8954199126696436, 'eval_xpos_accuracy': 0.9660301817061904, 'eval_xpos_precision_macro': 0.8447770793450754, 'eval_xpos_recall_macro': 0.8037038582000618, 'eval_xpos_f1_macro': 0.8057847594652022, 'eval_xpos_precision_micro': 0.9660301817061904, 'eval_xpos_recall_micro': 0.9660301817061904, 'eval_xpos_f1_micro': 0.9660301817061904, 'eval_deprel_accuracy': 0.9175546658453958, 'eval_deprel_precision_macro': 0.7712950346412832, 'eval_deprel_recall_macro': 0.6759337104704818, 'eval_deprel_f1_macro': 0.6839128952920054, 'eval_deprel_precision_micro': 0.9175546658453958, 'eval_deprel_recall_micro': 0.9175546658453958, 'eval_deprel_f1_micro': 0.9175546658453958, 'eval_pos_accuracy': 0.9687403757314444, 'eval_pos_precision_macro': 0.9605966613306007, 'eval_pos_recall_macro': 0.9193023354683654, 'eval_pos_f1_macro': 0.9354703235410045, 'eval_pos_precision_micro': 0.9687403757314444, 'eval_pos_recall_micro': 0.9687403757314444, 'eval_pos_f1_micro': 0.9687403757314444, 'eval_Case_accuracy': 0.9985525100092393, 'eval_Case_precision_macro': 0.9681490373165985, 'eval_Case_recall_macro': 0.9839429566611361, 'eval_Case_f1_macro': 0.975677912282945, 'eval_Case_precision_micro': 0.9985525100092393, 'eval_Case_recall_micro': 0.9985525100092393, 'eval_Case_f1_micro': 0.9985525100092393, 'eval_Definite_accuracy': 0.9999384046812442, 'eval_Definite_precision_macro': 0.9995662546085448, 'eval_Definite_recall_macro': 0.999977959246647, 'eval_Definite_f1_macro': 0.9997719653700766, 'eval_Definite_precision_micro': 0.9999384046812442, 'eval_Definite_recall_micro': 0.9999384046812442, 'eval_Definite_f1_micro': 0.9999384046812442, 'eval_Degree_accuracy': 0.9911302740991684, 'eval_Degree_precision_macro': 0.93486030156168, 'eval_Degree_recall_macro': 0.9676954382176055, 'eval_Degree_f1_macro': 0.950630871614094, 'eval_Degree_precision_micro': 0.9911302740991684, 'eval_Degree_recall_micro': 0.9911302740991684, 'eval_Degree_f1_micro': 0.9911302740991684, 'eval_Foreign_accuracy': 0.9995688327687096, 'eval_Foreign_precision_macro': 0.9997843499691929, 'eval_Foreign_recall_macro': 0.7083333333333334, 'eval_Foreign_f1_macro': 0.7940097987859366, 'eval_Foreign_precision_micro': 0.9995688327687096, 'eval_Foreign_recall_micro': 0.9995688327687096, 'eval_Foreign_f1_micro': 0.9995688327687096, 'eval_Gender_accuracy': 0.9999384046812442, 'eval_Gender_precision_macro': 0.9977272727272728, 'eval_Gender_recall_macro': 0.9999843161856964, 'eval_Gender_f1_macro': 0.9988506053354429, 'eval_Gender_precision_micro': 0.9999384046812442, 'eval_Gender_recall_micro': 0.9999384046812442, 'eval_Gender_f1_micro': 0.9999384046812442, 'eval_Mood_accuracy': 0.9960886972590083, 'eval_Mood_precision_macro': 0.9285990916036216, 'eval_Mood_recall_macro': 0.9507186223908771, 'eval_Mood_f1_macro': 0.9391042378788114, 'eval_Mood_precision_micro': 0.9960886972590083, 'eval_Mood_recall_micro': 0.9960886972590083, 'eval_Mood_f1_micro': 0.9960886972590083, 'eval_NumType_accuracy': 0.9986141053279951, 'eval_NumType_precision_macro': 0.6822860763993688, 'eval_NumType_recall_macro': 0.676377320275705, 'eval_NumType_f1_macro': 0.6791893073788933, 'eval_NumType_precision_micro': 0.9986141053279951, 'eval_NumType_recall_micro': 0.9986141053279951, 'eval_NumType_f1_micro': 0.9986141053279951, 'eval_Number_accuracy': 0.9889436402833385, 'eval_Number_precision_macro': 0.98638555354807, 'eval_Number_recall_macro': 0.9862674454146649, 'eval_Number_f1_macro': 0.9863242604642144, 'eval_Number_precision_micro': 0.9889436402833385, 'eval_Number_recall_micro': 0.9889436402833385, 'eval_Number_f1_micro': 0.9889436402833385, 'eval_Person_accuracy': 0.9992608561749307, 'eval_Person_precision_macro': 0.9954674214517129, 'eval_Person_recall_macro': 0.9967809199283294, 'eval_Person_f1_macro': 0.9961187221016584, 'eval_Person_precision_micro': 0.9992608561749307, 'eval_Person_recall_micro': 0.9992608561749307, 'eval_Person_f1_micro': 0.9992608561749307, 'eval_Polarity_accuracy': 0.9993532491530643, 'eval_Polarity_precision_macro': 0.6592447751841108, 'eval_Polarity_recall_macro': 0.6576163434528012, 'eval_Polarity_f1_macro': 0.6584281574162262, 'eval_Polarity_precision_micro': 0.9993532491530643, 'eval_Polarity_recall_micro': 0.9993532491530643, 'eval_Polarity_f1_micro': 0.9993532491530643, 'eval_PronType_accuracy': 0.9979365568216816, 'eval_PronType_precision_macro': 0.9683675975317747, 'eval_PronType_recall_macro': 0.9663774078572499, 'eval_PronType_f1_macro': 0.9672379432789368, 'eval_PronType_precision_micro': 0.9979365568216816, 'eval_PronType_recall_micro': 0.9979365568216816, 'eval_PronType_f1_micro': 0.9979365568216816, 'eval_Poss_accuracy': 0.9997228210655991, 'eval_Poss_precision_macro': 0.9935291465247402, 'eval_Poss_recall_macro': 0.9966735089541401, 'eval_Poss_f1_macro': 0.9950961850339957, 'eval_Poss_precision_micro': 0.9997228210655991, 'eval_Poss_recall_micro': 0.9997228210655991, 'eval_Poss_f1_micro': 0.9997228210655991, 'eval_Reflex_accuracy': 0.9995380351093317, 'eval_Reflex_precision_macro': 0.9997689250392827, 'eval_Reflex_recall_macro': 0.7321428571428572, 'eval_Reflex_f1_macro': 0.8169576065473594, 'eval_Reflex_precision_micro': 0.9995380351093317, 'eval_Reflex_recall_micro': 0.9995380351093317, 'eval_Reflex_f1_micro': 0.9995380351093317, 'eval_Tense_accuracy': 0.9958731136433631, 'eval_Tense_precision_macro': 0.9809496532246222, 'eval_Tense_recall_macro': 0.9892439078556619, 'eval_Tense_f1_macro': 0.9850671410936594, 'eval_Tense_precision_micro': 0.9958731136433631, 'eval_Tense_recall_micro': 0.9958731136433631, 'eval_Tense_f1_micro': 0.9958731136433631, 'eval_VerbForm_accuracy': 0.9914074530335695, 'eval_VerbForm_precision_macro': 0.9459356559961168, 'eval_VerbForm_recall_macro': 0.9543664388755427, 'eval_VerbForm_f1_macro': 0.9499257351731222, 'eval_VerbForm_precision_micro': 0.9914074530335695, 'eval_VerbForm_recall_micro': 0.9914074530335695, 'eval_VerbForm_f1_micro': 0.9914074530335695, 'eval_runtime': 184.6158, 'eval_samples_per_second': 12.962, 'eval_steps_per_second': 6.484, 'epoch': 4.51}
|
| 323 |
+
{'loss': 5.1338, 'grad_norm': 16.48375701904297, 'learning_rate': 1.4646464646464649e-05, 'epoch': 5.41}
|
| 324 |
+
{'eval_loss': 0.36643537878990173, 'eval_f1_macro': 0.9241799342795853, 'eval_xpos_accuracy': 0.9675392670157068, 'eval_xpos_precision_macro': 0.9066585459411307, 'eval_xpos_recall_macro': 0.8650145319707331, 'eval_xpos_f1_macro': 0.8733249510022046, 'eval_xpos_precision_micro': 0.9675392670157068, 'eval_xpos_recall_micro': 0.9675392670157068, 'eval_xpos_f1_micro': 0.9675392670157068, 'eval_deprel_accuracy': 0.9263627964274715, 'eval_deprel_precision_macro': 0.7986281863613143, 'eval_deprel_recall_macro': 0.7324776421481113, 'eval_deprel_f1_macro': 0.7424124247127928, 'eval_deprel_precision_micro': 0.9263627964274715, 'eval_deprel_recall_micro': 0.9263627964274715, 'eval_deprel_f1_micro': 0.9263627964274715, 'eval_pos_accuracy': 0.969664305512781, 'eval_pos_precision_macro': 0.9597509199987729, 'eval_pos_recall_macro': 0.9279522767919809, 'eval_pos_f1_macro': 0.9413842585004687, 'eval_pos_precision_micro': 0.969664305512781, 'eval_pos_recall_micro': 0.969664305512781, 'eval_pos_f1_micro': 0.969664305512781, 'eval_Case_accuracy': 0.998644902987373, 'eval_Case_precision_macro': 0.968321177469761, 'eval_Case_recall_macro': 0.9832535025864676, 'eval_Case_f1_macro': 0.975413333731463, 'eval_Case_precision_micro': 0.998644902987373, 'eval_Case_recall_micro': 0.998644902987373, 'eval_Case_f1_micro': 0.998644902987373, 'eval_Definite_accuracy': 0.9999692023406221, 'eval_Definite_precision_macro': 0.9997829861111112, 'eval_Definite_recall_macro': 0.9999889796233236, 'eval_Definite_f1_macro': 0.9998859474433567, 'eval_Definite_precision_micro': 0.9999692023406221, 'eval_Definite_recall_micro': 0.9999692023406221, 'eval_Definite_f1_micro': 0.9999692023406221, 'eval_Degree_accuracy': 0.9910994764397906, 'eval_Degree_precision_macro': 0.9490721872470783, 'eval_Degree_recall_macro': 0.9681919824291281, 'eval_Degree_f1_macro': 0.9584396894675267, 'eval_Degree_precision_micro': 0.9910994764397906, 'eval_Degree_recall_micro': 0.9910994764397906, 'eval_Degree_f1_micro': 0.9910994764397906, 'eval_Foreign_accuracy': 0.9995688327687096, 'eval_Foreign_precision_macro': 0.9997843499691929, 'eval_Foreign_recall_macro': 0.7083333333333334, 'eval_Foreign_f1_macro': 0.7940097987859366, 'eval_Foreign_precision_micro': 0.9995688327687096, 'eval_Foreign_recall_micro': 0.9995688327687096, 'eval_Foreign_f1_micro': 0.9995688327687096, 'eval_Gender_accuracy': 0.9999692023406221, 'eval_Gender_precision_macro': 0.9988584474885844, 'eval_Gender_recall_macro': 0.9999921580928481, 'eval_Gender_f1_macro': 0.9994239966050649, 'eval_Gender_precision_micro': 0.9999692023406221, 'eval_Gender_recall_micro': 0.9999692023406221, 'eval_Gender_f1_micro': 0.9999692023406221, 'eval_Mood_accuracy': 0.9960271019402526, 'eval_Mood_precision_macro': 0.9302300109068503, 'eval_Mood_recall_macro': 0.9503058715562149, 'eval_Mood_f1_macro': 0.9398033347625038, 'eval_Mood_precision_micro': 0.9960271019402526, 'eval_Mood_recall_micro': 0.9960271019402526, 'eval_Mood_f1_micro': 0.9960271019402526, 'eval_NumType_accuracy': 0.9987988912842624, 'eval_NumType_precision_macro': 0.6895853568005501, 'eval_NumType_recall_macro': 0.708916883576987, 'eval_NumType_f1_macro': 0.6989526751698049, 'eval_NumType_precision_micro': 0.9987988912842624, 'eval_NumType_recall_micro': 0.9987988912842624, 'eval_NumType_f1_micro': 0.9987988912842624, 'eval_Number_accuracy': 0.9887896519864491, 'eval_Number_precision_macro': 0.9851545742951385, 'eval_Number_recall_macro': 0.9852679994115098, 'eval_Number_f1_macro': 0.9852099196851308, 'eval_Number_precision_micro': 0.9887896519864491, 'eval_Number_recall_micro': 0.9887896519864491, 'eval_Number_f1_micro': 0.9887896519864491, 'eval_Person_accuracy': 0.9993532491530643, 'eval_Person_precision_macro': 0.9970752660644107, 'eval_Person_recall_macro': 0.9962361030426535, 'eval_Person_f1_macro': 0.9966506796725936, 'eval_Person_precision_micro': 0.9993532491530643, 'eval_Person_recall_micro': 0.9993532491530643, 'eval_Person_f1_micro': 0.9993532491530643, 'eval_Polarity_accuracy': 0.9996920234062211, 'eval_Polarity_precision_macro': 0.9389873962829686, 'eval_Polarity_recall_macro': 0.9389873962829686, 'eval_Polarity_f1_macro': 0.9389873962829686, 'eval_Polarity_precision_micro': 0.9996920234062211, 'eval_Polarity_recall_micro': 0.9996920234062211, 'eval_Polarity_f1_micro': 0.9996920234062211, 'eval_PronType_accuracy': 0.998090545118571, 'eval_PronType_precision_macro': 0.9686494447417681, 'eval_PronType_recall_macro': 0.9702883725094406, 'eval_PronType_f1_macro': 0.969388077882025, 'eval_PronType_precision_micro': 0.998090545118571, 'eval_PronType_recall_micro': 0.998090545118571, 'eval_PronType_f1_micro': 0.998090545118571, 'eval_Poss_accuracy': 0.9997536187249769, 'eval_Poss_precision_macro': 0.99458832399169, 'eval_Poss_recall_macro': 0.9966891310250018, 'eval_Poss_f1_macro': 0.9956364344952822, 'eval_Poss_precision_micro': 0.9997536187249769, 'eval_Poss_recall_micro': 0.9997536187249769, 'eval_Poss_f1_micro': 0.9997536187249769, 'eval_Reflex_accuracy': 0.9996920234062211, 'eval_Reflex_precision_macro': 0.9998459262911377, 'eval_Reflex_recall_macro': 0.8214285714285714, 'eval_Reflex_f1_macro': 0.8912272991004728, 'eval_Reflex_precision_micro': 0.9996920234062211, 'eval_Reflex_recall_micro': 0.9996920234062211, 'eval_Reflex_f1_micro': 0.9996920234062211, 'eval_Tense_accuracy': 0.9955959347089621, 'eval_Tense_precision_macro': 0.9788025068268645, 'eval_Tense_recall_macro': 0.989162555536469, 'eval_Tense_f1_macro': 0.9839336910315675, 'eval_Tense_precision_micro': 0.9955959347089621, 'eval_Tense_recall_micro': 0.9955959347089621, 'eval_Tense_f1_micro': 0.9955959347089621, 'eval_VerbForm_accuracy': 0.9915614413304589, 'eval_VerbForm_precision_macro': 0.9476096358002539, 'eval_VerbForm_recall_macro': 0.9552034318237569, 'eval_VerbForm_f1_macro': 0.9511549087013748, 'eval_VerbForm_precision_micro': 0.9915614413304589, 'eval_VerbForm_recall_micro': 0.9915614413304589, 'eval_VerbForm_f1_micro': 0.9915614413304589, 'eval_runtime': 184.9351, 'eval_samples_per_second': 12.94, 'eval_steps_per_second': 6.473, 'epoch': 5.41}
|
| 325 |
+
{'loss': 4.2362, 'grad_norm': 20.03514289855957, 'learning_rate': 1.3383838383838385e-05, 'epoch': 6.31}
|
| 326 |
+
{'eval_loss': 0.3454221487045288, 'eval_f1_macro': 0.927191178980668, 'eval_xpos_accuracy': 0.9697259008315368, 'eval_xpos_precision_macro': 0.9120176676761855, 'eval_xpos_recall_macro': 0.8727963832660698, 'eval_xpos_f1_macro': 0.8817950230513683, 'eval_xpos_precision_micro': 0.9697259008315368, 'eval_xpos_recall_micro': 0.9697259008315368, 'eval_xpos_f1_micro': 0.9697259008315368, 'eval_deprel_accuracy': 0.9314752078842008, 'eval_deprel_precision_macro': 0.852884091184579, 'eval_deprel_recall_macro': 0.7606003458175867, 'eval_deprel_f1_macro': 0.7830208706525961, 'eval_deprel_precision_micro': 0.9314752078842008, 'eval_deprel_recall_micro': 0.9314752078842008, 'eval_deprel_f1_micro': 0.9314752078842008, 'eval_pos_accuracy': 0.9713889744379427, 'eval_pos_precision_macro': 0.9637647444684193, 'eval_pos_recall_macro': 0.9316105534958254, 'eval_pos_f1_macro': 0.9452720649009796, 'eval_pos_precision_micro': 0.9713889744379427, 'eval_pos_recall_micro': 0.9713889744379427, 'eval_pos_f1_micro': 0.9713889744379427, 'eval_Case_accuracy': 0.998644902987373, 'eval_Case_precision_macro': 0.9693356623836876, 'eval_Case_recall_macro': 0.9820723427139589, 'eval_Case_f1_macro': 0.9754485543666854, 'eval_Case_precision_micro': 0.998644902987373, 'eval_Case_recall_micro': 0.998644902987373, 'eval_Case_f1_micro': 0.998644902987373, 'eval_Definite_accuracy': 1.0, 'eval_Definite_precision_macro': 1.0, 'eval_Definite_recall_macro': 1.0, 'eval_Definite_f1_macro': 1.0, 'eval_Definite_precision_micro': 1.0, 'eval_Definite_recall_micro': 1.0, 'eval_Definite_f1_micro': 1.0, 'eval_Degree_accuracy': 0.99125346473668, 'eval_Degree_precision_macro': 0.9518965711368261, 'eval_Degree_recall_macro': 0.9653518811561206, 'eval_Degree_f1_macro': 0.9585419040234433, 'eval_Degree_precision_micro': 0.99125346473668, 'eval_Degree_recall_micro': 0.99125346473668, 'eval_Degree_f1_micro': 0.99125346473668, 'eval_Foreign_accuracy': 0.9995688327687096, 'eval_Foreign_precision_macro': 0.9997843499691929, 'eval_Foreign_recall_macro': 0.7083333333333334, 'eval_Foreign_f1_macro': 0.7940097987859366, 'eval_Foreign_precision_micro': 0.9995688327687096, 'eval_Foreign_recall_micro': 0.9995688327687096, 'eval_Foreign_f1_micro': 0.9995688327687096, 'eval_Gender_accuracy': 0.9999692023406221, 'eval_Gender_precision_macro': 0.9988584474885844, 'eval_Gender_recall_macro': 0.9999921580928481, 'eval_Gender_f1_macro': 0.9994239966050649, 'eval_Gender_precision_micro': 0.9999692023406221, 'eval_Gender_recall_micro': 0.9999692023406221, 'eval_Gender_f1_micro': 0.9999692023406221, 'eval_Mood_accuracy': 0.9959963042808746, 'eval_Mood_precision_macro': 0.9255401109080846, 'eval_Mood_recall_macro': 0.9590927802520216, 'eval_Mood_f1_macro': 0.9411842210866329, 'eval_Mood_precision_micro': 0.9959963042808746, 'eval_Mood_recall_micro': 0.9959963042808746, 'eval_Mood_f1_micro': 0.9959963042808746, 'eval_NumType_accuracy': 0.9987680936248845, 'eval_NumType_precision_macro': 0.685465227290188, 'eval_NumType_recall_macro': 0.708428602326987, 'eval_NumType_f1_macro': 0.6964556489152147, 'eval_NumType_precision_micro': 0.9987680936248845, 'eval_NumType_recall_micro': 0.9987680936248845, 'eval_NumType_f1_micro': 0.9987680936248845, 'eval_Number_accuracy': 0.9892208192177394, 'eval_Number_precision_macro': 0.9864998826772883, 'eval_Number_recall_macro': 0.9855751060999873, 'eval_Number_f1_macro': 0.9860361829601003, 'eval_Number_precision_micro': 0.9892208192177394, 'eval_Number_recall_micro': 0.9892208192177394, 'eval_Number_f1_micro': 0.9892208192177394, 'eval_Person_accuracy': 0.9993532491530643, 'eval_Person_precision_macro': 0.9967006676877255, 'eval_Person_recall_macro': 0.9967403582439176, 'eval_Person_f1_macro': 0.996719094352911, 'eval_Person_precision_micro': 0.9993532491530643, 'eval_Person_recall_micro': 0.9993532491530643, 'eval_Person_f1_micro': 0.9993532491530643, 'eval_Polarity_accuracy': 0.9996304280874654, 'eval_Polarity_precision_macro': 0.9611195676225487, 'eval_Polarity_recall_macro': 0.9076163434528012, 'eval_Polarity_f1_macro': 0.9320855951152653, 'eval_Polarity_precision_micro': 0.9996304280874654, 'eval_Polarity_recall_micro': 0.9996304280874654, 'eval_Polarity_f1_micro': 0.9996304280874654, 'eval_PronType_accuracy': 0.9981829380967047, 'eval_PronType_precision_macro': 0.9693779325345468, 'eval_PronType_recall_macro': 0.9756421815451005, 'eval_PronType_f1_macro': 0.9723088141352486, 'eval_PronType_precision_micro': 0.9981829380967047, 'eval_PronType_recall_micro': 0.9981829380967047, 'eval_PronType_f1_micro': 0.9981829380967047, 'eval_Poss_accuracy': 0.9997228210655991, 'eval_Poss_precision_macro': 0.9935291465247402, 'eval_Poss_recall_macro': 0.9966735089541401, 'eval_Poss_f1_macro': 0.9950961850339957, 'eval_Poss_precision_micro': 0.9997228210655991, 'eval_Poss_recall_micro': 0.9997228210655991, 'eval_Poss_f1_micro': 0.9997228210655991, 'eval_Reflex_accuracy': 0.9996920234062211, 'eval_Reflex_precision_macro': 0.9998459262911377, 'eval_Reflex_recall_macro': 0.8214285714285714, 'eval_Reflex_f1_macro': 0.8912272991004728, 'eval_Reflex_precision_micro': 0.9996920234062211, 'eval_Reflex_recall_micro': 0.9996920234062211, 'eval_Reflex_f1_micro': 0.9996920234062211, 'eval_Tense_accuracy': 0.9959347089621189, 'eval_Tense_precision_macro': 0.9805174402763704, 'eval_Tense_recall_macro': 0.9900407100646563, 'eval_Tense_f1_macro': 0.9852373030182698, 'eval_Tense_precision_micro': 0.9959347089621189, 'eval_Tense_recall_micro': 0.9959347089621189, 'eval_Tense_f1_micro': 0.9959347089621189, 'eval_VerbForm_accuracy': 0.9924237757930398, 'eval_VerbForm_precision_macro': 0.9582794436379263, 'eval_VerbForm_recall_macro': 0.953610611651494, 'eval_VerbForm_f1_macro': 0.9555786655478402, 'eval_VerbForm_precision_micro': 0.9924237757930398, 'eval_VerbForm_recall_micro': 0.9924237757930398, 'eval_VerbForm_f1_micro': 0.9924237757930398, 'eval_runtime': 185.1084, 'eval_samples_per_second': 12.928, 'eval_steps_per_second': 6.466, 'epoch': 6.31}
|
| 327 |
+
{'loss': 3.8109, 'grad_norm': 12.93899917602539, 'learning_rate': 1.2121212121212122e-05, 'epoch': 7.21}
|
| 328 |
+
{'eval_loss': 0.32562968134880066, 'eval_f1_macro': 0.9343274107120304, 'eval_xpos_accuracy': 0.969941484447182, 'eval_xpos_precision_macro': 0.9120132506574007, 'eval_xpos_recall_macro': 0.8831554189840309, 'eval_xpos_f1_macro': 0.8874732055833041, 'eval_xpos_precision_micro': 0.969941484447182, 'eval_xpos_recall_micro': 0.969941484447182, 'eval_xpos_f1_micro': 0.969941484447182, 'eval_deprel_accuracy': 0.9351093316907915, 'eval_deprel_precision_macro': 0.8449162056679124, 'eval_deprel_recall_macro': 0.8036792440436371, 'eval_deprel_f1_macro': 0.8179579679191769, 'eval_deprel_precision_micro': 0.9351093316907915, 'eval_deprel_recall_micro': 0.9351093316907915, 'eval_deprel_f1_micro': 0.9351093316907915, 'eval_pos_accuracy': 0.9709270095472744, 'eval_pos_precision_macro': 0.9594838943585567, 'eval_pos_recall_macro': 0.933477064749745, 'eval_pos_f1_macro': 0.9448065605920223, 'eval_pos_precision_micro': 0.9709270095472744, 'eval_pos_recall_micro': 0.9709270095472744, 'eval_pos_f1_micro': 0.9709270095472744, 'eval_Case_accuracy': 0.9986757006467508, 'eval_Case_precision_macro': 0.9696845938686529, 'eval_Case_recall_macro': 0.9828049257982774, 'eval_Case_f1_macro': 0.9759597233287761, 'eval_Case_precision_micro': 0.9986757006467508, 'eval_Case_recall_micro': 0.9986757006467508, 'eval_Case_f1_micro': 0.9986757006467508, 'eval_Definite_accuracy': 0.9999384046812442, 'eval_Definite_precision_macro': 0.9995662546085448, 'eval_Definite_recall_macro': 0.999977959246647, 'eval_Definite_f1_macro': 0.9997719653700766, 'eval_Definite_precision_micro': 0.9999384046812442, 'eval_Definite_recall_micro': 0.9999384046812442, 'eval_Definite_f1_micro': 0.9999384046812442, 'eval_Degree_accuracy': 0.991530643671081, 'eval_Degree_precision_macro': 0.9520605462601486, 'eval_Degree_recall_macro': 0.9605721279700763, 'eval_Degree_f1_macro': 0.956286381013717, 'eval_Degree_precision_micro': 0.991530643671081, 'eval_Degree_recall_micro': 0.991530643671081, 'eval_Degree_f1_micro': 0.991530643671081, 'eval_Foreign_accuracy': 0.9995380351093317, 'eval_Foreign_precision_macro': 0.9543297978708805, 'eval_Foreign_recall_macro': 0.7083179231132753, 'eval_Foreign_f1_macro': 0.7855987322130147, 'eval_Foreign_precision_micro': 0.9995380351093317, 'eval_Foreign_recall_micro': 0.9995380351093317, 'eval_Foreign_f1_micro': 0.9995380351093317, 'eval_Gender_accuracy': 0.9999692023406221, 'eval_Gender_precision_macro': 0.9988584474885844, 'eval_Gender_recall_macro': 0.9999921580928481, 'eval_Gender_f1_macro': 0.9994239966050649, 'eval_Gender_precision_micro': 0.9999692023406221, 'eval_Gender_recall_micro': 0.9999692023406221, 'eval_Gender_f1_micro': 0.9999692023406221, 'eval_Mood_accuracy': 0.996181090237142, 'eval_Mood_precision_macro': 0.9327497736806049, 'eval_Mood_recall_macro': 0.9520232217608294, 'eval_Mood_f1_macro': 0.9419627283644093, 'eval_Mood_precision_micro': 0.996181090237142, 'eval_Mood_recall_micro': 0.996181090237142, 'eval_Mood_f1_micro': 0.996181090237142, 'eval_NumType_accuracy': 0.9989220819217739, 'eval_NumType_precision_macro': 0.9457750146330861, 'eval_NumType_recall_macro': 0.7584599365376782, 'eval_NumType_f1_macro': 0.7853160162000002, 'eval_NumType_precision_micro': 0.9989220819217739, 'eval_NumType_recall_micro': 0.9989220819217739, 'eval_NumType_f1_micro': 0.9989220819217739, 'eval_Number_accuracy': 0.9894979981521405, 'eval_Number_precision_macro': 0.9854504781790397, 'eval_Number_recall_macro': 0.9876534934419489, 'eval_Number_f1_macro': 0.9865476985437925, 'eval_Number_precision_micro': 0.9894979981521405, 'eval_Number_recall_micro': 0.9894979981521405, 'eval_Number_f1_micro': 0.9894979981521405, 'eval_Person_accuracy': 0.9993840468124423, 'eval_Person_precision_macro': 0.9973462143399449, 'eval_Person_recall_macro': 0.9964300765220414, 'eval_Person_f1_macro': 0.9968851195932011, 'eval_Person_precision_micro': 0.9993840468124423, 'eval_Person_recall_micro': 0.9993840468124423, 'eval_Person_f1_micro': 0.9993840468124423, 'eval_Polarity_accuracy': 0.9997536187249769, 'eval_Polarity_precision_macro': 0.9642793114060918, 'eval_Polarity_recall_macro': 0.9407995266359843, 'eval_Polarity_f1_macro': 0.9519880619426493, 'eval_Polarity_precision_micro': 0.9997536187249769, 'eval_Polarity_recall_micro': 0.9997536187249769, 'eval_Polarity_f1_micro': 0.9997536187249769, 'eval_PronType_accuracy': 0.9982445334154604, 'eval_PronType_precision_macro': 0.9704384701653251, 'eval_PronType_recall_macro': 0.9756526090737763, 'eval_PronType_f1_macro': 0.9728708374812266, 'eval_PronType_precision_micro': 0.9982445334154604, 'eval_PronType_recall_micro': 0.9982445334154604, 'eval_PronType_f1_micro': 0.9982445334154604, 'eval_Poss_accuracy': 0.9997536187249769, 'eval_Poss_precision_macro': 0.99458832399169, 'eval_Poss_recall_macro': 0.9966891310250018, 'eval_Poss_f1_macro': 0.9956364344952822, 'eval_Poss_precision_micro': 0.9997536187249769, 'eval_Poss_recall_micro': 0.9997536187249769, 'eval_Poss_f1_micro': 0.9997536187249769, 'eval_Reflex_accuracy': 0.9996612257468432, 'eval_Reflex_precision_macro': 0.9735301320695655, 'eval_Reflex_recall_macro': 0.8214131593084801, 'eval_Reflex_f1_macro': 0.8828939685000283, 'eval_Reflex_precision_micro': 0.9996612257468432, 'eval_Reflex_recall_micro': 0.9996612257468432, 'eval_Reflex_f1_micro': 0.9996612257468432, 'eval_Tense_accuracy': 0.9957191253464737, 'eval_Tense_precision_macro': 0.9822411548842864, 'eval_Tense_recall_macro': 0.9865943659022381, 'eval_Tense_f1_macro': 0.9844041844217392, 'eval_Tense_precision_micro': 0.9957191253464737, 'eval_Tense_recall_micro': 0.9957191253464737, 'eval_Tense_f1_micro': 0.9957191253464737, 'eval_VerbForm_accuracy': 0.9918694179242378, 'eval_VerbForm_precision_macro': 0.9504650929123184, 'eval_VerbForm_recall_macro': 0.9540288308710366, 'eval_VerbForm_f1_macro': 0.9521098106490633, 'eval_VerbForm_precision_micro': 0.9918694179242378, 'eval_VerbForm_recall_micro': 0.9918694179242378, 'eval_VerbForm_f1_micro': 0.9918694179242378, 'eval_runtime': 184.4327, 'eval_samples_per_second': 12.975, 'eval_steps_per_second': 6.49, 'epoch': 7.21}
|
| 329 |
+
{'loss': 3.3362, 'grad_norm': 13.36613941192627, 'learning_rate': 1.0858585858585859e-05, 'epoch': 8.11}
|
| 330 |
+
{'eval_loss': 0.318782776594162, 'eval_f1_macro': 0.9444604092302595, 'eval_xpos_accuracy': 0.9703418540190946, 'eval_xpos_precision_macro': 0.9067546860794263, 'eval_xpos_recall_macro': 0.8859339224699845, 'eval_xpos_f1_macro': 0.8878404824411606, 'eval_xpos_precision_micro': 0.9703418540190946, 'eval_xpos_recall_micro': 0.9703418540190946, 'eval_xpos_f1_micro': 0.9703418540190946, 'eval_deprel_accuracy': 0.9370187865722205, 'eval_deprel_precision_macro': 0.850309057220788, 'eval_deprel_recall_macro': 0.8171501306733592, 'eval_deprel_f1_macro': 0.8269662033561302, 'eval_deprel_precision_micro': 0.9370187865722205, 'eval_deprel_recall_micro': 0.9370187865722205, 'eval_deprel_f1_micro': 0.9370187865722205, 'eval_pos_accuracy': 0.9712041884816754, 'eval_pos_precision_macro': 0.9600750938532333, 'eval_pos_recall_macro': 0.9384310813774656, 'eval_pos_f1_macro': 0.9480806877889156, 'eval_pos_precision_micro': 0.9712041884816754, 'eval_pos_recall_micro': 0.9712041884816754, 'eval_pos_f1_micro': 0.9712041884816754, 'eval_Case_accuracy': 0.9987064983061288, 'eval_Case_precision_macro': 0.9708137462083638, 'eval_Case_recall_macro': 0.98281570805069, 'eval_Case_f1_macro': 0.9765522821985616, 'eval_Case_precision_micro': 0.9987064983061288, 'eval_Case_recall_micro': 0.9987064983061288, 'eval_Case_f1_micro': 0.9987064983061288, 'eval_Definite_accuracy': 0.9999384046812442, 'eval_Definite_precision_macro': 0.9995662546085448, 'eval_Definite_recall_macro': 0.999977959246647, 'eval_Definite_f1_macro': 0.9997719653700766, 'eval_Definite_precision_micro': 0.9999384046812442, 'eval_Definite_recall_micro': 0.9999384046812442, 'eval_Definite_f1_micro': 0.9999384046812442, 'eval_Degree_accuracy': 0.9914074530335695, 'eval_Degree_precision_macro': 0.9497400666000834, 'eval_Degree_recall_macro': 0.9687802361050675, 'eval_Degree_f1_macro': 0.9590687937319229, 'eval_Degree_precision_micro': 0.9914074530335695, 'eval_Degree_recall_micro': 0.9914074530335695, 'eval_Degree_f1_micro': 0.9914074530335695, 'eval_Foreign_accuracy': 0.9995072374499538, 'eval_Foreign_precision_macro': 0.9164510033479163, 'eval_Foreign_recall_macro': 0.7083025128932174, 'eval_Foreign_f1_macro': 0.7776545188106879, 'eval_Foreign_precision_micro': 0.9995072374499538, 'eval_Foreign_recall_micro': 0.9995072374499538, 'eval_Foreign_f1_micro': 0.9995072374499538, 'eval_Gender_accuracy': 0.9999692023406221, 'eval_Gender_precision_macro': 0.9988584474885844, 'eval_Gender_recall_macro': 0.9999921580928481, 'eval_Gender_f1_macro': 0.9994239966050649, 'eval_Gender_precision_micro': 0.9999692023406221, 'eval_Gender_recall_micro': 0.9999692023406221, 'eval_Gender_f1_micro': 0.9999692023406221, 'eval_Mood_accuracy': 0.9960578995996304, 'eval_Mood_precision_macro': 0.9280289563037746, 'eval_Mood_recall_macro': 0.9585945146110123, 'eval_Mood_f1_macro': 0.9423008128801754, 'eval_Mood_precision_micro': 0.9960578995996304, 'eval_Mood_recall_micro': 0.9960578995996304, 'eval_Mood_f1_micro': 0.9960578995996304, 'eval_NumType_accuracy': 0.9987680936248845, 'eval_NumType_precision_macro': 0.9373268715970364, 'eval_NumType_recall_macro': 0.8515222311140578, 'eval_NumType_f1_macro': 0.8817809124674306, 'eval_NumType_precision_micro': 0.9987680936248845, 'eval_NumType_recall_micro': 0.9987680936248845, 'eval_NumType_f1_micro': 0.9987680936248845, 'eval_Number_accuracy': 0.9896827841084077, 'eval_Number_precision_macro': 0.9857473453854567, 'eval_Number_recall_macro': 0.9873716159710328, 'eval_Number_f1_macro': 0.9865562160799088, 'eval_Number_precision_micro': 0.9896827841084077, 'eval_Number_recall_micro': 0.9896827841084077, 'eval_Number_f1_micro': 0.9896827841084077, 'eval_Person_accuracy': 0.9994148444718202, 'eval_Person_precision_macro': 0.9974306500729042, 'eval_Person_recall_macro': 0.9963725714286156, 'eval_Person_f1_macro': 0.9968999846117008, 'eval_Person_precision_micro': 0.9994148444718202, 'eval_Person_recall_micro': 0.9994148444718202, 'eval_Person_f1_micro': 0.9994148444718202, 'eval_Polarity_accuracy': 0.9997844163843548, 'eval_Polarity_precision_macro': 0.9469839492721027, 'eval_Polarity_recall_macro': 0.9963447536403258, 'eval_Polarity_f1_macro': 0.969830459766524, 'eval_Polarity_precision_micro': 0.9997844163843548, 'eval_Polarity_recall_micro': 0.9997844163843548, 'eval_Polarity_f1_micro': 0.9997844163843548, 'eval_PronType_accuracy': 0.9980597474591931, 'eval_PronType_precision_macro': 0.9690374012959582, 'eval_PronType_recall_macro': 0.9750193422251782, 'eval_PronType_f1_macro': 0.9717234267249184, 'eval_PronType_precision_micro': 0.9980597474591931, 'eval_PronType_recall_micro': 0.9980597474591931, 'eval_PronType_f1_micro': 0.9980597474591931, 'eval_Poss_accuracy': 0.9997228210655991, 'eval_Poss_precision_macro': 0.9935291465247402, 'eval_Poss_recall_macro': 0.9966735089541401, 'eval_Poss_f1_macro': 0.9950961850339957, 'eval_Poss_precision_micro': 0.9997228210655991, 'eval_Poss_recall_micro': 0.9997228210655991, 'eval_Poss_f1_micro': 0.9997228210655991, 'eval_Reflex_accuracy': 0.9998152140437326, 'eval_Reflex_precision_macro': 0.9999075443786982, 'eval_Reflex_recall_macro': 0.8928571428571428, 'eval_Reflex_f1_macro': 0.939953767914933, 'eval_Reflex_precision_micro': 0.9998152140437326, 'eval_Reflex_recall_micro': 0.9998152140437326, 'eval_Reflex_f1_micro': 0.9998152140437326, 'eval_Tense_accuracy': 0.9957807206652295, 'eval_Tense_precision_macro': 0.9821169096222659, 'eval_Tense_recall_macro': 0.9870041180022177, 'eval_Tense_f1_macro': 0.9845415003770398, 'eval_Tense_precision_micro': 0.9957807206652295, 'eval_Tense_recall_micro': 0.9957807206652295, 'eval_Tense_f1_micro': 0.9957807206652295, 'eval_VerbForm_accuracy': 0.9925777640899291, 'eval_VerbForm_precision_macro': 0.9570466310356014, 'eval_VerbForm_recall_macro': 0.9561143233389743, 'eval_VerbForm_f1_macro': 0.9562451699855259, 'eval_VerbForm_precision_micro': 0.9925777640899291, 'eval_VerbForm_recall_micro': 0.9925777640899291, 'eval_VerbForm_f1_micro': 0.9925777640899291, 'eval_runtime': 185.1011, 'eval_samples_per_second': 12.928, 'eval_steps_per_second': 6.467, 'epoch': 8.11}
|
| 331 |
+
{'loss': 3.1033, 'grad_norm': 13.85925579071045, 'learning_rate': 9.595959595959597e-06, 'epoch': 9.01}
|
| 332 |
+
{'eval_loss': 0.3151477873325348, 'eval_f1_macro': 0.942692252157889, 'eval_xpos_accuracy': 0.970495842315984, 'eval_xpos_precision_macro': 0.911908180607385, 'eval_xpos_recall_macro': 0.8836936795114333, 'eval_xpos_f1_macro': 0.8885261035686352, 'eval_xpos_precision_micro': 0.970495842315984, 'eval_xpos_recall_micro': 0.970495842315984, 'eval_xpos_f1_micro': 0.970495842315984, 'eval_deprel_accuracy': 0.9376655374191561, 'eval_deprel_precision_macro': 0.8509459371299838, 'eval_deprel_recall_macro': 0.8194806778104807, 'eval_deprel_f1_macro': 0.8296227859135632, 'eval_deprel_precision_micro': 0.9376655374191561, 'eval_deprel_recall_micro': 0.9376655374191561, 'eval_deprel_f1_micro': 0.9376655374191561, 'eval_pos_accuracy': 0.9710502001847859, 'eval_pos_precision_macro': 0.9589918963020603, 'eval_pos_recall_macro': 0.9412381151643018, 'eval_pos_f1_macro': 0.9491567771368662, 'eval_pos_precision_micro': 0.9710502001847859, 'eval_pos_recall_micro': 0.9710502001847859, 'eval_pos_f1_micro': 0.9710502001847859, 'eval_Case_accuracy': 0.9986757006467508, 'eval_Case_precision_macro': 0.9701302415450517, 'eval_Case_recall_macro': 0.9813613241344653, 'eval_Case_f1_macro': 0.9755388584672033, 'eval_Case_precision_micro': 0.9986757006467508, 'eval_Case_recall_micro': 0.9986757006467508, 'eval_Case_f1_micro': 0.9986757006467508, 'eval_Definite_accuracy': 1.0, 'eval_Definite_precision_macro': 1.0, 'eval_Definite_recall_macro': 1.0, 'eval_Definite_f1_macro': 1.0, 'eval_Definite_precision_micro': 1.0, 'eval_Definite_recall_micro': 1.0, 'eval_Definite_f1_micro': 1.0, 'eval_Degree_accuracy': 0.9916846319679704, 'eval_Degree_precision_macro': 0.9434136824501856, 'eval_Degree_recall_macro': 0.9787123487463447, 'eval_Degree_f1_macro': 0.9602697061746015, 'eval_Degree_precision_micro': 0.9916846319679704, 'eval_Degree_recall_micro': 0.9916846319679704, 'eval_Degree_f1_micro': 0.9916846319679704, 'eval_Foreign_accuracy': 0.999445642131198, 'eval_Foreign_precision_macro': 0.8569271805345259, 'eval_Foreign_recall_macro': 0.7082716924531016, 'eval_Foreign_f1_macro': 0.763019224125767, 'eval_Foreign_precision_micro': 0.999445642131198, 'eval_Foreign_recall_micro': 0.999445642131198, 'eval_Foreign_f1_micro': 0.999445642131198, 'eval_Gender_accuracy': 1.0, 'eval_Gender_precision_macro': 1.0, 'eval_Gender_recall_macro': 1.0, 'eval_Gender_f1_macro': 1.0, 'eval_Gender_precision_micro': 1.0, 'eval_Gender_recall_micro': 1.0, 'eval_Gender_f1_micro': 1.0, 'eval_Mood_accuracy': 0.9963350785340314, 'eval_Mood_precision_macro': 0.9363704872285137, 'eval_Mood_recall_macro': 0.9588250782318645, 'eval_Mood_f1_macro': 0.9470253229783157, 'eval_Mood_precision_micro': 0.9963350785340314, 'eval_Mood_recall_micro': 0.9963350785340314, 'eval_Mood_f1_micro': 0.9963350785340314, 'eval_NumType_accuracy': 0.9988296889436403, 'eval_NumType_precision_macro': 0.9354688010896874, 'eval_NumType_recall_macro': 0.857940321076987, 'eval_NumType_f1_macro': 0.8837162871051388, 'eval_NumType_precision_micro': 0.9988296889436403, 'eval_NumType_recall_micro': 0.9988296889436403, 'eval_NumType_f1_micro': 0.9988296889436403, 'eval_Number_accuracy': 0.9898983677240529, 'eval_Number_precision_macro': 0.9870713706171018, 'eval_Number_recall_macro': 0.9869202142599658, 'eval_Number_f1_macro': 0.9869954318842113, 'eval_Number_precision_micro': 0.9898983677240529, 'eval_Number_recall_micro': 0.9898983677240529, 'eval_Number_f1_micro': 0.9898983677240529, 'eval_Person_accuracy': 0.9992916538343086, 'eval_Person_precision_macro': 0.9961800730224175, 'eval_Person_recall_macro': 0.9965091616552784, 'eval_Person_f1_macro': 0.996343777435336, 'eval_Person_precision_micro': 0.9992916538343086, 'eval_Person_recall_micro': 0.9992916538343086, 'eval_Person_f1_micro': 0.9992916538343086, 'eval_Polarity_accuracy': 0.9997228210655991, 'eval_Polarity_precision_macro': 0.911269662277352, 'eval_Polarity_recall_macro': 0.9963240965378976, 'eval_Polarity_f1_macro': 0.9478421073168656, 'eval_Polarity_precision_micro': 0.9997228210655991, 'eval_Polarity_recall_micro': 0.9997228210655991, 'eval_Polarity_f1_micro': 0.9997228210655991, 'eval_PronType_accuracy': 0.9982445334154604, 'eval_PronType_precision_macro': 0.9701289081950613, 'eval_PronType_recall_macro': 0.9790848926801193, 'eval_PronType_f1_macro': 0.9743844897706104, 'eval_PronType_precision_micro': 0.9982445334154604, 'eval_PronType_recall_micro': 0.9982445334154604, 'eval_PronType_f1_micro': 0.9982445334154604, 'eval_Poss_accuracy': 0.9997228210655991, 'eval_Poss_precision_macro': 0.9935291465247402, 'eval_Poss_recall_macro': 0.9966735089541401, 'eval_Poss_f1_macro': 0.9950961850339957, 'eval_Poss_precision_micro': 0.9997228210655991, 'eval_Poss_recall_micro': 0.9997228210655991, 'eval_Poss_f1_micro': 0.9997228210655991, 'eval_Reflex_accuracy': 0.9997844163843548, 'eval_Reflex_precision_macro': 0.9781684110944805, 'eval_Reflex_recall_macro': 0.8928417307370515, 'eval_Reflex_f1_macro': 0.9313186107558036, 'eval_Reflex_precision_micro': 0.9997844163843548, 'eval_Reflex_recall_micro': 0.9997844163843548, 'eval_Reflex_f1_micro': 0.9997844163843548, 'eval_Tense_accuracy': 0.9958423159839852, 'eval_Tense_precision_macro': 0.9833070480370499, 'eval_Tense_recall_macro': 0.986425438189512, 'eval_Tense_f1_macro': 0.9848537344015487, 'eval_Tense_precision_micro': 0.9958423159839852, 'eval_Tense_recall_micro': 0.9958423159839852, 'eval_Tense_f1_micro': 0.9958423159839852, 'eval_VerbForm_accuracy': 0.9922081921773945, 'eval_VerbForm_precision_macro': 0.9553859470957711, 'eval_VerbForm_recall_macro': 0.9548608288657796, 'eval_VerbForm_f1_macro': 0.9547511367735366, 'eval_VerbForm_precision_micro': 0.9922081921773945, 'eval_VerbForm_recall_micro': 0.9922081921773945, 'eval_VerbForm_f1_micro': 0.9922081921773945, 'eval_runtime': 184.365, 'eval_samples_per_second': 12.98, 'eval_steps_per_second': 6.493, 'epoch': 9.01}
|
| 333 |
+
{'loss': 2.848, 'grad_norm': 17.504152297973633, 'learning_rate': 8.333333333333334e-06, 'epoch': 9.92}
|
| 334 |
+
{'eval_loss': 0.314317524433136, 'eval_f1_macro': 0.9460086463259283, 'eval_xpos_accuracy': 0.9710809978441638, 'eval_xpos_precision_macro': 0.9137396425878821, 'eval_xpos_recall_macro': 0.8854906836774519, 'eval_xpos_f1_macro': 0.8917355451742601, 'eval_xpos_precision_micro': 0.9710809978441638, 'eval_xpos_recall_micro': 0.9710809978441638, 'eval_xpos_f1_micro': 0.9710809978441638, 'eval_deprel_accuracy': 0.938527871881737, 'eval_deprel_precision_macro': 0.8460564822586644, 'eval_deprel_recall_macro': 0.8277387909790447, 'eval_deprel_f1_macro': 0.8336886497350202, 'eval_deprel_precision_micro': 0.938527871881737, 'eval_deprel_recall_micro': 0.938527871881737, 'eval_deprel_f1_micro': 0.938527871881737, 'eval_pos_accuracy': 0.9717585463504773, 'eval_pos_precision_macro': 0.961167870210762, 'eval_pos_recall_macro': 0.9397784984412278, 'eval_pos_f1_macro': 0.949236482785107, 'eval_pos_precision_micro': 0.9717585463504773, 'eval_pos_recall_micro': 0.9717585463504773, 'eval_pos_f1_micro': 0.9717585463504773, 'eval_Case_accuracy': 0.998644902987373, 'eval_Case_precision_macro': 0.9693356623836876, 'eval_Case_recall_macro': 0.9820723427139589, 'eval_Case_f1_macro': 0.9754485543666854, 'eval_Case_precision_micro': 0.998644902987373, 'eval_Case_recall_micro': 0.998644902987373, 'eval_Case_f1_micro': 0.998644902987373, 'eval_Definite_accuracy': 0.9999692023406221, 'eval_Definite_precision_macro': 0.9997829861111112, 'eval_Definite_recall_macro': 0.9999889796233236, 'eval_Definite_f1_macro': 0.9998859474433567, 'eval_Definite_precision_micro': 0.9999692023406221, 'eval_Definite_recall_micro': 0.9999692023406221, 'eval_Definite_f1_micro': 0.9999692023406221, 'eval_Degree_accuracy': 0.9919310132429935, 'eval_Degree_precision_macro': 0.9553974962716711, 'eval_Degree_recall_macro': 0.9665450629560749, 'eval_Degree_f1_macro': 0.9608944646110371, 'eval_Degree_precision_micro': 0.9919310132429935, 'eval_Degree_recall_micro': 0.9919310132429935, 'eval_Degree_f1_micro': 0.9919310132429935, 'eval_Foreign_accuracy': 0.9994764397905759, 'eval_Foreign_precision_macro': 0.8843997146520486, 'eval_Foreign_recall_macro': 0.7082871026731595, 'eval_Foreign_f1_macro': 0.7701393055999161, 'eval_Foreign_precision_micro': 0.9994764397905759, 'eval_Foreign_recall_micro': 0.9994764397905759, 'eval_Foreign_f1_micro': 0.9994764397905759, 'eval_Gender_accuracy': 0.9999692023406221, 'eval_Gender_precision_macro': 0.9988584474885844, 'eval_Gender_recall_macro': 0.9999921580928481, 'eval_Gender_f1_macro': 0.9994239966050649, 'eval_Gender_precision_micro': 0.9999692023406221, 'eval_Gender_recall_micro': 0.9999692023406221, 'eval_Gender_f1_micro': 0.9999692023406221, 'eval_Mood_accuracy': 0.9965814598090545, 'eval_Mood_precision_macro': 0.9486490142205692, 'eval_Mood_recall_macro': 0.9548406689193548, 'eval_Mood_f1_macro': 0.9516786862543589, 'eval_Mood_precision_micro': 0.9965814598090545, 'eval_Mood_recall_micro': 0.9965814598090545, 'eval_Mood_f1_micro': 0.9965814598090545, 'eval_NumType_accuracy': 0.9987372959655066, 'eval_NumType_precision_macro': 0.932681107169649, 'eval_NumType_recall_macro': 0.851514397561385, 'eval_NumType_f1_macro': 0.8793078568809536, 'eval_NumType_precision_micro': 0.9987372959655066, 'eval_NumType_recall_micro': 0.9987372959655066, 'eval_NumType_f1_micro': 0.9987372959655066, 'eval_Number_accuracy': 0.9901447489990761, 'eval_Number_precision_macro': 0.987288893567103, 'eval_Number_recall_macro': 0.9875638297075651, 'eval_Number_f1_macro': 0.9874261583212006, 'eval_Number_precision_micro': 0.9901447489990761, 'eval_Number_recall_micro': 0.9901447489990761, 'eval_Number_f1_micro': 0.9901447489990761, 'eval_Person_accuracy': 0.9992608561749307, 'eval_Person_precision_macro': 0.996170253521355, 'eval_Person_recall_macro': 0.9959304579515746, 'eval_Person_f1_macro': 0.9960485111224247, 'eval_Person_precision_micro': 0.9992608561749307, 'eval_Person_recall_micro': 0.9992608561749307, 'eval_Person_f1_micro': 0.9992608561749307, 'eval_Polarity_accuracy': 0.9998152140437326, 'eval_Polarity_precision_macro': 0.9689619718902976, 'eval_Polarity_recall_macro': 0.99635508219154, 'eval_Polarity_f1_macro': 0.9821433170699548, 'eval_Polarity_precision_micro': 0.9998152140437326, 'eval_Polarity_recall_micro': 0.9998152140437326, 'eval_Polarity_f1_micro': 0.9998152140437326, 'eval_PronType_accuracy': 0.9982753310748383, 'eval_PronType_precision_macro': 0.9705509621204504, 'eval_PronType_recall_macro': 0.9801802716601138, 'eval_PronType_f1_macro': 0.975037572765203, 'eval_PronType_precision_micro': 0.9982753310748383, 'eval_PronType_recall_micro': 0.9982753310748383, 'eval_PronType_f1_micro': 0.9982753310748383, 'eval_Poss_accuracy': 0.9997228210655991, 'eval_Poss_precision_macro': 0.9935291465247402, 'eval_Poss_recall_macro': 0.9966735089541401, 'eval_Poss_f1_macro': 0.9950961850339957, 'eval_Poss_precision_micro': 0.9997228210655991, 'eval_Poss_recall_micro': 0.9997228210655991, 'eval_Poss_f1_micro': 0.9997228210655991, 'eval_Reflex_accuracy': 0.9998152140437326, 'eval_Reflex_precision_macro': 0.979089615566377, 'eval_Reflex_recall_macro': 0.9106988735941944, 'eval_Reflex_f1_macro': 0.9422614587976442, 'eval_Reflex_precision_micro': 0.9998152140437326, 'eval_Reflex_recall_micro': 0.9998152140437326, 'eval_Reflex_f1_micro': 0.9998152140437326, 'eval_Tense_accuracy': 0.9958115183246073, 'eval_Tense_precision_macro': 0.9821328244108822, 'eval_Tense_recall_macro': 0.9872298006923553, 'eval_Tense_f1_macro': 0.9846621818126516, 'eval_Tense_precision_micro': 0.9958115183246073, 'eval_Tense_recall_micro': 0.9958115183246073, 'eval_Tense_f1_micro': 0.9958115183246073, 'eval_VerbForm_accuracy': 0.992085001539883, 'eval_VerbForm_precision_macro': 0.9535949257358742, 'eval_VerbForm_recall_macro': 0.9550721035934254, 'eval_VerbForm_f1_macro': 0.954040759487874, 'eval_VerbForm_precision_micro': 0.992085001539883, 'eval_VerbForm_recall_micro': 0.992085001539883, 'eval_VerbForm_f1_micro': 0.992085001539883, 'eval_runtime': 184.587, 'eval_samples_per_second': 12.964, 'eval_steps_per_second': 6.485, 'epoch': 9.92}
|
| 335 |
+
{'loss': 2.704, 'grad_norm': 14.411617279052734, 'learning_rate': 7.070707070707071e-06, 'epoch': 10.82}
|
| 336 |
+
{'eval_loss': 0.3111107051372528, 'eval_f1_macro': 0.945062370330903, 'eval_xpos_accuracy': 0.9711733908222975, 'eval_xpos_precision_macro': 0.9122484129141236, 'eval_xpos_recall_macro': 0.8851900780053562, 'eval_xpos_f1_macro': 0.8914493507688107, 'eval_xpos_precision_micro': 0.9711733908222975, 'eval_xpos_recall_micro': 0.9711733908222975, 'eval_xpos_f1_micro': 0.9711733908222975, 'eval_deprel_accuracy': 0.93935940868494, 'eval_deprel_precision_macro': 0.8704809074097003, 'eval_deprel_recall_macro': 0.8304267658909016, 'eval_deprel_f1_macro': 0.837070039392518, 'eval_deprel_precision_micro': 0.93935940868494, 'eval_deprel_recall_micro': 0.93935940868494, 'eval_deprel_f1_micro': 0.93935940868494, 'eval_pos_accuracy': 0.9724668925161688, 'eval_pos_precision_macro': 0.9629390180800328, 'eval_pos_recall_macro': 0.9401887210539729, 'eval_pos_f1_macro': 0.9502075612761083, 'eval_pos_precision_micro': 0.9724668925161688, 'eval_pos_recall_micro': 0.9724668925161688, 'eval_pos_f1_micro': 0.9724668925161688, 'eval_Case_accuracy': 0.998644902987373, 'eval_Case_precision_macro': 0.9709067857297552, 'eval_Case_recall_macro': 0.9801038574675401, 'eval_Case_f1_macro': 0.9753383794953735, 'eval_Case_precision_micro': 0.998644902987373, 'eval_Case_recall_micro': 0.998644902987373, 'eval_Case_f1_micro': 0.998644902987373, 'eval_Definite_accuracy': 0.9999692023406221, 'eval_Definite_precision_macro': 0.9997829861111112, 'eval_Definite_recall_macro': 0.9999889796233236, 'eval_Definite_f1_macro': 0.9998859474433567, 'eval_Definite_precision_micro': 0.9999692023406221, 'eval_Definite_recall_micro': 0.9999692023406221, 'eval_Definite_f1_micro': 0.9999692023406221, 'eval_Degree_accuracy': 0.9916846319679704, 'eval_Degree_precision_macro': 0.9528721696269224, 'eval_Degree_recall_macro': 0.9717370585146055, 'eval_Degree_f1_macro': 0.9620534219072117, 'eval_Degree_precision_micro': 0.9916846319679704, 'eval_Degree_recall_micro': 0.9916846319679704, 'eval_Degree_f1_micro': 0.9916846319679704, 'eval_Foreign_accuracy': 0.9995072374499538, 'eval_Foreign_precision_macro': 0.9164510033479163, 'eval_Foreign_recall_macro': 0.7083025128932174, 'eval_Foreign_f1_macro': 0.7776545188106879, 'eval_Foreign_precision_micro': 0.9995072374499538, 'eval_Foreign_recall_micro': 0.9995072374499538, 'eval_Foreign_f1_micro': 0.9995072374499538, 'eval_Gender_accuracy': 1.0, 'eval_Gender_precision_macro': 1.0, 'eval_Gender_recall_macro': 1.0, 'eval_Gender_f1_macro': 1.0, 'eval_Gender_precision_micro': 1.0, 'eval_Gender_recall_micro': 1.0, 'eval_Gender_f1_micro': 1.0, 'eval_Mood_accuracy': 0.996427471512165, 'eval_Mood_precision_macro': 0.9339227016402227, 'eval_Mood_recall_macro': 0.9620515302224729, 'eval_Mood_f1_macro': 0.9471461378443453, 'eval_Mood_precision_micro': 0.996427471512165, 'eval_Mood_recall_micro': 0.996427471512165, 'eval_Mood_f1_micro': 0.996427471512165, 'eval_NumType_accuracy': 0.9988604866030182, 'eval_NumType_precision_macro': 0.9400369110855837, 'eval_NumType_recall_macro': 0.8579481546296598, 'eval_NumType_f1_macro': 0.8862043981520569, 'eval_NumType_precision_micro': 0.9988604866030182, 'eval_NumType_recall_micro': 0.9988604866030182, 'eval_NumType_f1_micro': 0.9988604866030182, 'eval_Number_accuracy': 0.9899907607021866, 'eval_Number_precision_macro': 0.9862706884769228, 'eval_Number_recall_macro': 0.987075550671718, 'eval_Number_f1_macro': 0.986672539876313, 'eval_Number_precision_micro': 0.9899907607021866, 'eval_Number_recall_micro': 0.9899907607021866, 'eval_Number_f1_micro': 0.9899907607021866, 'eval_Person_accuracy': 0.9993224514936865, 'eval_Person_precision_macro': 0.9967668612833189, 'eval_Person_recall_macro': 0.9950734406651991, 'eval_Person_f1_macro': 0.995914593855971, 'eval_Person_precision_micro': 0.9993224514936865, 'eval_Person_recall_micro': 0.9993224514936865, 'eval_Person_f1_micro': 0.9993224514936865, 'eval_Polarity_accuracy': 0.9997844163843548, 'eval_Polarity_precision_macro': 0.913072107124339, 'eval_Polarity_recall_macro': 0.9981362268909134, 'eval_Polarity_f1_macro': 0.9496493818614056, 'eval_Polarity_precision_micro': 0.9997844163843548, 'eval_Polarity_recall_micro': 0.9997844163843548, 'eval_Polarity_f1_micro': 0.9997844163843548, 'eval_PronType_accuracy': 0.9982137357560825, 'eval_PronType_precision_macro': 0.970957099174111, 'eval_PronType_recall_macro': 0.9810634865665578, 'eval_PronType_f1_macro': 0.9755398747276506, 'eval_PronType_precision_micro': 0.9982137357560825, 'eval_PronType_recall_micro': 0.9982137357560825, 'eval_PronType_f1_micro': 0.9982137357560825, 'eval_Poss_accuracy': 0.9997228210655991, 'eval_Poss_precision_macro': 0.9935291465247402, 'eval_Poss_recall_macro': 0.9966735089541401, 'eval_Poss_f1_macro': 0.9950961850339957, 'eval_Poss_precision_micro': 0.9997228210655991, 'eval_Poss_recall_micro': 0.9997228210655991, 'eval_Poss_f1_micro': 0.9997228210655991, 'eval_Reflex_accuracy': 0.9998152140437326, 'eval_Reflex_precision_macro': 0.9999075443786982, 'eval_Reflex_recall_macro': 0.8928571428571428, 'eval_Reflex_f1_macro': 0.939953767914933, 'eval_Reflex_precision_micro': 0.9998152140437326, 'eval_Reflex_recall_micro': 0.9998152140437326, 'eval_Reflex_f1_micro': 0.9998152140437326, 'eval_Tense_accuracy': 0.9959655066214967, 'eval_Tense_precision_macro': 0.9828320188961738, 'eval_Tense_recall_macro': 0.9876736057787818, 'eval_Tense_f1_macro': 0.9852306646170327, 'eval_Tense_precision_micro': 0.9959655066214967, 'eval_Tense_recall_micro': 0.9959655066214967, 'eval_Tense_f1_micro': 0.9959655066214967, 'eval_VerbForm_accuracy': 0.9925161687711734, 'eval_VerbForm_precision_macro': 0.9569520250976588, 'eval_VerbForm_recall_macro': 0.955661245035097, 'eval_VerbForm_f1_macro': 0.9560559029784838, 'eval_VerbForm_precision_micro': 0.9925161687711734, 'eval_VerbForm_recall_micro': 0.9925161687711734, 'eval_VerbForm_f1_micro': 0.9925161687711734, 'eval_runtime': 184.3136, 'eval_samples_per_second': 12.983, 'eval_steps_per_second': 6.494, 'epoch': 10.82}
|
| 337 |
+
{'loss': 2.5336, 'grad_norm': 15.71062183380127, 'learning_rate': 5.808080808080808e-06, 'epoch': 11.72}
|
| 338 |
+
{'eval_loss': 0.31213679909706116, 'eval_f1_macro': 0.9450034781954363, 'eval_xpos_accuracy': 0.971327379119187, 'eval_xpos_precision_macro': 0.9040737990501917, 'eval_xpos_recall_macro': 0.8878791748486564, 'eval_xpos_f1_macro': 0.8915088206489913, 'eval_xpos_precision_micro': 0.971327379119187, 'eval_xpos_recall_micro': 0.971327379119187, 'eval_xpos_f1_micro': 0.971327379119187, 'eval_deprel_accuracy': 0.9391746227286726, 'eval_deprel_precision_macro': 0.875233469427972, 'eval_deprel_recall_macro': 0.8334939460324564, 'eval_deprel_f1_macro': 0.8411592808809429, 'eval_deprel_precision_micro': 0.9391746227286726, 'eval_deprel_recall_micro': 0.9391746227286726, 'eval_deprel_f1_micro': 0.9391746227286726, 'eval_pos_accuracy': 0.9720357252848784, 'eval_pos_precision_macro': 0.9589791650677912, 'eval_pos_recall_macro': 0.9425125827391407, 'eval_pos_f1_macro': 0.9500365818433866, 'eval_pos_precision_micro': 0.9720357252848784, 'eval_pos_recall_micro': 0.9720357252848784, 'eval_pos_f1_micro': 0.9720357252848784, 'eval_Case_accuracy': 0.9987372959655066, 'eval_Case_precision_macro': 0.9720786137937272, 'eval_Case_recall_macro': 0.9806610878073844, 'eval_Case_f1_macro': 0.9762236132182674, 'eval_Case_precision_micro': 0.9987372959655066, 'eval_Case_recall_micro': 0.9987372959655066, 'eval_Case_f1_micro': 0.9987372959655066, 'eval_Definite_accuracy': 1.0, 'eval_Definite_precision_macro': 1.0, 'eval_Definite_recall_macro': 1.0, 'eval_Definite_f1_macro': 1.0, 'eval_Definite_precision_micro': 1.0, 'eval_Definite_recall_micro': 1.0, 'eval_Definite_f1_micro': 1.0, 'eval_Degree_accuracy': 0.9914690483523252, 'eval_Degree_precision_macro': 0.9492829666546161, 'eval_Degree_recall_macro': 0.9753682956364341, 'eval_Degree_f1_macro': 0.9618686358893136, 'eval_Degree_precision_micro': 0.9914690483523252, 'eval_Degree_recall_micro': 0.9914690483523252, 'eval_Degree_f1_micro': 0.9914690483523252, 'eval_Foreign_accuracy': 0.9994764397905759, 'eval_Foreign_precision_macro': 0.8843997146520486, 'eval_Foreign_recall_macro': 0.7082871026731595, 'eval_Foreign_f1_macro': 0.7701393055999161, 'eval_Foreign_precision_micro': 0.9994764397905759, 'eval_Foreign_recall_micro': 0.9994764397905759, 'eval_Foreign_f1_micro': 0.9994764397905759, 'eval_Gender_accuracy': 1.0, 'eval_Gender_precision_macro': 1.0, 'eval_Gender_recall_macro': 1.0, 'eval_Gender_f1_macro': 1.0, 'eval_Gender_precision_micro': 1.0, 'eval_Gender_recall_micro': 1.0, 'eval_Gender_f1_micro': 1.0, 'eval_Mood_accuracy': 0.9964890668309209, 'eval_Mood_precision_macro': 0.9442516826655155, 'eval_Mood_recall_macro': 0.9562084678934228, 'eval_Mood_f1_macro': 0.9500486933757504, 'eval_Mood_precision_micro': 0.9964890668309209, 'eval_Mood_recall_micro': 0.9964890668309209, 'eval_Mood_f1_micro': 0.9964890668309209, 'eval_NumType_accuracy': 0.998891284262396, 'eval_NumType_precision_macro': 0.9409634130492703, 'eval_NumType_recall_macro': 0.8574755404850054, 'eval_NumType_f1_macro': 0.8864375692048152, 'eval_NumType_precision_micro': 0.998891284262396, 'eval_NumType_recall_micro': 0.998891284262396, 'eval_NumType_f1_micro': 0.998891284262396, 'eval_Number_accuracy': 0.9899907607021866, 'eval_Number_precision_macro': 0.9866747376177036, 'eval_Number_recall_macro': 0.9860314769428586, 'eval_Number_f1_macro': 0.9863505807408269, 'eval_Number_precision_micro': 0.9899907607021866, 'eval_Number_recall_micro': 0.9899907607021866, 'eval_Number_f1_micro': 0.9899907607021866, 'eval_Person_accuracy': 0.9992608561749307, 'eval_Person_precision_macro': 0.9963006318894395, 'eval_Person_recall_macro': 0.9949232456046831, 'eval_Person_f1_macro': 0.9956060632395384, 'eval_Person_precision_micro': 0.9992608561749307, 'eval_Person_recall_micro': 0.9992608561749307, 'eval_Person_f1_micro': 0.9992608561749307, 'eval_Polarity_accuracy': 0.9997844163843548, 'eval_Polarity_precision_macro': 0.913072107124339, 'eval_Polarity_recall_macro': 0.9981362268909134, 'eval_Polarity_f1_macro': 0.9496493818614056, 'eval_Polarity_precision_micro': 0.9997844163843548, 'eval_Polarity_recall_micro': 0.9997844163843548, 'eval_Polarity_f1_micro': 0.9997844163843548, 'eval_PronType_accuracy': 0.9982445334154604, 'eval_PronType_precision_macro': 0.9709855764512391, 'eval_PronType_recall_macro': 0.979728464672861, 'eval_PronType_f1_macro': 0.9751081232357731, 'eval_PronType_precision_micro': 0.9982445334154604, 'eval_PronType_recall_micro': 0.9982445334154604, 'eval_PronType_f1_micro': 0.9982445334154604, 'eval_Poss_accuracy': 0.9997228210655991, 'eval_Poss_precision_macro': 0.9935291465247402, 'eval_Poss_recall_macro': 0.9966735089541401, 'eval_Poss_f1_macro': 0.9950961850339957, 'eval_Poss_precision_micro': 0.9997228210655991, 'eval_Poss_recall_micro': 0.9997228210655991, 'eval_Poss_f1_micro': 0.9997228210655991, 'eval_Reflex_accuracy': 0.9998152140437326, 'eval_Reflex_precision_macro': 0.9999075443786982, 'eval_Reflex_recall_macro': 0.8928571428571428, 'eval_Reflex_f1_macro': 0.939953767914933, 'eval_Reflex_precision_micro': 0.9998152140437326, 'eval_Reflex_recall_micro': 0.9998152140437326, 'eval_Reflex_f1_micro': 0.9998152140437326, 'eval_Tense_accuracy': 0.9957499230058515, 'eval_Tense_precision_macro': 0.9819261355594371, 'eval_Tense_recall_macro': 0.9872070987013908, 'eval_Tense_f1_macro': 0.9845459565705231, 'eval_Tense_precision_micro': 0.9957499230058515, 'eval_Tense_recall_micro': 0.9957499230058515, 'eval_Tense_f1_micro': 0.9957499230058515, 'eval_VerbForm_accuracy': 0.9925161687711734, 'eval_VerbForm_precision_macro': 0.9593641734138385, 'eval_VerbForm_recall_macro': 0.9541936910184079, 'eval_VerbForm_f1_macro': 0.9563300482594694, 'eval_VerbForm_precision_micro': 0.9925161687711734, 'eval_VerbForm_recall_micro': 0.9925161687711734, 'eval_VerbForm_f1_micro': 0.9925161687711734, 'eval_runtime': 184.7242, 'eval_samples_per_second': 12.954, 'eval_steps_per_second': 6.48, 'epoch': 11.72}
|
| 339 |
+
{'loss': 2.4001, 'grad_norm': 13.36937141418457, 'learning_rate': 4.5454545454545455e-06, 'epoch': 12.62}
|
| 340 |
+
{'eval_loss': 0.30931687355041504, 'eval_f1_macro': 0.944792147604097, 'eval_xpos_accuracy': 0.971881736987989, 'eval_xpos_precision_macro': 0.9106803400654592, 'eval_xpos_recall_macro': 0.8876967675343638, 'eval_xpos_f1_macro': 0.8927378840468673, 'eval_xpos_precision_micro': 0.971881736987989, 'eval_xpos_recall_micro': 0.971881736987989, 'eval_xpos_f1_micro': 0.971881736987989, 'eval_deprel_accuracy': 0.9403449337850324, 'eval_deprel_precision_macro': 0.862303095193583, 'eval_deprel_recall_macro': 0.833881493123765, 'eval_deprel_f1_macro': 0.8408848510031106, 'eval_deprel_precision_micro': 0.9403449337850324, 'eval_deprel_recall_micro': 0.9403449337850324, 'eval_deprel_f1_micro': 0.9403449337850324, 'eval_pos_accuracy': 0.9725592854943025, 'eval_pos_precision_macro': 0.9592502902097619, 'eval_pos_recall_macro': 0.9440721265675522, 'eval_pos_f1_macro': 0.9511015916726798, 'eval_pos_precision_micro': 0.9725592854943025, 'eval_pos_recall_micro': 0.9725592854943025, 'eval_pos_f1_micro': 0.9725592854943025, 'eval_Case_accuracy': 0.9986757006467508, 'eval_Case_precision_macro': 0.9701302415450517, 'eval_Case_recall_macro': 0.9813613241344653, 'eval_Case_f1_macro': 0.9755388584672033, 'eval_Case_precision_micro': 0.9986757006467508, 'eval_Case_recall_micro': 0.9986757006467508, 'eval_Case_f1_micro': 0.9986757006467508, 'eval_Definite_accuracy': 1.0, 'eval_Definite_precision_macro': 1.0, 'eval_Definite_recall_macro': 1.0, 'eval_Definite_f1_macro': 1.0, 'eval_Definite_precision_micro': 1.0, 'eval_Definite_recall_micro': 1.0, 'eval_Definite_f1_micro': 1.0, 'eval_Degree_accuracy': 0.9917154296273483, 'eval_Degree_precision_macro': 0.9503228246017758, 'eval_Degree_recall_macro': 0.9751320645674009, 'eval_Degree_f1_macro': 0.9622910706448158, 'eval_Degree_precision_micro': 0.9917154296273483, 'eval_Degree_recall_micro': 0.9917154296273483, 'eval_Degree_f1_micro': 0.9917154296273483, 'eval_Foreign_accuracy': 0.999445642131198, 'eval_Foreign_precision_macro': 0.8569271805345259, 'eval_Foreign_recall_macro': 0.7082716924531016, 'eval_Foreign_f1_macro': 0.763019224125767, 'eval_Foreign_precision_micro': 0.999445642131198, 'eval_Foreign_recall_micro': 0.999445642131198, 'eval_Foreign_f1_micro': 0.999445642131198, 'eval_Gender_accuracy': 1.0, 'eval_Gender_precision_macro': 1.0, 'eval_Gender_recall_macro': 1.0, 'eval_Gender_f1_macro': 1.0, 'eval_Gender_precision_micro': 1.0, 'eval_Gender_recall_micro': 1.0, 'eval_Gender_f1_micro': 1.0, 'eval_Mood_accuracy': 0.9963042808746535, 'eval_Mood_precision_macro': 0.9361230722773487, 'eval_Mood_recall_macro': 0.9574126488533333, 'eval_Mood_f1_macro': 0.9462450765759293, 'eval_Mood_precision_micro': 0.9963042808746535, 'eval_Mood_recall_micro': 0.9963042808746535, 'eval_Mood_f1_micro': 0.9963042808746535, 'eval_NumType_accuracy': 0.9987988912842624, 'eval_NumType_precision_macro': 0.9395464503317013, 'eval_NumType_recall_macro': 0.857452039826987, 'eval_NumType_f1_macro': 0.8857111268469823, 'eval_NumType_precision_micro': 0.9987988912842624, 'eval_NumType_recall_micro': 0.9987988912842624, 'eval_NumType_f1_micro': 0.9987988912842624, 'eval_Number_accuracy': 0.9903911302740992, 'eval_Number_precision_macro': 0.9870709669229929, 'eval_Number_recall_macro': 0.987783237364828, 'eval_Number_f1_macro': 0.9874261970584594, 'eval_Number_precision_micro': 0.9903911302740992, 'eval_Number_recall_micro': 0.9903911302740992, 'eval_Number_f1_micro': 0.9903911302740992, 'eval_Person_accuracy': 0.9992916538343086, 'eval_Person_precision_macro': 0.9965754915220305, 'eval_Person_recall_macro': 0.9951172190840711, 'eval_Person_f1_macro': 0.9958400087751886, 'eval_Person_precision_micro': 0.9992916538343086, 'eval_Person_recall_micro': 0.9992916538343086, 'eval_Person_f1_micro': 0.9992916538343086, 'eval_Polarity_accuracy': 0.9998152140437326, 'eval_Polarity_precision_macro': 0.9297387741111319, 'eval_Polarity_recall_macro': 0.9981465554421276, 'eval_Polarity_f1_macro': 0.9602365575992228, 'eval_Polarity_precision_micro': 0.9998152140437326, 'eval_Polarity_recall_micro': 0.9998152140437326, 'eval_Polarity_f1_micro': 0.9998152140437326, 'eval_PronType_accuracy': 0.9983061287342162, 'eval_PronType_precision_macro': 0.9726759514620704, 'eval_PronType_recall_macro': 0.9820091060789936, 'eval_PronType_f1_macro': 0.9770522823736755, 'eval_PronType_precision_micro': 0.9983061287342162, 'eval_PronType_recall_micro': 0.9983061287342162, 'eval_PronType_f1_micro': 0.9983061287342162, 'eval_Poss_accuracy': 0.9997844163843548, 'eval_Poss_precision_macro': 0.9956520570542573, 'eval_Poss_recall_macro': 0.9967047530958635, 'eval_Poss_f1_macro': 0.9961778299709958, 'eval_Poss_precision_micro': 0.9997844163843548, 'eval_Poss_recall_micro': 0.9997844163843548, 'eval_Poss_f1_micro': 0.9997844163843548, 'eval_Reflex_accuracy': 0.9997844163843548, 'eval_Reflex_precision_macro': 0.9781684110944805, 'eval_Reflex_recall_macro': 0.8928417307370515, 'eval_Reflex_f1_macro': 0.9313186107558036, 'eval_Reflex_precision_micro': 0.9997844163843548, 'eval_Reflex_recall_micro': 0.9997844163843548, 'eval_Reflex_f1_micro': 0.9997844163843548, 'eval_Tense_accuracy': 0.9958115183246073, 'eval_Tense_precision_macro': 0.9833489858871277, 'eval_Tense_recall_macro': 0.9861581422190785, 'eval_Tense_f1_macro': 0.9847336856075598, 'eval_Tense_precision_micro': 0.9958115183246073, 'eval_Tense_recall_micro': 0.9958115183246073, 'eval_Tense_f1_micro': 0.9958115183246073, 'eval_VerbForm_accuracy': 0.9925469664305513, 'eval_VerbForm_precision_macro': 0.959243695845467, 'eval_VerbForm_recall_macro': 0.9532997264226406, 'eval_VerbForm_f1_macro': 0.9559438013494864, 'eval_VerbForm_precision_micro': 0.9925469664305513, 'eval_VerbForm_recall_micro': 0.9925469664305513, 'eval_VerbForm_f1_micro': 0.9925469664305513, 'eval_runtime': 184.1981, 'eval_samples_per_second': 12.991, 'eval_steps_per_second': 6.498, 'epoch': 12.62}
|
| 341 |
+
```
|
models/ud_ewt_gum_pud_20250611/added_tokens.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"[MASK]": 128000
|
| 3 |
+
}
|
models/ud_ewt_gum_pud_20250611/config.json
ADDED
|
@@ -0,0 +1,254 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_name_or_path": "microsoft/deberta-v3-base",
|
| 3 |
+
"architectures": [
|
| 4 |
+
"MultiHeadModel"
|
| 5 |
+
],
|
| 6 |
+
"attention_probs_dropout_prob": 0.1,
|
| 7 |
+
"hidden_act": "gelu",
|
| 8 |
+
"hidden_dropout_prob": 0.1,
|
| 9 |
+
"hidden_size": 768,
|
| 10 |
+
"initializer_range": 0.02,
|
| 11 |
+
"intermediate_size": 3072,
|
| 12 |
+
"label_maps": {
|
| 13 |
+
"Case": [
|
| 14 |
+
"Nom",
|
| 15 |
+
"Acc",
|
| 16 |
+
"X"
|
| 17 |
+
],
|
| 18 |
+
"Definite": [
|
| 19 |
+
"Ind",
|
| 20 |
+
"Def",
|
| 21 |
+
"X"
|
| 22 |
+
],
|
| 23 |
+
"Degree": [
|
| 24 |
+
"Sup",
|
| 25 |
+
"Cmp",
|
| 26 |
+
"Pos",
|
| 27 |
+
"X"
|
| 28 |
+
],
|
| 29 |
+
"Foreign": [
|
| 30 |
+
"Yes",
|
| 31 |
+
"X"
|
| 32 |
+
],
|
| 33 |
+
"Gender": [
|
| 34 |
+
"Masc",
|
| 35 |
+
"Neut",
|
| 36 |
+
"Fem",
|
| 37 |
+
"X"
|
| 38 |
+
],
|
| 39 |
+
"Mood": [
|
| 40 |
+
"Ind",
|
| 41 |
+
"Imp",
|
| 42 |
+
"X"
|
| 43 |
+
],
|
| 44 |
+
"NumType": [
|
| 45 |
+
"Mult",
|
| 46 |
+
"Card",
|
| 47 |
+
"Ord",
|
| 48 |
+
"X"
|
| 49 |
+
],
|
| 50 |
+
"Number": [
|
| 51 |
+
"Plur",
|
| 52 |
+
"Sing",
|
| 53 |
+
"X"
|
| 54 |
+
],
|
| 55 |
+
"Person": [
|
| 56 |
+
"2",
|
| 57 |
+
"1",
|
| 58 |
+
"3",
|
| 59 |
+
"X"
|
| 60 |
+
],
|
| 61 |
+
"Polarity": [
|
| 62 |
+
"Neg",
|
| 63 |
+
"Pos",
|
| 64 |
+
"X"
|
| 65 |
+
],
|
| 66 |
+
"Poss": [
|
| 67 |
+
"Yes",
|
| 68 |
+
"X"
|
| 69 |
+
],
|
| 70 |
+
"PronType": [
|
| 71 |
+
"Rel",
|
| 72 |
+
"Art",
|
| 73 |
+
"Prs",
|
| 74 |
+
"Dem",
|
| 75 |
+
"Neg",
|
| 76 |
+
"Int",
|
| 77 |
+
"X"
|
| 78 |
+
],
|
| 79 |
+
"Reflex": [
|
| 80 |
+
"Yes",
|
| 81 |
+
"X"
|
| 82 |
+
],
|
| 83 |
+
"Tense": [
|
| 84 |
+
"Past",
|
| 85 |
+
"Pres",
|
| 86 |
+
"X"
|
| 87 |
+
],
|
| 88 |
+
"VerbForm": [
|
| 89 |
+
"Part",
|
| 90 |
+
"Fin",
|
| 91 |
+
"Inf",
|
| 92 |
+
"Ger",
|
| 93 |
+
"X"
|
| 94 |
+
],
|
| 95 |
+
"deprel": [
|
| 96 |
+
"nmod:tmod",
|
| 97 |
+
"advcl",
|
| 98 |
+
"list",
|
| 99 |
+
"advmod",
|
| 100 |
+
"discourse",
|
| 101 |
+
"root",
|
| 102 |
+
"xcomp",
|
| 103 |
+
"det",
|
| 104 |
+
"obj",
|
| 105 |
+
"obl:tmod",
|
| 106 |
+
"nummod",
|
| 107 |
+
"appos",
|
| 108 |
+
"aux",
|
| 109 |
+
"expl",
|
| 110 |
+
"mark",
|
| 111 |
+
"iobj",
|
| 112 |
+
"obl:npmod",
|
| 113 |
+
"conj",
|
| 114 |
+
"compound:prt",
|
| 115 |
+
"det:predet",
|
| 116 |
+
"cc",
|
| 117 |
+
"nmod:npmod",
|
| 118 |
+
"parataxis",
|
| 119 |
+
"acl:relcl",
|
| 120 |
+
"csubj:pass",
|
| 121 |
+
"nsubj:pass",
|
| 122 |
+
"ccomp",
|
| 123 |
+
"obl",
|
| 124 |
+
"fixed",
|
| 125 |
+
"amod",
|
| 126 |
+
"aux:pass",
|
| 127 |
+
"nmod:poss",
|
| 128 |
+
"acl",
|
| 129 |
+
"vocative",
|
| 130 |
+
"cc:preconj",
|
| 131 |
+
"punct",
|
| 132 |
+
"cop",
|
| 133 |
+
"case",
|
| 134 |
+
"compound",
|
| 135 |
+
"csubj",
|
| 136 |
+
"nsubj",
|
| 137 |
+
"nmod",
|
| 138 |
+
"flat"
|
| 139 |
+
],
|
| 140 |
+
"pos": [
|
| 141 |
+
"ADV",
|
| 142 |
+
"INTJ",
|
| 143 |
+
"SCONJ",
|
| 144 |
+
"VERB",
|
| 145 |
+
"PART",
|
| 146 |
+
"SYM",
|
| 147 |
+
"PRON",
|
| 148 |
+
"AUX",
|
| 149 |
+
"PROPN",
|
| 150 |
+
"ADP",
|
| 151 |
+
"CCONJ",
|
| 152 |
+
"PUNCT",
|
| 153 |
+
"NOUN",
|
| 154 |
+
"DET",
|
| 155 |
+
"NUM",
|
| 156 |
+
"ADJ",
|
| 157 |
+
"X"
|
| 158 |
+
],
|
| 159 |
+
"xpos": [
|
| 160 |
+
"CD",
|
| 161 |
+
"''",
|
| 162 |
+
",",
|
| 163 |
+
"PDT",
|
| 164 |
+
"WDT",
|
| 165 |
+
"VBD",
|
| 166 |
+
"VBP",
|
| 167 |
+
"WP$",
|
| 168 |
+
"MD",
|
| 169 |
+
"RB",
|
| 170 |
+
"VB",
|
| 171 |
+
"PRP",
|
| 172 |
+
"HYPH",
|
| 173 |
+
"``",
|
| 174 |
+
"ADD",
|
| 175 |
+
"PRP$",
|
| 176 |
+
"NNPS",
|
| 177 |
+
"SYM",
|
| 178 |
+
"POS",
|
| 179 |
+
"AFX",
|
| 180 |
+
"JJS",
|
| 181 |
+
"NNS",
|
| 182 |
+
"$",
|
| 183 |
+
"JJR",
|
| 184 |
+
"RBS",
|
| 185 |
+
"UH",
|
| 186 |
+
"VBN",
|
| 187 |
+
"FW",
|
| 188 |
+
"-LRB-",
|
| 189 |
+
".",
|
| 190 |
+
"JJ",
|
| 191 |
+
"IN",
|
| 192 |
+
"RP",
|
| 193 |
+
"TO",
|
| 194 |
+
"EX",
|
| 195 |
+
"VBG",
|
| 196 |
+
"NNP",
|
| 197 |
+
"VBZ",
|
| 198 |
+
"RBR",
|
| 199 |
+
"NN",
|
| 200 |
+
"DT",
|
| 201 |
+
"LS",
|
| 202 |
+
"WP",
|
| 203 |
+
"CC",
|
| 204 |
+
"WRB",
|
| 205 |
+
":",
|
| 206 |
+
"-RRB-",
|
| 207 |
+
"NFP"
|
| 208 |
+
]
|
| 209 |
+
},
|
| 210 |
+
"layer_norm_eps": 1e-07,
|
| 211 |
+
"legacy": true,
|
| 212 |
+
"max_position_embeddings": 512,
|
| 213 |
+
"max_relative_positions": -1,
|
| 214 |
+
"model_type": "deberta-v2",
|
| 215 |
+
"norm_rel_ebd": "layer_norm",
|
| 216 |
+
"num_attention_heads": 12,
|
| 217 |
+
"num_hidden_layers": 12,
|
| 218 |
+
"num_labels_dict": {
|
| 219 |
+
"Case": 3,
|
| 220 |
+
"Definite": 3,
|
| 221 |
+
"Degree": 4,
|
| 222 |
+
"Foreign": 2,
|
| 223 |
+
"Gender": 4,
|
| 224 |
+
"Mood": 3,
|
| 225 |
+
"NumType": 4,
|
| 226 |
+
"Number": 3,
|
| 227 |
+
"Person": 4,
|
| 228 |
+
"Polarity": 3,
|
| 229 |
+
"Poss": 2,
|
| 230 |
+
"PronType": 7,
|
| 231 |
+
"Reflex": 2,
|
| 232 |
+
"Tense": 3,
|
| 233 |
+
"VerbForm": 5,
|
| 234 |
+
"deprel": 43,
|
| 235 |
+
"pos": 17,
|
| 236 |
+
"xpos": 48
|
| 237 |
+
},
|
| 238 |
+
"pad_token_id": 0,
|
| 239 |
+
"pooler_dropout": 0,
|
| 240 |
+
"pooler_hidden_act": "gelu",
|
| 241 |
+
"pooler_hidden_size": 768,
|
| 242 |
+
"pos_att_type": [
|
| 243 |
+
"p2c",
|
| 244 |
+
"c2p"
|
| 245 |
+
],
|
| 246 |
+
"position_biased_input": false,
|
| 247 |
+
"position_buckets": 256,
|
| 248 |
+
"relative_attention": true,
|
| 249 |
+
"share_att_key": true,
|
| 250 |
+
"torch_dtype": "float32",
|
| 251 |
+
"transformers_version": "4.49.0",
|
| 252 |
+
"type_vocab_size": 0,
|
| 253 |
+
"vocab_size": 128100
|
| 254 |
+
}
|
models/ud_ewt_gum_pud_20250611/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae23188a45d023577d6842d09e7aeb9d26b9ef5ddeab939103bb0019f8acd614
|
| 3 |
+
size 778372024
|
models/ud_ewt_gum_pud_20250611/special_tokens_map.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": "[CLS]",
|
| 3 |
+
"cls_token": "[CLS]",
|
| 4 |
+
"eos_token": "[SEP]",
|
| 5 |
+
"mask_token": "[MASK]",
|
| 6 |
+
"pad_token": "[PAD]",
|
| 7 |
+
"sep_token": "[SEP]",
|
| 8 |
+
"unk_token": {
|
| 9 |
+
"content": "[UNK]",
|
| 10 |
+
"lstrip": false,
|
| 11 |
+
"normalized": true,
|
| 12 |
+
"rstrip": false,
|
| 13 |
+
"single_word": false
|
| 14 |
+
}
|
| 15 |
+
}
|
models/ud_ewt_gum_pud_20250611/spm.model
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
|
| 3 |
+
size 2464616
|
models/ud_ewt_gum_pud_20250611/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
models/ud_ewt_gum_pud_20250611/tokenizer_config.json
ADDED
|
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_prefix_space": true,
|
| 3 |
+
"added_tokens_decoder": {
|
| 4 |
+
"0": {
|
| 5 |
+
"content": "[PAD]",
|
| 6 |
+
"lstrip": false,
|
| 7 |
+
"normalized": false,
|
| 8 |
+
"rstrip": false,
|
| 9 |
+
"single_word": false,
|
| 10 |
+
"special": true
|
| 11 |
+
},
|
| 12 |
+
"1": {
|
| 13 |
+
"content": "[CLS]",
|
| 14 |
+
"lstrip": false,
|
| 15 |
+
"normalized": false,
|
| 16 |
+
"rstrip": false,
|
| 17 |
+
"single_word": false,
|
| 18 |
+
"special": true
|
| 19 |
+
},
|
| 20 |
+
"2": {
|
| 21 |
+
"content": "[SEP]",
|
| 22 |
+
"lstrip": false,
|
| 23 |
+
"normalized": false,
|
| 24 |
+
"rstrip": false,
|
| 25 |
+
"single_word": false,
|
| 26 |
+
"special": true
|
| 27 |
+
},
|
| 28 |
+
"3": {
|
| 29 |
+
"content": "[UNK]",
|
| 30 |
+
"lstrip": false,
|
| 31 |
+
"normalized": true,
|
| 32 |
+
"rstrip": false,
|
| 33 |
+
"single_word": false,
|
| 34 |
+
"special": true
|
| 35 |
+
},
|
| 36 |
+
"128000": {
|
| 37 |
+
"content": "[MASK]",
|
| 38 |
+
"lstrip": false,
|
| 39 |
+
"normalized": false,
|
| 40 |
+
"rstrip": false,
|
| 41 |
+
"single_word": false,
|
| 42 |
+
"special": true
|
| 43 |
+
}
|
| 44 |
+
},
|
| 45 |
+
"bos_token": "[CLS]",
|
| 46 |
+
"clean_up_tokenization_spaces": false,
|
| 47 |
+
"cls_token": "[CLS]",
|
| 48 |
+
"do_lower_case": false,
|
| 49 |
+
"eos_token": "[SEP]",
|
| 50 |
+
"extra_special_tokens": {},
|
| 51 |
+
"mask_token": "[MASK]",
|
| 52 |
+
"model_max_length": 1000000000000000019884624838656,
|
| 53 |
+
"pad_token": "[PAD]",
|
| 54 |
+
"sep_token": "[SEP]",
|
| 55 |
+
"sp_model_kwargs": {},
|
| 56 |
+
"split_by_punct": false,
|
| 57 |
+
"tokenizer_class": "DebertaV2Tokenizer",
|
| 58 |
+
"unk_token": "[UNK]",
|
| 59 |
+
"vocab_type": "spm"
|
| 60 |
+
}
|
models/ud_ewt_gum_pud_20250611/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:828cf2eb1193c0bb76fa39060608f6f9f9358d1521c589fd17d08a0144a64027
|
| 3 |
+
size 5304
|