| /gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/.venv/lib/python3.12/site-packages/keras/src/models/functional.py:225: UserWarning: The structure of `inputs` doesn't match the expected structure: ['keras_tensor', 'keras_tensor_1', 'keras_tensor_2', 'keras_tensor_3', 'keras_tensor_4', 'keras_tensor_5']. Received: the structure of inputs=('*', '*', '*', '*', '*', '*') | |
| warnings.warn( | |
| { | |
| "batch_size": 16, | |
| "deprel": "full", | |
| "dev": [ | |
| "la_giuseppe/dev.conllu" | |
| ], | |
| "dropout": 0.5, | |
| "embed_tags": [], | |
| "epochs": 100, | |
| "epochs_frozen": 20, | |
| "exp": "all_three_100_epochs", | |
| "label_smoothing": 0.03, | |
| "learning_rate": 2e-05, | |
| "learning_rate_decay": "cos", | |
| "learning_rate_warmup": 2000, | |
| "load": [], | |
| "logdir": "logs/all_three_100_epochs-latinpipe_evalatin24-8201717-250407_140047-s2", | |
| "max_train_sentence_len": 150, | |
| "optimizer": "adam", | |
| "parse": 1, | |
| "parse_attention_dim": 512, | |
| "rnn_dim": 512, | |
| "rnn_layers": 2, | |
| "rnn_type": "LSTMTorch", | |
| "save_checkpoint": true, | |
| "script": "latinpipe_evalatin24.py", | |
| "seed": 2, | |
| "single_root": 1, | |
| "steps_per_epoch": 1000, | |
| "subword_combination": "first", | |
| "tags": [ | |
| 2, | |
| 1, | |
| 4 | |
| ], | |
| "task_hidden_layer": 2048, | |
| "test": [ | |
| "la_giuseppe/test.conllu" | |
| ], | |
| "threads": 4, | |
| "train": [ | |
| "la_giuseppe/train.conllu" | |
| ], | |
| "train_sampling_exponent": 0.5, | |
| "transformers": [ | |
| "bowphs/LaBerta", | |
| "bowphs/PhilBerta", | |
| "FacebookAI/xlm-roberta-large" | |
| ], | |
| "treebank_ids": false, | |
| "verbose": 2, | |
| "wandb": false, | |
| "word_masking": null | |
| } | |
| Trimmed 2 out of 5089 sentences | |
| Epoch 1/20 | |
| 319/319 - 50s - 158ms/step - dense_1_loss: 0.2477 - dense_3_loss: 0.9185 - dense_5_loss: 0.7275 - loss: 3.4780 - parsing_head_loss: 0.6817 - learning_rate: 1.0000e-03 - dev_UPOS: 93.9191 - dev_UFeats: 82.3443 - dev_Lemmas: 73.4568 - dev_UAS: 60.3320 - dev_LAS: 49.1975 | |
| Epoch 2/20 | |
| 319/319 - 47s - 147ms/step - dense_1_loss: 0.1904 - dense_3_loss: 0.6759 - dense_5_loss: 0.5141 - loss: 2.5663 - parsing_head_loss: 0.5140 - learning_rate: 1.0000e-03 - dev_UPOS: 94.6804 - dev_UFeats: 83.8577 - dev_Lemmas: 77.2998 - dev_UAS: 66.0552 - dev_LAS: 56.0304 | |
| Epoch 3/20 | |
| 319/319 - 47s - 147ms/step - dense_1_loss: 0.1783 - dense_3_loss: 0.6080 - dense_5_loss: 0.4744 - loss: 2.3521 - parsing_head_loss: 0.4798 - learning_rate: 1.0000e-03 - dev_UPOS: 95.2674 - dev_UFeats: 85.1876 - dev_Lemmas: 79.2993 - dev_UAS: 69.1920 - dev_LAS: 59.4607 | |
| Epoch 4/20 | |
| 319/319 - 47s - 148ms/step - dense_1_loss: 0.1717 - dense_3_loss: 0.5644 - dense_5_loss: 0.4464 - loss: 2.2021 - parsing_head_loss: 0.4540 - learning_rate: 1.0000e-03 - dev_UPOS: 95.0197 - dev_UFeats: 85.6370 - dev_Lemmas: 80.7209 - dev_UAS: 70.3476 - dev_LAS: 61.0382 | |
| Epoch 5/20 | |
| 319/319 - 47s - 149ms/step - dense_1_loss: 0.1690 - dense_3_loss: 0.5288 - dense_5_loss: 0.4247 - loss: 2.0944 - parsing_head_loss: 0.4340 - learning_rate: 1.0000e-03 - dev_UPOS: 94.8088 - dev_UFeats: 86.0772 - dev_Lemmas: 81.4455 - dev_UAS: 71.7784 - dev_LAS: 62.4415 | |
| Epoch 6/20 | |
| 319/319 - 47s - 148ms/step - dense_1_loss: 0.1705 - dense_3_loss: 0.5209 - dense_5_loss: 0.4314 - loss: 2.0831 - parsing_head_loss: 0.4325 - learning_rate: 1.0000e-03 - dev_UPOS: 95.4600 - dev_UFeats: 85.8571 - dev_Lemmas: 81.7940 - dev_UAS: 73.0808 - dev_LAS: 64.3034 | |
| Epoch 7/20 | |
| 319/319 - 47s - 147ms/step - dense_1_loss: 0.1616 - dense_3_loss: 0.4974 - dense_5_loss: 0.4151 - loss: 1.9977 - parsing_head_loss: 0.4142 - learning_rate: 1.0000e-03 - dev_UPOS: 95.5242 - dev_UFeats: 86.4533 - dev_Lemmas: 82.2801 - dev_UAS: 74.3282 - dev_LAS: 65.0738 | |
| Epoch 8/20 | |
| 319/319 - 47s - 148ms/step - dense_1_loss: 0.1619 - dense_3_loss: 0.4869 - dense_5_loss: 0.4090 - loss: 1.9691 - parsing_head_loss: 0.4101 - learning_rate: 1.0000e-03 - dev_UPOS: 95.6984 - dev_UFeats: 86.4074 - dev_Lemmas: 82.7020 - dev_UAS: 74.1631 - dev_LAS: 65.8993 | |
| Epoch 9/20 | |
| 319/319 - 47s - 148ms/step - dense_1_loss: 0.1561 - dense_3_loss: 0.4713 - dense_5_loss: 0.3972 - loss: 1.8996 - parsing_head_loss: 0.3948 - learning_rate: 1.0000e-03 - dev_UPOS: 95.6709 - dev_UFeats: 86.2973 - dev_Lemmas: 83.0872 - dev_UAS: 75.0344 - dev_LAS: 66.3487 | |
| Epoch 10/20 | |
| 319/319 - 47s - 146ms/step - dense_1_loss: 0.1590 - dense_3_loss: 0.4727 - dense_5_loss: 0.3997 - loss: 1.9004 - parsing_head_loss: 0.3945 - learning_rate: 1.0000e-03 - dev_UPOS: 95.6984 - dev_UFeats: 86.5175 - dev_Lemmas: 83.3165 - dev_UAS: 75.2637 - dev_LAS: 67.0549 | |
| Epoch 11/20 | |
| 319/319 - 47s - 148ms/step - dense_1_loss: 0.1544 - dense_3_loss: 0.4592 - dense_5_loss: 0.3919 - loss: 1.8534 - parsing_head_loss: 0.3850 - learning_rate: 1.0000e-03 - dev_UPOS: 95.9277 - dev_UFeats: 86.5175 - dev_Lemmas: 83.1514 - dev_UAS: 75.9974 - dev_LAS: 67.4035 | |
| Epoch 12/20 | |
| 319/319 - 47s - 148ms/step - dense_1_loss: 0.1530 - dense_3_loss: 0.4516 - dense_5_loss: 0.3868 - loss: 1.8219 - parsing_head_loss: 0.3785 - learning_rate: 1.0000e-03 - dev_UPOS: 95.7810 - dev_UFeats: 86.7376 - dev_Lemmas: 83.7843 - dev_UAS: 76.0066 - dev_LAS: 67.4952 | |
| Epoch 13/20 | |
| 319/319 - 48s - 149ms/step - dense_1_loss: 0.1497 - dense_3_loss: 0.4368 - dense_5_loss: 0.3795 - loss: 1.7703 - parsing_head_loss: 0.3676 - learning_rate: 1.0000e-03 - dev_UPOS: 96.0378 - dev_UFeats: 86.5175 - dev_Lemmas: 83.8118 - dev_UAS: 76.4652 - dev_LAS: 68.5041 | |
| Epoch 14/20 | |
| 319/319 - 47s - 148ms/step - dense_1_loss: 0.1495 - dense_3_loss: 0.4314 - dense_5_loss: 0.3793 - loss: 1.7641 - parsing_head_loss: 0.3651 - learning_rate: 1.0000e-03 - dev_UPOS: 95.7810 - dev_UFeats: 86.8018 - dev_Lemmas: 83.8852 - dev_UAS: 76.1992 - dev_LAS: 68.1189 | |
| Epoch 15/20 | |
| 319/319 - 47s - 148ms/step - dense_1_loss: 0.1507 - dense_3_loss: 0.4319 - dense_5_loss: 0.3804 - loss: 1.7555 - parsing_head_loss: 0.3631 - learning_rate: 1.0000e-03 - dev_UPOS: 95.9094 - dev_UFeats: 86.7009 - dev_Lemmas: 84.0044 - dev_UAS: 76.6028 - dev_LAS: 68.3482 | |
| Epoch 16/20 | |
| 319/319 - 47s - 148ms/step - dense_1_loss: 0.1488 - dense_3_loss: 0.4267 - dense_5_loss: 0.3816 - loss: 1.7477 - parsing_head_loss: 0.3629 - learning_rate: 1.0000e-03 - dev_UPOS: 95.9919 - dev_UFeats: 86.6459 - dev_Lemmas: 83.9585 - dev_UAS: 76.9880 - dev_LAS: 69.0085 | |
| Epoch 17/20 | |
| 319/319 - 47s - 148ms/step - dense_1_loss: 0.1462 - dense_3_loss: 0.4171 - dense_5_loss: 0.3698 - loss: 1.7093 - parsing_head_loss: 0.3555 - learning_rate: 1.0000e-03 - dev_UPOS: 95.8544 - dev_UFeats: 86.7193 - dev_Lemmas: 84.4722 - dev_UAS: 77.1898 - dev_LAS: 69.0911 | |
| Epoch 18/20 | |
| 319/319 - 47s - 148ms/step - dense_1_loss: 0.1462 - dense_3_loss: 0.4209 - dense_5_loss: 0.3700 - loss: 1.7049 - parsing_head_loss: 0.3523 - learning_rate: 1.0000e-03 - dev_UPOS: 96.0103 - dev_UFeats: 86.5542 - dev_Lemmas: 84.4630 - dev_UAS: 77.4741 - dev_LAS: 69.0085 | |
| Epoch 19/20 | |
| 319/319 - 47s - 147ms/step - dense_1_loss: 0.1462 - dense_3_loss: 0.4230 - dense_5_loss: 0.3723 - loss: 1.7028 - parsing_head_loss: 0.3499 - learning_rate: 1.0000e-03 - dev_UPOS: 96.2121 - dev_UFeats: 86.6917 - dev_Lemmas: 84.5914 - dev_UAS: 77.4191 - dev_LAS: 69.3020 | |
| Epoch 20/20 | |
| 319/319 - 47s - 147ms/step - dense_1_loss: 0.1449 - dense_3_loss: 0.4171 - dense_5_loss: 0.3664 - loss: 1.6902 - parsing_head_loss: 0.3478 - learning_rate: 1.0000e-03 - dev_UPOS: 96.0286 - dev_UFeats: 86.6000 - dev_Lemmas: 84.5364 - dev_UAS: 77.5750 - dev_LAS: 69.1828 | |
| Epoch 21/120 | |
| /gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/.venv/lib/python3.12/site-packages/keras/src/optimizers/base_optimizer.py:731: UserWarning: Gradients do not exist for variables ['variable_783', 'variable_784'] when minimizing the loss. If using `model.compile()`, did you forget to provide a `loss` argument? | |
| warnings.warn( | |
| 319/319 - 119s - 373ms/step - dense_1_loss: 0.1385 - dense_3_loss: 0.3823 - dense_5_loss: 0.3379 - loss: 1.5763 - parsing_head_loss: 0.3282 - learning_rate: 3.1900e-06 - dev_UPOS: 96.2579 - dev_UFeats: 88.3610 - dev_Lemmas: 85.7746 - dev_UAS: 78.2812 - dev_LAS: 70.1458 | |
| Epoch 22/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.1323 - dense_3_loss: 0.3601 - dense_5_loss: 0.3065 - loss: 1.4845 - parsing_head_loss: 0.3118 - learning_rate: 6.3800e-06 - dev_UPOS: 96.4047 - dev_UFeats: 89.5258 - dev_Lemmas: 86.3432 - dev_UAS: 78.8957 - dev_LAS: 70.9346 | |
| Epoch 23/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.1313 - dense_3_loss: 0.3562 - dense_5_loss: 0.2980 - loss: 1.4578 - parsing_head_loss: 0.3071 - learning_rate: 9.5700e-06 - dev_UPOS: 96.4964 - dev_UFeats: 90.1403 - dev_Lemmas: 86.9669 - dev_UAS: 79.2901 - dev_LAS: 71.6684 | |
| Epoch 24/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.1284 - dense_3_loss: 0.3436 - dense_5_loss: 0.2849 - loss: 1.4103 - parsing_head_loss: 0.2982 - learning_rate: 1.2760e-05 - dev_UPOS: 96.6064 - dev_UFeats: 90.6906 - dev_Lemmas: 87.4255 - dev_UAS: 79.4827 - dev_LAS: 71.9894 | |
| Epoch 25/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.1280 - dense_3_loss: 0.3364 - dense_5_loss: 0.2808 - loss: 1.3872 - parsing_head_loss: 0.2948 - learning_rate: 1.5950e-05 - dev_UPOS: 96.5973 - dev_UFeats: 90.7732 - dev_Lemmas: 87.8382 - dev_UAS: 79.8588 - dev_LAS: 72.3654 | |
| Epoch 26/120 | |
| 319/319 - 119s - 373ms/step - dense_1_loss: 0.1241 - dense_3_loss: 0.3243 - dense_5_loss: 0.2704 - loss: 1.3395 - parsing_head_loss: 0.2844 - learning_rate: 1.9140e-05 - dev_UPOS: 96.7348 - dev_UFeats: 91.1401 - dev_Lemmas: 88.2876 - dev_UAS: 79.9780 - dev_LAS: 72.5672 | |
| Epoch 27/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.1227 - dense_3_loss: 0.3165 - dense_5_loss: 0.2652 - loss: 1.3156 - parsing_head_loss: 0.2804 - learning_rate: 1.9997e-05 - dev_UPOS: 96.7257 - dev_UFeats: 91.4427 - dev_Lemmas: 88.3702 - dev_UAS: 80.7301 - dev_LAS: 73.5027 | |
| Epoch 28/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.1247 - dense_3_loss: 0.3399 - dense_5_loss: 0.2654 - loss: 1.3321 - parsing_head_loss: 0.2761 - learning_rate: 1.9983e-05 - dev_UPOS: 96.5697 - dev_UFeats: 91.1401 - dev_Lemmas: 87.2329 - dev_UAS: 80.4733 - dev_LAS: 73.1725 | |
| Epoch 29/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.1240 - dense_3_loss: 0.3514 - dense_5_loss: 0.2657 - loss: 1.3377 - parsing_head_loss: 0.2733 - learning_rate: 1.9958e-05 - dev_UPOS: 96.5422 - dev_UFeats: 91.4702 - dev_Lemmas: 87.5997 - dev_UAS: 80.2807 - dev_LAS: 73.2276 | |
| Epoch 30/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.1213 - dense_3_loss: 0.3353 - dense_5_loss: 0.2564 - loss: 1.2933 - parsing_head_loss: 0.2668 - learning_rate: 1.9922e-05 - dev_UPOS: 96.6156 - dev_UFeats: 91.5711 - dev_Lemmas: 88.0125 - dev_UAS: 80.7209 - dev_LAS: 73.6586 | |
| Epoch 31/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.1189 - dense_3_loss: 0.3207 - dense_5_loss: 0.2492 - loss: 1.2555 - parsing_head_loss: 0.2600 - learning_rate: 1.9875e-05 - dev_UPOS: 96.6248 - dev_UFeats: 91.5528 - dev_Lemmas: 88.0950 - dev_UAS: 80.5191 - dev_LAS: 73.3926 | |
| Epoch 32/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.1176 - dense_3_loss: 0.3127 - dense_5_loss: 0.2456 - loss: 1.2358 - parsing_head_loss: 0.2577 - learning_rate: 1.9816e-05 - dev_UPOS: 96.5881 - dev_UFeats: 91.7913 - dev_Lemmas: 88.5903 - dev_UAS: 80.7484 - dev_LAS: 73.5394 | |
| Epoch 33/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.1171 - dense_3_loss: 0.3062 - dense_5_loss: 0.2440 - loss: 1.2205 - parsing_head_loss: 0.2546 - learning_rate: 1.9747e-05 - dev_UPOS: 96.6248 - dev_UFeats: 91.9105 - dev_Lemmas: 88.7279 - dev_UAS: 81.0694 - dev_LAS: 74.1631 | |
| Epoch 34/120 | |
| 319/319 - 117s - 367ms/step - dense_1_loss: 0.1170 - dense_3_loss: 0.3011 - dense_5_loss: 0.2414 - loss: 1.2074 - parsing_head_loss: 0.2520 - learning_rate: 1.9666e-05 - dev_UPOS: 96.6982 - dev_UFeats: 92.0114 - dev_Lemmas: 88.9480 - dev_UAS: 81.2070 - dev_LAS: 74.1906 | |
| Epoch 35/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.1131 - dense_3_loss: 0.2862 - dense_5_loss: 0.2331 - loss: 1.1602 - parsing_head_loss: 0.2428 - learning_rate: 1.9575e-05 - dev_UPOS: 96.6340 - dev_UFeats: 92.0205 - dev_Lemmas: 89.0672 - dev_UAS: 81.0969 - dev_LAS: 74.0989 | |
| Epoch 36/120 | |
| 319/319 - 119s - 373ms/step - dense_1_loss: 0.1107 - dense_3_loss: 0.2792 - dense_5_loss: 0.2267 - loss: 1.1310 - parsing_head_loss: 0.2381 - learning_rate: 1.9473e-05 - dev_UPOS: 96.6798 - dev_UFeats: 92.0022 - dev_Lemmas: 89.2048 - dev_UAS: 81.4546 - dev_LAS: 74.4749 | |
| Epoch 37/120 | |
| 319/319 - 119s - 373ms/step - dense_1_loss: 0.1103 - dense_3_loss: 0.2745 - dense_5_loss: 0.2243 - loss: 1.1184 - parsing_head_loss: 0.2335 - learning_rate: 1.9360e-05 - dev_UPOS: 96.7440 - dev_UFeats: 92.1123 - dev_Lemmas: 89.2782 - dev_UAS: 81.4638 - dev_LAS: 74.4749 | |
| Epoch 38/120 | |
| 319/319 - 119s - 373ms/step - dense_1_loss: 0.1095 - dense_3_loss: 0.2741 - dense_5_loss: 0.2221 - loss: 1.1060 - parsing_head_loss: 0.2301 - learning_rate: 1.9237e-05 - dev_UPOS: 96.7073 - dev_UFeats: 92.1948 - dev_Lemmas: 89.4433 - dev_UAS: 81.5922 - dev_LAS: 74.6767 | |
| Epoch 39/120 | |
| 319/319 - 119s - 373ms/step - dense_1_loss: 0.1083 - dense_3_loss: 0.2663 - dense_5_loss: 0.2203 - loss: 1.0912 - parsing_head_loss: 0.2287 - learning_rate: 1.9103e-05 - dev_UPOS: 96.7899 - dev_UFeats: 92.2040 - dev_Lemmas: 89.5900 - dev_UAS: 81.6564 - dev_LAS: 74.5208 | |
| Epoch 40/120 | |
| 319/319 - 119s - 371ms/step - dense_1_loss: 0.1078 - dense_3_loss: 0.2597 - dense_5_loss: 0.2181 - loss: 1.0751 - parsing_head_loss: 0.2262 - learning_rate: 1.8960e-05 - dev_UPOS: 96.7348 - dev_UFeats: 92.0572 - dev_Lemmas: 89.6451 - dev_UAS: 81.8674 - dev_LAS: 74.9610 | |
| Epoch 41/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.1073 - dense_3_loss: 0.2565 - dense_5_loss: 0.2161 - loss: 1.0628 - parsing_head_loss: 0.2227 - learning_rate: 1.8806e-05 - dev_UPOS: 96.7715 - dev_UFeats: 92.1856 - dev_Lemmas: 89.7826 - dev_UAS: 81.6106 - dev_LAS: 74.6492 | |
| Epoch 42/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.1068 - dense_3_loss: 0.2524 - dense_5_loss: 0.2135 - loss: 1.0497 - parsing_head_loss: 0.2197 - learning_rate: 1.8642e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.2223 - dev_Lemmas: 89.9385 - dev_UAS: 81.8765 - dev_LAS: 74.9794 | |
| Epoch 43/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.1050 - dense_3_loss: 0.2498 - dense_5_loss: 0.2108 - loss: 1.0346 - parsing_head_loss: 0.2162 - learning_rate: 1.8469e-05 - dev_UPOS: 96.8449 - dev_UFeats: 92.3324 - dev_Lemmas: 90.0486 - dev_UAS: 81.9041 - dev_LAS: 74.9885 | |
| Epoch 44/120 | |
| 319/319 - 120s - 375ms/step - dense_1_loss: 0.1037 - dense_3_loss: 0.2427 - dense_5_loss: 0.2060 - loss: 1.0097 - parsing_head_loss: 0.2098 - learning_rate: 1.8286e-05 - dev_UPOS: 96.7165 - dev_UFeats: 92.1581 - dev_Lemmas: 90.0486 - dev_UAS: 81.3446 - dev_LAS: 74.4749 | |
| Epoch 45/120 | |
| 319/319 - 119s - 374ms/step - dense_1_loss: 0.1055 - dense_3_loss: 0.2472 - dense_5_loss: 0.2106 - loss: 1.0258 - parsing_head_loss: 0.2135 - learning_rate: 1.8093e-05 - dev_UPOS: 96.6890 - dev_UFeats: 92.3232 - dev_Lemmas: 90.2320 - dev_UAS: 81.9316 - dev_LAS: 74.9885 | |
| Epoch 46/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.1047 - dense_3_loss: 0.2424 - dense_5_loss: 0.2084 - loss: 1.0162 - parsing_head_loss: 0.2131 - learning_rate: 1.7892e-05 - dev_UPOS: 96.7899 - dev_UFeats: 92.3049 - dev_Lemmas: 90.3971 - dev_UAS: 82.1976 - dev_LAS: 75.3004 | |
| Epoch 47/120 | |
| 319/319 - 119s - 373ms/step - dense_1_loss: 0.1033 - dense_3_loss: 0.2379 - dense_5_loss: 0.2035 - loss: 0.9938 - parsing_head_loss: 0.2076 - learning_rate: 1.7682e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.2590 - dev_Lemmas: 90.3513 - dev_UAS: 81.9774 - dev_LAS: 75.1169 | |
| Epoch 48/120 | |
| 319/319 - 119s - 374ms/step - dense_1_loss: 0.1016 - dense_3_loss: 0.2314 - dense_5_loss: 0.2006 - loss: 0.9747 - parsing_head_loss: 0.2033 - learning_rate: 1.7463e-05 - dev_UPOS: 96.8633 - dev_UFeats: 92.4058 - dev_Lemmas: 90.5164 - dev_UAS: 82.1242 - dev_LAS: 75.2637 | |
| Epoch 49/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.1031 - dense_3_loss: 0.2358 - dense_5_loss: 0.2034 - loss: 0.9852 - parsing_head_loss: 0.2051 - learning_rate: 1.7236e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.2498 - dev_Lemmas: 90.3605 - dev_UAS: 81.9683 - dev_LAS: 75.1628 | |
| Epoch 50/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.1018 - dense_3_loss: 0.2317 - dense_5_loss: 0.2006 - loss: 0.9704 - parsing_head_loss: 0.2007 - learning_rate: 1.7000e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.3874 - dev_Lemmas: 90.5164 - dev_UAS: 81.9591 - dev_LAS: 75.3554 | |
| Epoch 51/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.1018 - dense_3_loss: 0.2302 - dense_5_loss: 0.2006 - loss: 0.9660 - parsing_head_loss: 0.1994 - learning_rate: 1.6757e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.2774 - dev_Lemmas: 90.4797 - dev_UAS: 82.1334 - dev_LAS: 75.4196 | |
| Epoch 52/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.1019 - dense_3_loss: 0.2286 - dense_5_loss: 0.1995 - loss: 0.9613 - parsing_head_loss: 0.1988 - learning_rate: 1.6506e-05 - dev_UPOS: 96.7807 - dev_UFeats: 92.3507 - dev_Lemmas: 90.5806 - dev_UAS: 82.1425 - dev_LAS: 75.3371 | |
| Epoch 53/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.1000 - dense_3_loss: 0.2238 - dense_5_loss: 0.1956 - loss: 0.9408 - parsing_head_loss: 0.1941 - learning_rate: 1.6248e-05 - dev_UPOS: 96.7165 - dev_UFeats: 92.4149 - dev_Lemmas: 90.5622 - dev_UAS: 82.2159 - dev_LAS: 75.2820 | |
| Epoch 54/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.1001 - dense_3_loss: 0.2233 - dense_5_loss: 0.1957 - loss: 0.9387 - parsing_head_loss: 0.1936 - learning_rate: 1.5983e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.4149 - dev_Lemmas: 90.7548 - dev_UAS: 82.2159 - dev_LAS: 75.4380 | |
| Epoch 55/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.0982 - dense_3_loss: 0.2167 - dense_5_loss: 0.1912 - loss: 0.9150 - parsing_head_loss: 0.1883 - learning_rate: 1.5711e-05 - dev_UPOS: 96.8541 - dev_UFeats: 92.4516 - dev_Lemmas: 90.7824 - dev_UAS: 82.4819 - dev_LAS: 75.8599 | |
| Epoch 56/120 | |
| 319/319 - 117s - 368ms/step - dense_1_loss: 0.1010 - dense_3_loss: 0.2218 - dense_5_loss: 0.1963 - loss: 0.9380 - parsing_head_loss: 0.1933 - learning_rate: 1.5433e-05 - dev_UPOS: 96.8449 - dev_UFeats: 92.3966 - dev_Lemmas: 90.7273 - dev_UAS: 82.2709 - dev_LAS: 75.6306 | |
| Epoch 57/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.1000 - dense_3_loss: 0.2185 - dense_5_loss: 0.1936 - loss: 0.9218 - parsing_head_loss: 0.1890 - learning_rate: 1.5148e-05 - dev_UPOS: 96.7715 - dev_UFeats: 92.4975 - dev_Lemmas: 90.7365 - dev_UAS: 82.3535 - dev_LAS: 75.6306 | |
| Epoch 58/120 | |
| 319/319 - 119s - 373ms/step - dense_1_loss: 0.0968 - dense_3_loss: 0.2121 - dense_5_loss: 0.1874 - loss: 0.8931 - parsing_head_loss: 0.1823 - learning_rate: 1.4858e-05 - dev_UPOS: 96.8633 - dev_UFeats: 92.6167 - dev_Lemmas: 90.7732 - dev_UAS: 82.4635 - dev_LAS: 75.6948 | |
| Epoch 59/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0988 - dense_3_loss: 0.2156 - dense_5_loss: 0.1914 - loss: 0.9091 - parsing_head_loss: 0.1852 - learning_rate: 1.4562e-05 - dev_UPOS: 96.8541 - dev_UFeats: 92.5158 - dev_Lemmas: 90.7915 - dev_UAS: 82.2801 - dev_LAS: 75.7315 | |
| Epoch 60/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0977 - dense_3_loss: 0.2126 - dense_5_loss: 0.1890 - loss: 0.8969 - parsing_head_loss: 0.1826 - learning_rate: 1.4262e-05 - dev_UPOS: 96.7899 - dev_UFeats: 92.5617 - dev_Lemmas: 90.8557 - dev_UAS: 82.4911 - dev_LAS: 75.8323 | |
| Epoch 61/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0961 - dense_3_loss: 0.2089 - dense_5_loss: 0.1857 - loss: 0.8822 - parsing_head_loss: 0.1799 - learning_rate: 1.3956e-05 - dev_UPOS: 96.8174 - dev_UFeats: 92.4608 - dev_Lemmas: 90.9474 - dev_UAS: 82.2526 - dev_LAS: 75.5388 | |
| Epoch 62/120 | |
| 319/319 - 117s - 368ms/step - dense_1_loss: 0.0974 - dense_3_loss: 0.2105 - dense_5_loss: 0.1882 - loss: 0.8906 - parsing_head_loss: 0.1812 - learning_rate: 1.3646e-05 - dev_UPOS: 96.8816 - dev_UFeats: 92.4791 - dev_Lemmas: 90.8741 - dev_UAS: 82.5094 - dev_LAS: 75.9607 | |
| Epoch 63/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0971 - dense_3_loss: 0.2096 - dense_5_loss: 0.1874 - loss: 0.8835 - parsing_head_loss: 0.1789 - learning_rate: 1.3332e-05 - dev_UPOS: 96.8266 - dev_UFeats: 92.3874 - dev_Lemmas: 90.8924 - dev_UAS: 82.5186 - dev_LAS: 75.7957 | |
| Epoch 64/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0969 - dense_3_loss: 0.2081 - dense_5_loss: 0.1864 - loss: 0.8806 - parsing_head_loss: 0.1789 - learning_rate: 1.3014e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.5433 - dev_Lemmas: 90.9658 - dev_UAS: 82.4085 - dev_LAS: 75.7865 | |
| Epoch 65/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.0951 - dense_3_loss: 0.2036 - dense_5_loss: 0.1826 - loss: 0.8593 - parsing_head_loss: 0.1732 - learning_rate: 1.2693e-05 - dev_UPOS: 96.8724 - dev_UFeats: 92.5158 - dev_Lemmas: 90.9750 - dev_UAS: 82.3810 - dev_LAS: 75.7681 | |
| Epoch 66/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0954 - dense_3_loss: 0.2046 - dense_5_loss: 0.1836 - loss: 0.8627 - parsing_head_loss: 0.1741 - learning_rate: 1.2369e-05 - dev_UPOS: 96.8449 - dev_UFeats: 92.5342 - dev_Lemmas: 90.9199 - dev_UAS: 82.6286 - dev_LAS: 75.9974 | |
| Epoch 67/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.0952 - dense_3_loss: 0.2028 - dense_5_loss: 0.1825 - loss: 0.8563 - parsing_head_loss: 0.1719 - learning_rate: 1.2042e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.5342 - dev_Lemmas: 90.9566 - dev_UAS: 82.4085 - dev_LAS: 75.7865 | |
| Epoch 68/120 | |
| 319/319 - 117s - 366ms/step - dense_1_loss: 0.0961 - dense_3_loss: 0.2042 - dense_5_loss: 0.1841 - loss: 0.8612 - parsing_head_loss: 0.1740 - learning_rate: 1.1713e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.5433 - dev_Lemmas: 91.0025 - dev_UAS: 82.4360 - dev_LAS: 75.9057 | |
| Epoch 69/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0943 - dense_3_loss: 0.2004 - dense_5_loss: 0.1807 - loss: 0.8462 - parsing_head_loss: 0.1700 - learning_rate: 1.1381e-05 - dev_UPOS: 96.8724 - dev_UFeats: 92.6993 - dev_Lemmas: 91.0759 - dev_UAS: 82.4452 - dev_LAS: 75.8048 | |
| Epoch 70/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0945 - dense_3_loss: 0.2005 - dense_5_loss: 0.1809 - loss: 0.8462 - parsing_head_loss: 0.1703 - learning_rate: 1.1049e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.5433 - dev_Lemmas: 90.9841 - dev_UAS: 82.5644 - dev_LAS: 75.9699 | |
| Epoch 71/120 | |
| 319/319 - 118s - 368ms/step - dense_1_loss: 0.0949 - dense_3_loss: 0.2006 - dense_5_loss: 0.1819 - loss: 0.8481 - parsing_head_loss: 0.1705 - learning_rate: 1.0715e-05 - dev_UPOS: 96.7807 - dev_UFeats: 92.6809 - dev_Lemmas: 90.9016 - dev_UAS: 82.5277 - dev_LAS: 75.7681 | |
| Epoch 72/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0946 - dense_3_loss: 0.1989 - dense_5_loss: 0.1808 - loss: 0.8418 - parsing_head_loss: 0.1688 - learning_rate: 1.0380e-05 - dev_UPOS: 96.8449 - dev_UFeats: 92.6442 - dev_Lemmas: 91.0300 - dev_UAS: 82.7662 - dev_LAS: 76.1075 | |
| Epoch 73/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0941 - dense_3_loss: 0.1976 - dense_5_loss: 0.1795 - loss: 0.8370 - parsing_head_loss: 0.1682 - learning_rate: 1.0045e-05 - dev_UPOS: 96.8082 - dev_UFeats: 92.6442 - dev_Lemmas: 91.1401 - dev_UAS: 82.6195 - dev_LAS: 76.0525 | |
| Epoch 74/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0941 - dense_3_loss: 0.1984 - dense_5_loss: 0.1792 - loss: 0.8365 - parsing_head_loss: 0.1677 - learning_rate: 9.7100e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.5709 - dev_Lemmas: 91.0208 - dev_UAS: 82.7295 - dev_LAS: 75.8782 | |
| Epoch 75/120 | |
| 319/319 - 119s - 373ms/step - dense_1_loss: 0.0924 - dense_3_loss: 0.1937 - dense_5_loss: 0.1759 - loss: 0.8182 - parsing_head_loss: 0.1641 - learning_rate: 9.3752e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.6351 - dev_Lemmas: 90.9933 - dev_UAS: 82.7112 - dev_LAS: 76.1167 | |
| Epoch 76/120 | |
| 319/319 - 119s - 373ms/step - dense_1_loss: 0.0923 - dense_3_loss: 0.1932 - dense_5_loss: 0.1756 - loss: 0.8164 - parsing_head_loss: 0.1638 - learning_rate: 9.0411e-06 - dev_UPOS: 96.8449 - dev_UFeats: 92.5525 - dev_Lemmas: 91.0759 - dev_UAS: 82.9038 - dev_LAS: 76.2176 | |
| Epoch 77/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0938 - dense_3_loss: 0.1958 - dense_5_loss: 0.1777 - loss: 0.8261 - parsing_head_loss: 0.1656 - learning_rate: 8.7081e-06 - dev_UPOS: 96.8266 - dev_UFeats: 92.6626 - dev_Lemmas: 91.0575 - dev_UAS: 82.6103 - dev_LAS: 75.7590 | |
| Epoch 78/120 | |
| 319/319 - 118s - 368ms/step - dense_1_loss: 0.0941 - dense_3_loss: 0.1964 - dense_5_loss: 0.1783 - loss: 0.8268 - parsing_head_loss: 0.1653 - learning_rate: 8.3765e-06 - dev_UPOS: 96.8174 - dev_UFeats: 92.6075 - dev_Lemmas: 91.0850 - dev_UAS: 82.8121 - dev_LAS: 76.1625 | |
| Epoch 79/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0921 - dense_3_loss: 0.1916 - dense_5_loss: 0.1748 - loss: 0.8098 - parsing_head_loss: 0.1615 - learning_rate: 8.0468e-06 - dev_UPOS: 96.8357 - dev_UFeats: 92.5617 - dev_Lemmas: 91.1125 - dev_UAS: 82.6011 - dev_LAS: 76.0066 | |
| Epoch 80/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.0928 - dense_3_loss: 0.1932 - dense_5_loss: 0.1763 - loss: 0.8147 - parsing_head_loss: 0.1624 - learning_rate: 7.7192e-06 - dev_UPOS: 96.8266 - dev_UFeats: 92.5433 - dev_Lemmas: 91.1217 - dev_UAS: 82.4819 - dev_LAS: 75.8507 | |
| Epoch 81/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.0922 - dense_3_loss: 0.1912 - dense_5_loss: 0.1746 - loss: 0.8088 - parsing_head_loss: 0.1618 - learning_rate: 7.3942e-06 - dev_UPOS: 96.8541 - dev_UFeats: 92.5892 - dev_Lemmas: 91.1401 - dev_UAS: 82.8212 - dev_LAS: 76.1900 | |
| Epoch 82/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.0917 - dense_3_loss: 0.1904 - dense_5_loss: 0.1734 - loss: 0.8012 - parsing_head_loss: 0.1596 - learning_rate: 7.0722e-06 - dev_UPOS: 96.8266 - dev_UFeats: 92.5800 - dev_Lemmas: 91.1767 - dev_UAS: 82.6928 - dev_LAS: 76.0433 | |
| Epoch 83/120 | |
| 319/319 - 117s - 368ms/step - dense_1_loss: 0.0929 - dense_3_loss: 0.1923 - dense_5_loss: 0.1755 - loss: 0.8112 - parsing_head_loss: 0.1623 - learning_rate: 6.7534e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.6167 - dev_Lemmas: 91.1951 - dev_UAS: 82.6837 - dev_LAS: 75.9699 | |
| Epoch 84/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.0919 - dense_3_loss: 0.1904 - dense_5_loss: 0.1736 - loss: 0.8032 - parsing_head_loss: 0.1605 - learning_rate: 6.4382e-06 - dev_UPOS: 96.8357 - dev_UFeats: 92.5984 - dev_Lemmas: 91.2409 - dev_UAS: 82.8671 - dev_LAS: 76.2726 | |
| Epoch 85/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0926 - dense_3_loss: 0.1914 - dense_5_loss: 0.1743 - loss: 0.8058 - parsing_head_loss: 0.1609 - learning_rate: 6.1271e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2134 - dev_UAS: 82.8029 - dev_LAS: 76.1900 | |
| Epoch 86/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.0915 - dense_3_loss: 0.1895 - dense_5_loss: 0.1732 - loss: 0.7982 - parsing_head_loss: 0.1595 - learning_rate: 5.8203e-06 - dev_UPOS: 96.8266 - dev_UFeats: 92.6626 - dev_Lemmas: 91.2685 - dev_UAS: 82.8854 - dev_LAS: 76.2176 | |
| Epoch 87/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.0916 - dense_3_loss: 0.1888 - dense_5_loss: 0.1731 - loss: 0.7967 - parsing_head_loss: 0.1592 - learning_rate: 5.5182e-06 - dev_UPOS: 96.8082 - dev_UFeats: 92.5342 - dev_Lemmas: 91.1492 - dev_UAS: 82.8121 - dev_LAS: 76.1809 | |
| Epoch 88/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.0912 - dense_3_loss: 0.1870 - dense_5_loss: 0.1717 - loss: 0.7896 - parsing_head_loss: 0.1573 - learning_rate: 5.2212e-06 - dev_UPOS: 96.8541 - dev_UFeats: 92.5525 - dev_Lemmas: 91.1584 - dev_UAS: 82.8396 - dev_LAS: 76.2359 | |
| Epoch 89/120 | |
| 319/319 - 119s - 374ms/step - dense_1_loss: 0.0902 - dense_3_loss: 0.1852 - dense_5_loss: 0.1699 - loss: 0.7832 - parsing_head_loss: 0.1564 - learning_rate: 4.9295e-06 - dev_UPOS: 96.8357 - dev_UFeats: 92.5158 - dev_Lemmas: 91.1951 - dev_UAS: 82.8488 - dev_LAS: 76.2451 | |
| Epoch 90/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.0908 - dense_3_loss: 0.1866 - dense_5_loss: 0.1711 - loss: 0.7863 - parsing_head_loss: 0.1566 - learning_rate: 4.6435e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.5709 - dev_Lemmas: 91.1584 - dev_UAS: 82.8121 - dev_LAS: 76.1258 | |
| Epoch 91/120 | |
| 319/319 - 117s - 367ms/step - dense_1_loss: 0.0928 - dense_3_loss: 0.1897 - dense_5_loss: 0.1743 - loss: 0.8008 - parsing_head_loss: 0.1597 - learning_rate: 4.3635e-06 - dev_UPOS: 96.8357 - dev_UFeats: 92.6442 - dev_Lemmas: 91.2318 - dev_UAS: 82.9221 - dev_LAS: 76.1992 | |
| Epoch 92/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0916 - dense_3_loss: 0.1877 - dense_5_loss: 0.1720 - loss: 0.7908 - parsing_head_loss: 0.1573 - learning_rate: 4.0899e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.5617 - dev_Lemmas: 91.1584 - dev_UAS: 82.8671 - dev_LAS: 76.2084 | |
| Epoch 93/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0915 - dense_3_loss: 0.1874 - dense_5_loss: 0.1716 - loss: 0.7898 - parsing_head_loss: 0.1573 - learning_rate: 3.8229e-06 - dev_UPOS: 96.8449 - dev_UFeats: 92.6167 - dev_Lemmas: 91.2226 - dev_UAS: 83.0047 - dev_LAS: 76.4652 | |
| Epoch 94/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.0906 - dense_3_loss: 0.1859 - dense_5_loss: 0.1707 - loss: 0.7818 - parsing_head_loss: 0.1557 - learning_rate: 3.5628e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.6167 - dev_Lemmas: 91.1859 - dev_UAS: 82.9405 - dev_LAS: 76.3643 | |
| Epoch 95/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0910 - dense_3_loss: 0.1860 - dense_5_loss: 0.1708 - loss: 0.7825 - parsing_head_loss: 0.1559 - learning_rate: 3.3100e-06 - dev_UPOS: 96.8082 - dev_UFeats: 92.5800 - dev_Lemmas: 91.2501 - dev_UAS: 82.9680 - dev_LAS: 76.3368 | |
| Epoch 96/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.0911 - dense_3_loss: 0.1862 - dense_5_loss: 0.1707 - loss: 0.7841 - parsing_head_loss: 0.1562 - learning_rate: 3.0647e-06 - dev_UPOS: 96.8541 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2501 - dev_UAS: 82.9772 - dev_LAS: 76.3184 | |
| Epoch 97/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.0909 - dense_3_loss: 0.1858 - dense_5_loss: 0.1702 - loss: 0.7812 - parsing_head_loss: 0.1550 - learning_rate: 2.8272e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.6351 - dev_Lemmas: 91.2226 - dev_UAS: 82.9496 - dev_LAS: 76.1992 | |
| Epoch 98/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0916 - dense_3_loss: 0.1872 - dense_5_loss: 0.1721 - loss: 0.7876 - parsing_head_loss: 0.1568 - learning_rate: 2.5977e-06 - dev_UPOS: 96.8816 - dev_UFeats: 92.6442 - dev_Lemmas: 91.2501 - dev_UAS: 83.1056 - dev_LAS: 76.3918 | |
| Epoch 99/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0911 - dense_3_loss: 0.1858 - dense_5_loss: 0.1709 - loss: 0.7825 - parsing_head_loss: 0.1560 - learning_rate: 2.3765e-06 - dev_UPOS: 96.8908 - dev_UFeats: 92.6351 - dev_Lemmas: 91.2868 - dev_UAS: 83.0780 - dev_LAS: 76.4193 | |
| Epoch 100/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.0910 - dense_3_loss: 0.1860 - dense_5_loss: 0.1707 - loss: 0.7828 - parsing_head_loss: 0.1563 - learning_rate: 2.1639e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 83.0597 - dev_LAS: 76.3460 | |
| Epoch 101/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0910 - dense_3_loss: 0.1853 - dense_5_loss: 0.1701 - loss: 0.7803 - parsing_head_loss: 0.1553 - learning_rate: 1.9601e-06 - dev_UPOS: 96.8816 - dev_UFeats: 92.6075 - dev_Lemmas: 91.2501 - dev_UAS: 82.9405 - dev_LAS: 76.2176 | |
| Epoch 102/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0917 - dense_3_loss: 0.1868 - dense_5_loss: 0.1715 - loss: 0.7851 - parsing_head_loss: 0.1563 - learning_rate: 1.7654e-06 - dev_UPOS: 96.8908 - dev_UFeats: 92.6626 - dev_Lemmas: 91.2043 - dev_UAS: 83.0322 - dev_LAS: 76.3093 | |
| Epoch 103/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0904 - dense_3_loss: 0.1838 - dense_5_loss: 0.1689 - loss: 0.7747 - parsing_head_loss: 0.1546 - learning_rate: 1.5799e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.6534 - dev_Lemmas: 91.2226 - dev_UAS: 83.0597 - dev_LAS: 76.3093 | |
| Epoch 104/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0914 - dense_3_loss: 0.1863 - dense_5_loss: 0.1716 - loss: 0.7853 - parsing_head_loss: 0.1562 - learning_rate: 1.4038e-06 - dev_UPOS: 96.8357 - dev_UFeats: 92.6717 - dev_Lemmas: 91.2318 - dev_UAS: 82.9588 - dev_LAS: 76.2542 | |
| Epoch 105/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0907 - dense_3_loss: 0.1852 - dense_5_loss: 0.1694 - loss: 0.7765 - parsing_head_loss: 0.1546 - learning_rate: 1.2374e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.6626 - dev_Lemmas: 91.2593 - dev_UAS: 82.9221 - dev_LAS: 76.2909 | |
| Epoch 106/120 | |
| 319/319 - 117s - 367ms/step - dense_1_loss: 0.0920 - dense_3_loss: 0.1871 - dense_5_loss: 0.1720 - loss: 0.7874 - parsing_head_loss: 0.1566 - learning_rate: 1.0809e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.6442 - dev_Lemmas: 91.2685 - dev_UAS: 82.9772 - dev_LAS: 76.3551 | |
| Epoch 107/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.0896 - dense_3_loss: 0.1819 - dense_5_loss: 0.1674 - loss: 0.7668 - parsing_head_loss: 0.1535 - learning_rate: 9.3436e-07 - dev_UPOS: 96.8816 - dev_UFeats: 92.6534 - dev_Lemmas: 91.2685 - dev_UAS: 82.9863 - dev_LAS: 76.3551 | |
| Epoch 108/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0919 - dense_3_loss: 0.1867 - dense_5_loss: 0.1718 - loss: 0.7850 - parsing_head_loss: 0.1558 - learning_rate: 7.9801e-07 - dev_UPOS: 96.8633 - dev_UFeats: 92.6534 - dev_Lemmas: 91.3143 - dev_UAS: 83.0047 - dev_LAS: 76.3918 | |
| Epoch 109/120 | |
| 319/319 - 117s - 367ms/step - dense_1_loss: 0.0925 - dense_3_loss: 0.1879 - dense_5_loss: 0.1728 - loss: 0.7907 - parsing_head_loss: 0.1576 - learning_rate: 6.7200e-07 - dev_UPOS: 96.8633 - dev_UFeats: 92.6167 - dev_Lemmas: 91.2685 - dev_UAS: 82.9772 - dev_LAS: 76.3368 | |
| Epoch 110/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0914 - dense_3_loss: 0.1859 - dense_5_loss: 0.1708 - loss: 0.7818 - parsing_head_loss: 0.1556 - learning_rate: 5.5647e-07 - dev_UPOS: 96.8816 - dev_UFeats: 92.5892 - dev_Lemmas: 91.2501 - dev_UAS: 82.9863 - dev_LAS: 76.3643 | |
| Epoch 111/120 | |
| 319/319 - 118s - 371ms/step - dense_1_loss: 0.0912 - dense_3_loss: 0.1860 - dense_5_loss: 0.1704 - loss: 0.7807 - parsing_head_loss: 0.1554 - learning_rate: 4.5154e-07 - dev_UPOS: 96.8724 - dev_UFeats: 92.6717 - dev_Lemmas: 91.2685 - dev_UAS: 83.0414 - dev_LAS: 76.4010 | |
| Epoch 112/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.0903 - dense_3_loss: 0.1832 - dense_5_loss: 0.1688 - loss: 0.7721 - parsing_head_loss: 0.1538 - learning_rate: 3.5734e-07 - dev_UPOS: 96.8724 - dev_UFeats: 92.6534 - dev_Lemmas: 91.2409 - dev_UAS: 83.0505 - dev_LAS: 76.3918 | |
| Epoch 113/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0908 - dense_3_loss: 0.1843 - dense_5_loss: 0.1694 - loss: 0.7747 - parsing_head_loss: 0.1537 - learning_rate: 2.7398e-07 - dev_UPOS: 96.8724 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 83.0230 - dev_LAS: 76.3735 | |
| Epoch 114/120 | |
| 319/319 - 117s - 368ms/step - dense_1_loss: 0.0922 - dense_3_loss: 0.1875 - dense_5_loss: 0.1721 - loss: 0.7869 - parsing_head_loss: 0.1569 - learning_rate: 2.0153e-07 - dev_UPOS: 96.8816 - dev_UFeats: 92.6534 - dev_Lemmas: 91.2868 - dev_UAS: 83.0505 - dev_LAS: 76.3826 | |
| Epoch 115/120 | |
| 319/319 - 119s - 372ms/step - dense_1_loss: 0.0904 - dense_3_loss: 0.1836 - dense_5_loss: 0.1691 - loss: 0.7736 - parsing_head_loss: 0.1540 - learning_rate: 1.4010e-07 - dev_UPOS: 96.8816 - dev_UFeats: 92.6626 - dev_Lemmas: 91.2868 - dev_UAS: 83.0230 - dev_LAS: 76.3735 | |
| Epoch 116/120 | |
| 319/319 - 118s - 369ms/step - dense_1_loss: 0.0914 - dense_3_loss: 0.1856 - dense_5_loss: 0.1708 - loss: 0.7800 - parsing_head_loss: 0.1554 - learning_rate: 8.9738e-08 - dev_UPOS: 96.8633 - dev_UFeats: 92.6626 - dev_Lemmas: 91.2776 - dev_UAS: 82.9772 - dev_LAS: 76.3460 | |
| Epoch 117/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.0909 - dense_3_loss: 0.1848 - dense_5_loss: 0.1697 - loss: 0.7763 - parsing_head_loss: 0.1545 - learning_rate: 5.0511e-08 - dev_UPOS: 96.8633 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 83.0138 - dev_LAS: 76.3551 | |
| Epoch 118/120 | |
| 319/319 - 117s - 368ms/step - dense_1_loss: 0.0918 - dense_3_loss: 0.1864 - dense_5_loss: 0.1715 - loss: 0.7834 - parsing_head_loss: 0.1561 - learning_rate: 2.2460e-08 - dev_UPOS: 96.8816 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 83.0047 - dev_LAS: 76.3643 | |
| Epoch 119/120 | |
| 319/319 - 118s - 370ms/step - dense_1_loss: 0.0910 - dense_3_loss: 0.1845 - dense_5_loss: 0.1698 - loss: 0.7767 - parsing_head_loss: 0.1546 - learning_rate: 5.6165e-09 - dev_UPOS: 96.8816 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 82.9955 - dev_LAS: 76.3643 | |
| Epoch 120/120 | |
| 319/319 - 123s - 385ms/step - dense_1_loss: 0.0898 - dense_3_loss: 0.1824 - dense_5_loss: 0.1676 - loss: 0.7677 - parsing_head_loss: 0.1526 - learning_rate: 0.0000e+00 - dev_UPOS: 96.8816 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 82.9955 - dev_LAS: 76.3643 - test_UPOS: 97.1577 - test_UFeats: 93.5661 - test_Lemmas: 90.6416 - test_UAS: 83.7141 - test_LAS: 77.1614 | |
| Traceback (most recent call last): | |
| File "/gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/latinpipe_evalatin24.py", line 935, in <module> | |
| main([] if "__file__" not in globals() else None) | |
| File "/gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/latinpipe_evalatin24.py", line 819, in main | |
| with open(os.path.join(os.path.dirname(args.load[0]), "options.json"), mode="r") as options_file: | |
| ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ | |
| FileNotFoundError: [Errno 2] No such file or directory: '/home/hd/hd_hd/hd_ec199/evalatin2024-latinpipe/latinpipe-evalatin/options.json' | |