Upload training.log with huggingface_hub
Browse files- training.log +226 -0
training.log
CHANGED
|
@@ -696,3 +696,229 @@
|
|
| 696 |
[22:52:22] step= 55700 | loss=3.2295 | acc30=0.085 | lr=1.00e-08 | 3.00h
|
| 697 |
[22:52:24] --- CHECKPOINT (hora 3.0) ---
|
| 698 |
[22:52:24] Checkpoint salvo: checkpoint_step00055712.pt (59.0 MB)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 696 |
[22:52:22] step= 55700 | loss=3.2295 | acc30=0.085 | lr=1.00e-08 | 3.00h
|
| 697 |
[22:52:24] --- CHECKPOINT (hora 3.0) ---
|
| 698 |
[22:52:24] Checkpoint salvo: checkpoint_step00055712.pt (59.0 MB)
|
| 699 |
+
[22:52:30] ☁ Upload HuggingFace OK: step=55712
|
| 700 |
+
[22:52:41] step= 55800 | loss=2.9909 | acc30=0.156 | lr=1.00e-08 | 3.00h
|
| 701 |
+
[22:52:59] step= 55900 | loss=2.0742 | acc30=0.397 | lr=1.00e-08 | 3.01h
|
| 702 |
+
[22:53:16] step= 56000 | loss=4.4831 | acc30=0.021 | lr=1.00e-08 | 3.01h
|
| 703 |
+
[22:53:16] Validando...
|
| 704 |
+
[22:53:32] VAL: loss=2.3540 acc30=0.200 acc60=0.271 acc120=0.337
|
| 705 |
+
[22:53:50] step= 56100 | loss=2.3610 | acc30=0.193 | lr=1.00e-08 | 3.02h
|
| 706 |
+
[22:54:09] step= 56200 | loss=2.2089 | acc30=0.252 | lr=1.00e-08 | 3.03h
|
| 707 |
+
[22:54:26] step= 56300 | loss=2.1536 | acc30=0.295 | lr=1.00e-08 | 3.03h
|
| 708 |
+
[22:54:44] step= 56400 | loss=2.2717 | acc30=0.228 | lr=1.00e-08 | 3.04h
|
| 709 |
+
[22:55:02] step= 56500 | loss=2.2863 | acc30=0.217 | lr=1.00e-08 | 3.04h
|
| 710 |
+
[22:55:20] step= 56600 | loss=2.3772 | acc30=0.219 | lr=1.00e-08 | 3.05h
|
| 711 |
+
[22:55:37] step= 56700 | loss=2.7942 | acc30=0.112 | lr=1.00e-08 | 3.05h
|
| 712 |
+
[22:55:55] step= 56800 | loss=2.2847 | acc30=0.240 | lr=1.00e-08 | 3.06h
|
| 713 |
+
[22:56:13] step= 56900 | loss=2.2913 | acc30=0.220 | lr=1.00e-08 | 3.06h
|
| 714 |
+
[22:56:32] step= 57000 | loss=2.3060 | acc30=0.236 | lr=1.00e-08 | 3.07h
|
| 715 |
+
[22:56:32] Validando...
|
| 716 |
+
[22:56:48] VAL: loss=2.3539 acc30=0.200 acc60=0.271 acc120=0.337
|
| 717 |
+
[22:57:05] step= 57100 | loss=2.1354 | acc30=0.314 | lr=1.00e-08 | 3.08h
|
| 718 |
+
[22:57:23] step= 57200 | loss=2.1181 | acc30=0.340 | lr=1.00e-08 | 3.08h
|
| 719 |
+
[22:57:41] step= 57300 | loss=2.4983 | acc30=0.205 | lr=1.00e-08 | 3.09h
|
| 720 |
+
[22:57:59] step= 57400 | loss=2.5378 | acc30=0.175 | lr=1.00e-08 | 3.09h
|
| 721 |
+
[22:58:17] step= 57500 | loss=2.1528 | acc30=0.309 | lr=1.00e-08 | 3.10h
|
| 722 |
+
[22:58:35] step= 57600 | loss=2.2481 | acc30=0.233 | lr=1.00e-08 | 3.10h
|
| 723 |
+
[22:58:53] step= 57700 | loss=2.0927 | acc30=0.351 | lr=1.00e-08 | 3.11h
|
| 724 |
+
[22:59:11] step= 57800 | loss=2.1765 | acc30=0.330 | lr=1.00e-08 | 3.11h
|
| 725 |
+
[22:59:28] step= 57900 | loss=2.4018 | acc30=0.187 | lr=1.00e-08 | 3.12h
|
| 726 |
+
[22:59:46] step= 58000 | loss=2.1278 | acc30=0.337 | lr=1.00e-08 | 3.12h
|
| 727 |
+
[22:59:46] Validando...
|
| 728 |
+
[23:00:02] VAL: loss=2.3539 acc30=0.200 acc60=0.272 acc120=0.337
|
| 729 |
+
[23:00:20] step= 58100 | loss=2.3080 | acc30=0.236 | lr=1.00e-08 | 3.13h
|
| 730 |
+
[23:00:39] step= 58200 | loss=2.1964 | acc30=0.266 | lr=1.00e-08 | 3.14h
|
| 731 |
+
[23:00:56] step= 58300 | loss=2.6340 | acc30=0.120 | lr=1.00e-08 | 3.14h
|
| 732 |
+
[23:01:14] step= 58400 | loss=2.2567 | acc30=0.289 | lr=1.00e-08 | 3.15h
|
| 733 |
+
[23:01:32] step= 58500 | loss=2.1296 | acc30=0.329 | lr=1.00e-08 | 3.15h
|
| 734 |
+
[23:01:50] step= 58600 | loss=2.2153 | acc30=0.287 | lr=1.00e-08 | 3.16h
|
| 735 |
+
[23:02:07] step= 58700 | loss=2.7896 | acc30=0.087 | lr=1.00e-08 | 3.16h
|
| 736 |
+
[23:02:25] step= 58800 | loss=3.7694 | acc30=0.030 | lr=1.00e-08 | 3.17h
|
| 737 |
+
[23:02:43] step= 58900 | loss=2.9895 | acc30=0.172 | lr=1.00e-08 | 3.17h
|
| 738 |
+
[23:03:01] step= 59000 | loss=2.1703 | acc30=0.292 | lr=1.00e-08 | 3.18h
|
| 739 |
+
[23:03:01] Validando...
|
| 740 |
+
[23:03:17] VAL: loss=2.3538 acc30=0.200 acc60=0.272 acc120=0.337
|
| 741 |
+
[23:03:34] step= 59100 | loss=2.2143 | acc30=0.257 | lr=1.00e-08 | 3.19h
|
| 742 |
+
[23:03:52] step= 59200 | loss=2.1340 | acc30=0.316 | lr=1.00e-08 | 3.19h
|
| 743 |
+
[23:04:10] step= 59300 | loss=2.6779 | acc30=0.212 | lr=1.00e-08 | 3.20h
|
| 744 |
+
[23:04:28] step= 59400 | loss=2.7009 | acc30=0.130 | lr=1.00e-08 | 3.20h
|
| 745 |
+
[23:04:45] step= 59500 | loss=2.1256 | acc30=0.322 | lr=1.00e-08 | 3.21h
|
| 746 |
+
[23:05:03] step= 59600 | loss=2.2170 | acc30=0.258 | lr=1.00e-08 | 3.21h
|
| 747 |
+
[23:05:21] step= 59700 | loss=2.2213 | acc30=0.241 | lr=1.00e-08 | 3.22h
|
| 748 |
+
[23:05:39] step= 59800 | loss=2.2089 | acc30=0.236 | lr=1.00e-08 | 3.22h
|
| 749 |
+
[23:05:56] step= 59900 | loss=2.2164 | acc30=0.245 | lr=1.00e-08 | 3.23h
|
| 750 |
+
[23:06:14] step= 60000 | loss=2.3375 | acc30=0.191 | lr=1.00e-08 | 3.23h
|
| 751 |
+
[23:06:14] Validando...
|
| 752 |
+
[23:06:30] VAL: loss=2.3538 acc30=0.200 acc60=0.272 acc120=0.337
|
| 753 |
+
[23:06:48] step= 60100 | loss=2.2735 | acc30=0.224 | lr=1.00e-08 | 3.24h
|
| 754 |
+
[23:07:06] step= 60200 | loss=2.3135 | acc30=0.207 | lr=1.00e-08 | 3.25h
|
| 755 |
+
[23:07:23] step= 60300 | loss=2.2916 | acc30=0.198 | lr=1.00e-08 | 3.25h
|
| 756 |
+
[23:07:41] step= 60400 | loss=2.4599 | acc30=0.157 | lr=1.00e-08 | 3.25h
|
| 757 |
+
[23:07:59] step= 60500 | loss=2.1560 | acc30=0.288 | lr=1.00e-08 | 3.26h
|
| 758 |
+
[23:08:17] step= 60600 | loss=2.2581 | acc30=0.231 | lr=1.00e-08 | 3.26h
|
| 759 |
+
[23:08:34] step= 60700 | loss=3.3693 | acc30=0.065 | lr=1.00e-08 | 3.27h
|
| 760 |
+
[23:08:52] step= 60800 | loss=3.0105 | acc30=0.100 | lr=1.00e-08 | 3.27h
|
| 761 |
+
[23:09:10] step= 60900 | loss=3.0241 | acc30=0.099 | lr=1.00e-08 | 3.28h
|
| 762 |
+
[23:09:28] step= 61000 | loss=2.2564 | acc30=0.238 | lr=1.00e-08 | 3.28h
|
| 763 |
+
[23:09:28] Validando...
|
| 764 |
+
[23:09:45] VAL: loss=2.3538 acc30=0.200 acc60=0.272 acc120=0.337
|
| 765 |
+
[23:10:02] step= 61100 | loss=2.3111 | acc30=0.218 | lr=1.00e-08 | 3.29h
|
| 766 |
+
[23:10:21] step= 61200 | loss=2.4487 | acc30=0.179 | lr=1.00e-08 | 3.30h
|
| 767 |
+
[23:10:38] step= 61300 | loss=2.3120 | acc30=0.238 | lr=1.00e-08 | 3.30h
|
| 768 |
+
[23:10:56] step= 61400 | loss=2.4051 | acc30=0.170 | lr=1.00e-08 | 3.31h
|
| 769 |
+
[23:11:13] step= 61500 | loss=3.0412 | acc30=0.076 | lr=1.00e-08 | 3.31h
|
| 770 |
+
[23:11:31] step= 61600 | loss=2.7332 | acc30=0.240 | lr=1.00e-08 | 3.32h
|
| 771 |
+
[23:11:49] step= 61700 | loss=2.1831 | acc30=0.332 | lr=1.00e-08 | 3.32h
|
| 772 |
+
[23:12:06] step= 61800 | loss=3.4265 | acc30=0.042 | lr=1.00e-08 | 3.33h
|
| 773 |
+
[23:12:24] step= 61900 | loss=2.3512 | acc30=0.215 | lr=1.00e-08 | 3.33h
|
| 774 |
+
[23:12:42] step= 62000 | loss=2.1792 | acc30=0.278 | lr=1.00e-08 | 3.34h
|
| 775 |
+
[23:12:42] Validando...
|
| 776 |
+
[23:12:58] VAL: loss=2.3537 acc30=0.200 acc60=0.272 acc120=0.337
|
| 777 |
+
[23:13:16] step= 62100 | loss=2.1671 | acc30=0.287 | lr=1.00e-08 | 3.35h
|
| 778 |
+
[23:13:34] step= 62200 | loss=2.3053 | acc30=0.227 | lr=1.00e-08 | 3.35h
|
| 779 |
+
[23:13:51] step= 62300 | loss=2.3611 | acc30=0.173 | lr=1.00e-08 | 3.36h
|
| 780 |
+
[23:14:09] step= 62400 | loss=2.3613 | acc30=0.177 | lr=1.00e-08 | 3.36h
|
| 781 |
+
[23:14:27] step= 62500 | loss=2.4613 | acc30=0.174 | lr=1.00e-08 | 3.37h
|
| 782 |
+
[23:14:44] step= 62600 | loss=4.4345 | acc30=0.010 | lr=1.00e-08 | 3.37h
|
| 783 |
+
[23:15:02] step= 62700 | loss=4.4721 | acc30=0.015 | lr=1.00e-08 | 3.38h
|
| 784 |
+
[23:15:20] step= 62800 | loss=3.6790 | acc30=0.094 | lr=1.00e-08 | 3.38h
|
| 785 |
+
[23:15:38] step= 62900 | loss=2.3705 | acc30=0.193 | lr=1.00e-08 | 3.39h
|
| 786 |
+
[23:15:56] step= 63000 | loss=2.2634 | acc30=0.232 | lr=1.00e-08 | 3.39h
|
| 787 |
+
[23:15:56] Validando...
|
| 788 |
+
[23:16:12] VAL: loss=2.3537 acc30=0.200 acc60=0.272 acc120=0.337
|
| 789 |
+
[23:16:30] step= 63100 | loss=3.0016 | acc30=0.080 | lr=1.00e-08 | 3.40h
|
| 790 |
+
[23:16:48] step= 63200 | loss=2.8213 | acc30=0.117 | lr=1.00e-08 | 3.41h
|
| 791 |
+
[23:17:06] step= 63300 | loss=2.8651 | acc30=0.109 | lr=1.00e-08 | 3.41h
|
| 792 |
+
[23:17:23] step= 63400 | loss=3.2287 | acc30=0.056 | lr=1.00e-08 | 3.42h
|
| 793 |
+
[23:17:41] step= 63500 | loss=3.1651 | acc30=0.067 | lr=1.00e-08 | 3.42h
|
| 794 |
+
[23:17:59] step= 63600 | loss=2.7781 | acc30=0.135 | lr=1.00e-08 | 3.43h
|
| 795 |
+
[23:18:17] step= 63700 | loss=2.1250 | acc30=0.324 | lr=1.00e-08 | 3.43h
|
| 796 |
+
[23:18:34] step= 63800 | loss=2.0288 | acc30=0.431 | lr=1.00e-08 | 3.44h
|
| 797 |
+
[23:18:52] step= 63900 | loss=2.1862 | acc30=0.270 | lr=1.00e-08 | 3.44h
|
| 798 |
+
[23:19:10] step= 64000 | loss=2.2578 | acc30=0.231 | lr=1.00e-08 | 3.45h
|
| 799 |
+
[23:19:10] Validando...
|
| 800 |
+
[23:19:26] VAL: loss=2.3537 acc30=0.200 acc60=0.272 acc120=0.337
|
| 801 |
+
[23:19:44] step= 64100 | loss=2.3196 | acc30=0.198 | lr=1.00e-08 | 3.46h
|
| 802 |
+
[23:20:02] step= 64200 | loss=4.4721 | acc30=0.013 | lr=1.00e-08 | 3.46h
|
| 803 |
+
[23:20:20] step= 64300 | loss=2.8901 | acc30=0.198 | lr=1.00e-08 | 3.47h
|
| 804 |
+
[23:20:38] step= 64400 | loss=2.4126 | acc30=0.220 | lr=1.00e-08 | 3.47h
|
| 805 |
+
[23:20:55] step= 64500 | loss=2.6992 | acc30=0.112 | lr=1.00e-08 | 3.48h
|
| 806 |
+
[23:21:13] step= 64600 | loss=2.3838 | acc30=0.185 | lr=1.00e-08 | 3.48h
|
| 807 |
+
[23:21:31] step= 64700 | loss=2.2339 | acc30=0.240 | lr=1.00e-08 | 3.49h
|
| 808 |
+
[23:21:49] step= 64800 | loss=2.2322 | acc30=0.269 | lr=1.00e-08 | 3.49h
|
| 809 |
+
[23:22:06] step= 64900 | loss=3.3390 | acc30=0.049 | lr=1.00e-08 | 3.50h
|
| 810 |
+
[23:22:24] step= 65000 | loss=2.1824 | acc30=0.264 | lr=1.00e-08 | 3.50h
|
| 811 |
+
[23:22:24] Validando...
|
| 812 |
+
[23:22:40] VAL: loss=2.3537 acc30=0.200 acc60=0.272 acc120=0.337
|
| 813 |
+
[23:22:58] step= 65100 | loss=3.3295 | acc30=0.125 | lr=1.00e-08 | 3.51h
|
| 814 |
+
[23:23:16] step= 65200 | loss=3.2426 | acc30=0.109 | lr=1.00e-08 | 3.51h
|
| 815 |
+
[23:23:33] step= 65300 | loss=2.1343 | acc30=0.327 | lr=1.00e-08 | 3.52h
|
| 816 |
+
[23:23:51] step= 65400 | loss=2.1204 | acc30=0.321 | lr=1.00e-08 | 3.52h
|
| 817 |
+
[23:24:09] step= 65500 | loss=2.1203 | acc30=0.327 | lr=1.00e-08 | 3.53h
|
| 818 |
+
[23:24:27] step= 65600 | loss=2.1497 | acc30=0.328 | lr=1.00e-08 | 3.53h
|
| 819 |
+
[23:24:44] step= 65700 | loss=2.4327 | acc30=0.167 | lr=1.00e-08 | 3.54h
|
| 820 |
+
[23:25:02] step= 65800 | loss=2.3122 | acc30=0.192 | lr=1.00e-08 | 3.54h
|
| 821 |
+
[23:25:20] step= 65900 | loss=2.3411 | acc30=0.199 | lr=1.00e-08 | 3.55h
|
| 822 |
+
[23:25:38] step= 66000 | loss=2.2726 | acc30=0.223 | lr=1.00e-08 | 3.55h
|
| 823 |
+
[23:25:38] Validando...
|
| 824 |
+
[23:25:54] VAL: loss=2.3537 acc30=0.200 acc60=0.271 acc120=0.337
|
| 825 |
+
[23:26:11] step= 66100 | loss=2.2644 | acc30=0.233 | lr=1.00e-08 | 3.56h
|
| 826 |
+
[23:26:29] step= 66200 | loss=2.2908 | acc30=0.229 | lr=1.00e-08 | 3.57h
|
| 827 |
+
[23:26:47] step= 66300 | loss=2.2408 | acc30=0.236 | lr=1.00e-08 | 3.57h
|
| 828 |
+
[23:27:05] step= 66400 | loss=2.5139 | acc30=0.150 | lr=1.00e-08 | 3.58h
|
| 829 |
+
[23:27:22] step= 66500 | loss=3.2218 | acc30=0.058 | lr=1.00e-08 | 3.58h
|
| 830 |
+
[23:27:40] step= 66600 | loss=2.7375 | acc30=0.116 | lr=1.00e-08 | 3.59h
|
| 831 |
+
[23:27:58] step= 66700 | loss=2.4877 | acc30=0.176 | lr=1.00e-08 | 3.59h
|
| 832 |
+
[23:28:16] step= 66800 | loss=2.2405 | acc30=0.242 | lr=1.00e-08 | 3.60h
|
| 833 |
+
[23:28:34] step= 66900 | loss=2.2588 | acc30=0.224 | lr=1.00e-08 | 3.60h
|
| 834 |
+
[23:28:52] step= 67000 | loss=3.2053 | acc30=0.065 | lr=1.00e-08 | 3.61h
|
| 835 |
+
[23:28:52] Validando...
|
| 836 |
+
[23:29:08] VAL: loss=2.3536 acc30=0.200 acc60=0.271 acc120=0.337
|
| 837 |
+
[23:29:26] step= 67100 | loss=2.3031 | acc30=0.225 | lr=1.00e-08 | 3.62h
|
| 838 |
+
[23:29:44] step= 67200 | loss=2.4148 | acc30=0.193 | lr=1.00e-08 | 3.62h
|
| 839 |
+
[23:30:01] step= 67300 | loss=3.9936 | acc30=0.025 | lr=1.00e-08 | 3.63h
|
| 840 |
+
[23:30:19] step= 67400 | loss=2.4836 | acc30=0.275 | lr=1.00e-08 | 3.63h
|
| 841 |
+
[23:30:37] step= 67500 | loss=2.1016 | acc30=0.357 | lr=1.00e-08 | 3.64h
|
| 842 |
+
[23:30:55] step= 67600 | loss=2.0761 | acc30=0.367 | lr=1.00e-08 | 3.64h
|
| 843 |
+
[23:31:12] step= 67700 | loss=2.6893 | acc30=0.105 | lr=1.00e-08 | 3.65h
|
| 844 |
+
[23:31:30] step= 67800 | loss=2.6904 | acc30=0.102 | lr=1.00e-08 | 3.65h
|
| 845 |
+
[23:31:48] step= 67900 | loss=2.5381 | acc30=0.190 | lr=1.00e-08 | 3.66h
|
| 846 |
+
[23:32:06] step= 68000 | loss=2.1795 | acc30=0.286 | lr=1.00e-08 | 3.66h
|
| 847 |
+
[23:32:06] Validando...
|
| 848 |
+
[23:32:22] VAL: loss=2.3536 acc30=0.200 acc60=0.271 acc120=0.337
|
| 849 |
+
[23:32:39] step= 68100 | loss=2.1938 | acc30=0.250 | lr=1.00e-08 | 3.67h
|
| 850 |
+
[23:32:57] step= 68200 | loss=2.1620 | acc30=0.293 | lr=1.00e-08 | 3.68h
|
| 851 |
+
[23:33:15] step= 68300 | loss=2.2143 | acc30=0.268 | lr=1.00e-08 | 3.68h
|
| 852 |
+
[23:33:32] step= 68400 | loss=2.3573 | acc30=0.205 | lr=1.00e-08 | 3.69h
|
| 853 |
+
[23:33:50] step= 68500 | loss=2.3138 | acc30=0.225 | lr=1.00e-08 | 3.69h
|
| 854 |
+
[23:34:08] step= 68600 | loss=3.0000 | acc30=0.101 | lr=1.00e-08 | 3.70h
|
| 855 |
+
[23:34:26] step= 68700 | loss=2.5193 | acc30=0.174 | lr=1.00e-08 | 3.70h
|
| 856 |
+
[23:34:44] step= 68800 | loss=2.2703 | acc30=0.223 | lr=1.00e-08 | 3.71h
|
| 857 |
+
[23:35:01] step= 68900 | loss=2.9359 | acc30=0.099 | lr=1.00e-08 | 3.71h
|
| 858 |
+
[23:35:19] step= 69000 | loss=2.3679 | acc30=0.244 | lr=1.00e-08 | 3.72h
|
| 859 |
+
[23:35:19] Validando...
|
| 860 |
+
[23:35:35] VAL: loss=2.3536 acc30=0.200 acc60=0.271 acc120=0.337
|
| 861 |
+
[23:35:53] step= 69100 | loss=2.1180 | acc30=0.343 | lr=1.00e-08 | 3.72h
|
| 862 |
+
[23:36:11] step= 69200 | loss=2.1652 | acc30=0.282 | lr=1.00e-08 | 3.73h
|
| 863 |
+
[23:36:29] step= 69300 | loss=2.0896 | acc30=0.374 | lr=1.00e-08 | 3.73h
|
| 864 |
+
[23:36:47] step= 69400 | loss=2.0949 | acc30=0.354 | lr=1.00e-08 | 3.74h
|
| 865 |
+
[23:37:04] step= 69500 | loss=2.0962 | acc30=0.342 | lr=1.00e-08 | 3.74h
|
| 866 |
+
[23:37:22] step= 69600 | loss=2.2294 | acc30=0.244 | lr=1.00e-08 | 3.75h
|
| 867 |
+
[23:37:40] step= 69700 | loss=2.1721 | acc30=0.299 | lr=1.00e-08 | 3.75h
|
| 868 |
+
[23:37:58] step= 69800 | loss=2.2693 | acc30=0.260 | lr=1.00e-08 | 3.76h
|
| 869 |
+
[23:38:16] step= 69900 | loss=2.2205 | acc30=0.264 | lr=1.00e-08 | 3.76h
|
| 870 |
+
[23:38:33] step= 70000 | loss=2.1133 | acc30=0.340 | lr=1.00e-08 | 3.77h
|
| 871 |
+
[23:38:33] Validando...
|
| 872 |
+
[23:38:49] VAL: loss=2.3536 acc30=0.200 acc60=0.271 acc120=0.337
|
| 873 |
+
[23:39:07] step= 70100 | loss=3.0523 | acc30=0.096 | lr=1.00e-08 | 3.78h
|
| 874 |
+
[23:39:25] step= 70200 | loss=2.4662 | acc30=0.158 | lr=1.00e-08 | 3.78h
|
| 875 |
+
[23:39:43] step= 70300 | loss=2.2519 | acc30=0.246 | lr=1.00e-08 | 3.79h
|
| 876 |
+
[23:40:00] step= 70400 | loss=2.2048 | acc30=0.266 | lr=1.00e-08 | 3.79h
|
| 877 |
+
[23:40:18] step= 70500 | loss=2.2689 | acc30=0.209 | lr=1.00e-08 | 3.80h
|
| 878 |
+
[23:40:36] step= 70600 | loss=2.4044 | acc30=0.179 | lr=1.00e-08 | 3.80h
|
| 879 |
+
[23:40:54] step= 70700 | loss=2.3477 | acc30=0.224 | lr=1.00e-08 | 3.81h
|
| 880 |
+
[23:41:11] step= 70800 | loss=2.3079 | acc30=0.210 | lr=1.00e-08 | 3.81h
|
| 881 |
+
[23:41:29] step= 70900 | loss=3.2465 | acc30=0.081 | lr=1.00e-08 | 3.82h
|
| 882 |
+
[23:41:47] step= 71000 | loss=2.6231 | acc30=0.124 | lr=1.00e-08 | 3.82h
|
| 883 |
+
[23:41:47] Validando...
|
| 884 |
+
[23:42:03] VAL: loss=2.3536 acc30=0.200 acc60=0.272 acc120=0.337
|
| 885 |
+
[23:42:21] step= 71100 | loss=2.2700 | acc30=0.219 | lr=1.00e-08 | 3.83h
|
| 886 |
+
[23:42:39] step= 71200 | loss=2.3385 | acc30=0.200 | lr=1.00e-08 | 3.84h
|
| 887 |
+
[23:42:57] step= 71300 | loss=2.1661 | acc30=0.308 | lr=1.00e-08 | 3.84h
|
| 888 |
+
[23:43:14] step= 71400 | loss=3.0915 | acc30=0.242 | lr=1.00e-08 | 3.85h
|
| 889 |
+
[23:43:32] step= 71500 | loss=4.0131 | acc30=0.060 | lr=1.00e-08 | 3.85h
|
| 890 |
+
[23:43:49] step= 71600 | loss=2.0627 | acc30=0.388 | lr=1.00e-08 | 3.86h
|
| 891 |
+
[23:44:08] step= 71700 | loss=2.3261 | acc30=0.224 | lr=1.00e-08 | 3.86h
|
| 892 |
+
[23:44:26] step= 71800 | loss=2.2657 | acc30=0.229 | lr=1.00e-08 | 3.87h
|
| 893 |
+
[23:44:44] step= 71900 | loss=2.1852 | acc30=0.283 | lr=1.00e-08 | 3.87h
|
| 894 |
+
[23:45:01] step= 72000 | loss=2.6983 | acc30=0.101 | lr=1.00e-08 | 3.88h
|
| 895 |
+
[23:45:01] Validando...
|
| 896 |
+
[23:45:17] VAL: loss=2.3535 acc30=0.200 acc60=0.271 acc120=0.337
|
| 897 |
+
[23:45:35] step= 72100 | loss=2.3227 | acc30=0.208 | lr=1.00e-08 | 3.89h
|
| 898 |
+
[23:45:53] step= 72200 | loss=2.2166 | acc30=0.267 | lr=1.00e-08 | 3.89h
|
| 899 |
+
[23:46:11] step= 72300 | loss=2.3187 | acc30=0.213 | lr=1.00e-08 | 3.90h
|
| 900 |
+
[23:46:28] step= 72400 | loss=2.0820 | acc30=0.368 | lr=1.00e-08 | 3.90h
|
| 901 |
+
[23:46:46] step= 72500 | loss=2.3422 | acc30=0.217 | lr=1.00e-08 | 3.91h
|
| 902 |
+
[23:47:04] step= 72600 | loss=2.2990 | acc30=0.209 | lr=1.00e-08 | 3.91h
|
| 903 |
+
[23:47:21] step= 72700 | loss=2.4013 | acc30=0.161 | lr=1.00e-08 | 3.92h
|
| 904 |
+
[23:47:39] step= 72800 | loss=2.2030 | acc30=0.266 | lr=1.00e-08 | 3.92h
|
| 905 |
+
[23:47:56] step= 72900 | loss=2.6753 | acc30=0.140 | lr=1.00e-08 | 3.93h
|
| 906 |
+
[23:48:14] step= 73000 | loss=2.8032 | acc30=0.106 | lr=1.00e-08 | 3.93h
|
| 907 |
+
[23:48:14] Validando...
|
| 908 |
+
[23:48:30] VAL: loss=2.3535 acc30=0.200 acc60=0.271 acc120=0.337
|
| 909 |
+
[23:48:48] step= 73100 | loss=2.3250 | acc30=0.204 | lr=1.00e-08 | 3.94h
|
| 910 |
+
[23:49:06] step= 73200 | loss=2.7735 | acc30=0.100 | lr=1.00e-08 | 3.94h
|
| 911 |
+
[23:49:24] step= 73300 | loss=2.7989 | acc30=0.133 | lr=1.00e-08 | 3.95h
|
| 912 |
+
[23:49:41] step= 73400 | loss=3.0874 | acc30=0.105 | lr=1.00e-08 | 3.95h
|
| 913 |
+
[23:49:59] step= 73500 | loss=3.7177 | acc30=0.051 | lr=1.00e-08 | 3.96h
|
| 914 |
+
[23:50:17] step= 73600 | loss=2.1981 | acc30=0.342 | lr=1.00e-08 | 3.96h
|
| 915 |
+
[23:50:34] step= 73700 | loss=2.2466 | acc30=0.264 | lr=1.00e-08 | 3.97h
|
| 916 |
+
[23:50:53] step= 73800 | loss=2.2837 | acc30=0.216 | lr=1.00e-08 | 3.97h
|
| 917 |
+
[23:51:10] step= 73900 | loss=2.3517 | acc30=0.193 | lr=1.00e-08 | 3.98h
|
| 918 |
+
[23:51:28] step= 74000 | loss=2.0779 | acc30=0.374 | lr=1.00e-08 | 3.98h
|
| 919 |
+
[23:51:28] Validando...
|
| 920 |
+
[23:51:44] VAL: loss=2.3535 acc30=0.200 acc60=0.272 acc120=0.337
|
| 921 |
+
[23:52:02] step= 74100 | loss=2.6875 | acc30=0.211 | lr=1.00e-08 | 3.99h
|
| 922 |
+
[23:52:20] step= 74200 | loss=3.2619 | acc30=0.056 | lr=1.00e-08 | 4.00h
|
| 923 |
+
[23:52:25] --- CHECKPOINT (hora 4.0) ---
|
| 924 |
+
[23:52:25] Checkpoint salvo: checkpoint_step00074226.pt (59.0 MB)
|