Training in progress, step 232
Browse files- adapter_model.safetensors +1 -1
- debug.log +21 -1
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 456206152
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b701fff68588bd76be303513e7423a03a1ce46487432370438e5a23f59bbc4e6
|
| 3 |
size 456206152
|
debug.log
CHANGED
|
@@ -840,4 +840,24 @@ trainable params: 114,032,640 || all params: 12,361,835,520 || trainable%: 0.922
|
|
| 840 |
|
| 841 |
[2025-10-07 18:44:30,660] [INFO] [axolotl.core.trainers.base._save:671] [PID:8314] Saving model checkpoint to ckpts-mmarv/checkpoint-216
|
| 842 |
|
| 843 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 217/232 [6:55:11<42:40, 170.68s/it]
|
| 844 |
|
| 845 |
-
|
| 846 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 217/232 [6:55:11<42:40, 170.68s/it]
|
|
|
|
| 847 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 217/232 [6:55:11<42:40, 170.68s/it]
|
| 848 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 218/232 [6:56:57<35:18, 151.30s/it]
|
| 849 |
|
|
|
|
| 850 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 218/232 [6:56:57<35:18, 151.30s/it]
|
| 851 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 219/232 [6:58:42<29:47, 137.53s/it]
|
| 852 |
|
|
|
|
| 853 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 219/232 [6:58:42<29:47, 137.53s/it]
|
| 854 |
95%|ββββββββββββββββββββββββββββββββββββββββββ | 220/232 [7:00:28<25:35, 127.94s/it]
|
| 855 |
|
|
|
|
| 856 |
95%|ββββββββββββββββββββββββββββββββββββββββββ | 220/232 [7:00:28<25:35, 127.94s/it]
|
| 857 |
95%|ββββββββββββββββββββββββββββββββββββββββββ | 221/232 [7:02:12<22:10, 120.97s/it]
|
| 858 |
|
|
|
|
| 859 |
95%|ββββββββββββββββββββββββββββββββββββββββββ | 221/232 [7:02:12<22:10, 120.97s/it]
|
| 860 |
96%|ββββββββββββββββββββββββββββββββββββββββββ | 222/232 [7:03:58<19:22, 116.23s/it]
|
| 861 |
|
|
|
|
| 862 |
96%|ββββββββββββββββββββββββββββββββββββββββββ | 222/232 [7:03:58<19:22, 116.23s/it]
|
| 863 |
96%|βββββββββββββββββββββββββββββββββββββββββββ | 223/232 [7:05:42<16:54, 112.77s/it]
|
| 864 |
|
|
|
|
| 865 |
96%|βββββββββββββββββοΏ½οΏ½οΏ½βββββββββββββββββββββββββ | 223/232 [7:05:42<16:54, 112.77s/it]
|
| 866 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 224/232 [7:07:28<14:44, 110.54s/it]
|
| 867 |
|
|
|
|
| 868 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 224/232 [7:07:28<14:44, 110.54s/it]
|
| 869 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 225/232 [7:09:13<12:42, 108.97s/it]
|
| 870 |
|
|
|
|
| 871 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 225/232 [7:09:13<12:42, 108.97s/it]
|
| 872 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 226/232 [7:10:58<10:45, 107.67s/it]
|
| 873 |
|
|
|
|
| 874 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 226/232 [7:10:58<10:45, 107.67s/it]
|
| 875 |
98%|βββββββββββββββββββββββββββββββββββββββββββ | 227/232 [7:12:43<08:54, 106.96s/it]
|
| 876 |
|
|
|
|
| 877 |
98%|βββββββββββββββββββββββββββββββββββββββββββ | 227/232 [7:12:43<08:54, 106.96s/it]
|
| 878 |
98%|ββββββββββββββββββββββββββββββββββββββββββββ| 228/232 [7:14:28<07:05, 106.44s/it]
|
| 879 |
|
|
|
|
| 880 |
98%|ββββββββββββββββββββββββββββββββββββββββββββ| 228/232 [7:14:28<07:05, 106.44s/it]
|
| 881 |
99%|ββββββββββββββββββββββββββββββββββββββββββββ| 229/232 [7:16:13<05:17, 105.91s/it]
|
| 882 |
|
|
|
|
| 883 |
99%|ββββββββββββββββββββββββββββββββββββββββββββ| 229/232 [7:16:13<05:17, 105.91s/it]
|
| 884 |
99%|ββββββββββββββββββββββββββββββββββββββββββββ| 230/232 [7:17:59<03:31, 105.97s/it]
|
| 885 |
|
|
|
|
| 886 |
99%|ββββββββββββββββββββββββββββββββββββββββββββ| 230/232 [7:17:59<03:31, 105.97s/it]
|
| 887 |
|
|
|
|
| 888 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 889 |
|
|
|
|
|
|
| 840 |
|
| 841 |
[2025-10-07 18:44:30,660] [INFO] [axolotl.core.trainers.base._save:671] [PID:8314] Saving model checkpoint to ckpts-mmarv/checkpoint-216
|
| 842 |
|
| 843 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 217/232 [6:55:11<42:40, 170.68s/it]
|
| 844 |
|
|
|
|
| 845 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 217/232 [6:55:11<42:40, 170.68s/it]
|
| 846 |
+
|
| 847 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 217/232 [6:55:11<42:40, 170.68s/it]
|
| 848 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 218/232 [6:56:57<35:18, 151.30s/it]
|
| 849 |
|
| 850 |
+
|
| 851 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 218/232 [6:56:57<35:18, 151.30s/it]
|
| 852 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 219/232 [6:58:42<29:47, 137.53s/it]
|
| 853 |
|
| 854 |
+
|
| 855 |
94%|ββββββββββββββββββββββββββββββββββββββββββ | 219/232 [6:58:42<29:47, 137.53s/it]
|
| 856 |
95%|ββββββββββββββββββββββββββββββββββββββββββ | 220/232 [7:00:28<25:35, 127.94s/it]
|
| 857 |
|
| 858 |
+
|
| 859 |
95%|ββββββββββββββββββββββββββββββββββββββββββ | 220/232 [7:00:28<25:35, 127.94s/it]
|
| 860 |
95%|ββββββββββββββββββββββββββββββββββββββββββ | 221/232 [7:02:12<22:10, 120.97s/it]
|
| 861 |
|
| 862 |
+
|
| 863 |
95%|ββββββββββββββββββββββββββββββββββββββββββ | 221/232 [7:02:12<22:10, 120.97s/it]
|
| 864 |
96%|ββββββββββββββββββββββββββββββββββββββββββ | 222/232 [7:03:58<19:22, 116.23s/it]
|
| 865 |
|
| 866 |
+
|
| 867 |
96%|ββββββββββββββββββββββββββββββββββββββββββ | 222/232 [7:03:58<19:22, 116.23s/it]
|
| 868 |
96%|βββββββββββββββββββββββββββββββββββββββββββ | 223/232 [7:05:42<16:54, 112.77s/it]
|
| 869 |
|
| 870 |
+
|
| 871 |
96%|βββββββββββββββββοΏ½οΏ½οΏ½βββββββββββββββββββββββββ | 223/232 [7:05:42<16:54, 112.77s/it]
|
| 872 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 224/232 [7:07:28<14:44, 110.54s/it]
|
| 873 |
|
| 874 |
+
|
| 875 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 224/232 [7:07:28<14:44, 110.54s/it]
|
| 876 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 225/232 [7:09:13<12:42, 108.97s/it]
|
| 877 |
|
| 878 |
+
|
| 879 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 225/232 [7:09:13<12:42, 108.97s/it]
|
| 880 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 226/232 [7:10:58<10:45, 107.67s/it]
|
| 881 |
|
| 882 |
+
|
| 883 |
97%|βββββββββββββββββββββββββββββββββββββββββββ | 226/232 [7:10:58<10:45, 107.67s/it]
|
| 884 |
98%|βββββββββββββββββββββββββββββββββββββββββββ | 227/232 [7:12:43<08:54, 106.96s/it]
|
| 885 |
|
| 886 |
+
|
| 887 |
98%|βββββββββββββββββββββββββββββββββββββββββββ | 227/232 [7:12:43<08:54, 106.96s/it]
|
| 888 |
98%|ββββββββββββββββββββββββββββββββββββββββββββ| 228/232 [7:14:28<07:05, 106.44s/it]
|
| 889 |
|
| 890 |
+
|
| 891 |
98%|ββββββββββββββββββββββββββββββββββββββββββββ| 228/232 [7:14:28<07:05, 106.44s/it]
|
| 892 |
99%|ββββββββββββββββββββββββββββββββββββββββββββ| 229/232 [7:16:13<05:17, 105.91s/it]
|
| 893 |
|
| 894 |
+
|
| 895 |
99%|ββββββββββββββββββββββββββββββββββββββββββββ| 229/232 [7:16:13<05:17, 105.91s/it]
|
| 896 |
99%|ββββββββββββββββββββββββββββββββββββββββββββ| 230/232 [7:17:59<03:31, 105.97s/it]
|
| 897 |
|
| 898 |
+
|
| 899 |
99%|ββββββββββββββββββββββββββββββββββββββββββββ| 230/232 [7:17:59<03:31, 105.97s/it]
|
| 900 |
|
| 901 |
+
|
| 902 |
|
| 903 |
+
|
| 904 |
+
warnings.warn(
|
| 905 |
+
|
| 906 |
+
[2025-10-07 19:12:57,756] [INFO] [axolotl.core.trainers.base._save:671] [PID:8314] Saving model checkpoint to ckpts-mmarv/checkpoint-232
|
| 907 |
+
|
| 908 |
|
| 909 |
+
|