AeonOmniverse committed on
Commit
8448e02
·
verified ·
1 Parent(s): cfcde16

Training in progress, epoch 1

Browse files
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "Qwen/Qwen2-VL-7B-Instruct",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
@@ -24,8 +24,8 @@
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
- "v_proj",
28
- "q_proj"
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "trainable_token_indices": null,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "HuggingFaceTB/SmolVLM-Instruct",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
 
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
+ "q_proj",
28
+ "v_proj"
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3a9a961167e6590873dbf63089b55a005b5e0615c9e0e4aa182e9b55cd30e85
3
- size 10108960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90f59e2520afbb03db1ad99f02d574bb5a261f690056468180b8190e90cbe79a
3
+ size 10302960
added_tokens.json CHANGED
@@ -1,16 +1,5 @@
1
  {
2
- "<|box_end|>": 151649,
3
- "<|box_start|>": 151648,
4
- "<|endoftext|>": 151643,
5
- "<|im_end|>": 151645,
6
- "<|im_start|>": 151644,
7
- "<|image_pad|>": 151655,
8
- "<|object_ref_end|>": 151647,
9
- "<|object_ref_start|>": 151646,
10
- "<|quad_end|>": 151651,
11
- "<|quad_start|>": 151650,
12
- "<|video_pad|>": 151656,
13
- "<|vision_end|>": 151653,
14
- "<|vision_pad|>": 151654,
15
- "<|vision_start|>": 151652
16
  }
 
1
  {
2
+ "<end_of_utterance>": 49154,
3
+ "<fake_token_around_image>": 49152,
4
+ "<image>": 49153
 
 
 
 
 
 
 
 
 
 
 
5
  }
chat_template.jinja CHANGED
@@ -1,7 +1,2 @@
1
- {% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system
2
- You are a helpful assistant.<|im_end|>
3
- {% endif %}<|im_start|>{{ message['role'] }}
4
- {% if message['content'] is string %}{{ message['content'] }}<|im_end|>
5
- {% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>
6
- {% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant
7
- {% endif %}
 
1
+ <|im_start|>{% for message in messages %}{{message['role'] | capitalize}}{% if message['content'][0]['type'] == 'image' %}{{':'}}{% else %}{{': '}}{% endif %}{% for line in message['content'] %}{% if line['type'] == 'text' %}{{line['text']}}{% elif line['type'] == 'image' %}{{ '<image>' }}{% endif %}{% endfor %}<end_of_utterance>
2
+ {% endfor %}{% if add_generation_prompt %}{{ 'Assistant:' }}{% endif %}
 
 
 
 
 
merges.txt CHANGED
The diff for this file is too large to render. See raw diff
 
runs/Jul29_15-43-44_ai3.ku.io/events.out.tfevents.1753778665.ai3.ku.io.3590973.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e874791c500f7cf69b6f3deb5e07b8ebe13e369fb5b08420e338578bfdc7af8d
3
- size 8603
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01c8f33c47a4fa155f490acf51059ff3c221e47d6a6fe25e505112ae26bda84d
3
+ size 8810
runs/Jul29_16-42-15_ai3.ku.io/events.out.tfevents.1753782195.ai3.ku.io.3592098.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1ec1bc2b5b8fe18ced5f9fd861892bc671363c17cf5d4875c6ff52a4177c4a1
3
+ size 9932
special_tokens_map.json CHANGED
@@ -1,27 +1,49 @@
1
  {
2
  "additional_special_tokens": [
3
- "<|im_start|>",
4
- "<|im_end|>",
5
- "<|object_ref_start|>",
6
- "<|object_ref_end|>",
7
- "<|box_start|>",
8
- "<|box_end|>",
9
- "<|quad_start|>",
10
- "<|quad_end|>",
11
- "<|vision_start|>",
12
- "<|vision_end|>",
13
- "<|vision_pad|>",
14
- "<|image_pad|>",
15
- "<|video_pad|>"
 
 
 
 
 
 
 
 
16
  ],
 
 
 
 
 
 
 
17
  "eos_token": {
18
- "content": "<|im_end|>",
19
  "lstrip": false,
20
  "normalized": false,
21
  "rstrip": false,
22
  "single_word": false
23
  },
24
  "pad_token": {
 
 
 
 
 
 
 
25
  "content": "<|endoftext|>",
26
  "lstrip": false,
27
  "normalized": false,
 
1
  {
2
  "additional_special_tokens": [
3
+ {
4
+ "content": "<fake_token_around_image>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ },
10
+ {
11
+ "content": "<image>",
12
+ "lstrip": false,
13
+ "normalized": false,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ {
18
+ "content": "<end_of_utterance>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
  ],
25
+ "bos_token": {
26
+ "content": "<|im_start|>",
27
+ "lstrip": false,
28
+ "normalized": false,
29
+ "rstrip": false,
30
+ "single_word": false
31
+ },
32
  "eos_token": {
33
+ "content": "<end_of_utterance>",
34
  "lstrip": false,
35
  "normalized": false,
36
  "rstrip": false,
37
  "single_word": false
38
  },
39
  "pad_token": {
40
+ "content": "<|im_end|>",
41
+ "lstrip": false,
42
+ "normalized": false,
43
+ "rstrip": false,
44
+ "single_word": false
45
+ },
46
+ "unk_token": {
47
  "content": "<|endoftext|>",
48
  "lstrip": false,
49
  "normalized": false,
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88a3a6fcb80132f76da8aa40cdc3fccd7e5d8468ef15421f5b0c2715e85217d2
3
- size 11420538
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43cdb6cd62df2c99a15307455f5990a7b579fefbd26c2624cd643bb7f43f4310
3
+ size 3523394
tokenizer_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "add_prefix_space": false,
3
  "added_tokens_decoder": {
4
- "151643": {
5
  "content": "<|endoftext|>",
6
  "lstrip": false,
7
  "normalized": false,
@@ -9,7 +9,7 @@
9
  "single_word": false,
10
  "special": true
11
  },
12
- "151644": {
13
  "content": "<|im_start|>",
14
  "lstrip": false,
15
  "normalized": false,
@@ -17,7 +17,7 @@
17
  "single_word": false,
18
  "special": true
19
  },
20
- "151645": {
21
  "content": "<|im_end|>",
22
  "lstrip": false,
23
  "normalized": false,
@@ -25,88 +25,136 @@
25
  "single_word": false,
26
  "special": true
27
  },
28
- "151646": {
29
- "content": "<|object_ref_start|>",
30
  "lstrip": false,
31
  "normalized": false,
32
  "rstrip": false,
33
  "single_word": false,
34
  "special": true
35
  },
36
- "151647": {
37
- "content": "<|object_ref_end|>",
38
  "lstrip": false,
39
  "normalized": false,
40
  "rstrip": false,
41
  "single_word": false,
42
  "special": true
43
  },
44
- "151648": {
45
- "content": "<|box_start|>",
46
  "lstrip": false,
47
  "normalized": false,
48
  "rstrip": false,
49
  "single_word": false,
50
  "special": true
51
  },
52
- "151649": {
53
- "content": "<|box_end|>",
54
  "lstrip": false,
55
  "normalized": false,
56
  "rstrip": false,
57
  "single_word": false,
58
  "special": true
59
  },
60
- "151650": {
61
- "content": "<|quad_start|>",
62
  "lstrip": false,
63
  "normalized": false,
64
  "rstrip": false,
65
  "single_word": false,
66
  "special": true
67
  },
68
- "151651": {
69
- "content": "<|quad_end|>",
70
  "lstrip": false,
71
  "normalized": false,
72
  "rstrip": false,
73
  "single_word": false,
74
  "special": true
75
  },
76
- "151652": {
77
- "content": "<|vision_start|>",
78
  "lstrip": false,
79
  "normalized": false,
80
  "rstrip": false,
81
  "single_word": false,
82
  "special": true
83
  },
84
- "151653": {
85
- "content": "<|vision_end|>",
86
  "lstrip": false,
87
  "normalized": false,
88
  "rstrip": false,
89
  "single_word": false,
90
  "special": true
91
  },
92
- "151654": {
93
- "content": "<|vision_pad|>",
94
  "lstrip": false,
95
  "normalized": false,
96
  "rstrip": false,
97
  "single_word": false,
98
  "special": true
99
  },
100
- "151655": {
101
- "content": "<|image_pad|>",
102
  "lstrip": false,
103
  "normalized": false,
104
  "rstrip": false,
105
  "single_word": false,
106
  "special": true
107
  },
108
- "151656": {
109
- "content": "<|video_pad|>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
110
  "lstrip": false,
111
  "normalized": false,
112
  "rstrip": false,
@@ -115,29 +163,20 @@
115
  }
116
  },
117
  "additional_special_tokens": [
118
- "<|im_start|>",
119
- "<|im_end|>",
120
- "<|object_ref_start|>",
121
- "<|object_ref_end|>",
122
- "<|box_start|>",
123
- "<|box_end|>",
124
- "<|quad_start|>",
125
- "<|quad_end|>",
126
- "<|vision_start|>",
127
- "<|vision_end|>",
128
- "<|vision_pad|>",
129
- "<|image_pad|>",
130
- "<|video_pad|>"
131
  ],
132
- "bos_token": null,
133
  "clean_up_tokenization_spaces": false,
134
- "eos_token": "<|im_end|>",
135
- "errors": "replace",
136
  "extra_special_tokens": {},
137
- "model_max_length": 32768,
138
- "pad_token": "<|endoftext|>",
139
- "padding_side": "left",
140
- "split_special_tokens": false,
141
- "tokenizer_class": "Qwen2Tokenizer",
142
- "unk_token": null
 
 
143
  }
 
1
  {
2
  "add_prefix_space": false,
3
  "added_tokens_decoder": {
4
+ "0": {
5
  "content": "<|endoftext|>",
6
  "lstrip": false,
7
  "normalized": false,
 
9
  "single_word": false,
10
  "special": true
11
  },
12
+ "1": {
13
  "content": "<|im_start|>",
14
  "lstrip": false,
15
  "normalized": false,
 
17
  "single_word": false,
18
  "special": true
19
  },
20
+ "2": {
21
  "content": "<|im_end|>",
22
  "lstrip": false,
23
  "normalized": false,
 
25
  "single_word": false,
26
  "special": true
27
  },
28
+ "3": {
29
+ "content": "<repo_name>",
30
  "lstrip": false,
31
  "normalized": false,
32
  "rstrip": false,
33
  "single_word": false,
34
  "special": true
35
  },
36
+ "4": {
37
+ "content": "<reponame>",
38
  "lstrip": false,
39
  "normalized": false,
40
  "rstrip": false,
41
  "single_word": false,
42
  "special": true
43
  },
44
+ "5": {
45
+ "content": "<file_sep>",
46
  "lstrip": false,
47
  "normalized": false,
48
  "rstrip": false,
49
  "single_word": false,
50
  "special": true
51
  },
52
+ "6": {
53
+ "content": "<filename>",
54
  "lstrip": false,
55
  "normalized": false,
56
  "rstrip": false,
57
  "single_word": false,
58
  "special": true
59
  },
60
+ "7": {
61
+ "content": "<gh_stars>",
62
  "lstrip": false,
63
  "normalized": false,
64
  "rstrip": false,
65
  "single_word": false,
66
  "special": true
67
  },
68
+ "8": {
69
+ "content": "<issue_start>",
70
  "lstrip": false,
71
  "normalized": false,
72
  "rstrip": false,
73
  "single_word": false,
74
  "special": true
75
  },
76
+ "9": {
77
+ "content": "<issue_comment>",
78
  "lstrip": false,
79
  "normalized": false,
80
  "rstrip": false,
81
  "single_word": false,
82
  "special": true
83
  },
84
+ "10": {
85
+ "content": "<issue_closed>",
86
  "lstrip": false,
87
  "normalized": false,
88
  "rstrip": false,
89
  "single_word": false,
90
  "special": true
91
  },
92
+ "11": {
93
+ "content": "<jupyter_start>",
94
  "lstrip": false,
95
  "normalized": false,
96
  "rstrip": false,
97
  "single_word": false,
98
  "special": true
99
  },
100
+ "12": {
101
+ "content": "<jupyter_text>",
102
  "lstrip": false,
103
  "normalized": false,
104
  "rstrip": false,
105
  "single_word": false,
106
  "special": true
107
  },
108
+ "13": {
109
+ "content": "<jupyter_code>",
110
+ "lstrip": false,
111
+ "normalized": false,
112
+ "rstrip": false,
113
+ "single_word": false,
114
+ "special": true
115
+ },
116
+ "14": {
117
+ "content": "<jupyter_output>",
118
+ "lstrip": false,
119
+ "normalized": false,
120
+ "rstrip": false,
121
+ "single_word": false,
122
+ "special": true
123
+ },
124
+ "15": {
125
+ "content": "<jupyter_script>",
126
+ "lstrip": false,
127
+ "normalized": false,
128
+ "rstrip": false,
129
+ "single_word": false,
130
+ "special": true
131
+ },
132
+ "16": {
133
+ "content": "<empty_output>",
134
+ "lstrip": false,
135
+ "normalized": false,
136
+ "rstrip": false,
137
+ "single_word": false,
138
+ "special": true
139
+ },
140
+ "49152": {
141
+ "content": "<fake_token_around_image>",
142
+ "lstrip": false,
143
+ "normalized": false,
144
+ "rstrip": false,
145
+ "single_word": false,
146
+ "special": true
147
+ },
148
+ "49153": {
149
+ "content": "<image>",
150
+ "lstrip": false,
151
+ "normalized": false,
152
+ "rstrip": false,
153
+ "single_word": false,
154
+ "special": true
155
+ },
156
+ "49154": {
157
+ "content": "<end_of_utterance>",
158
  "lstrip": false,
159
  "normalized": false,
160
  "rstrip": false,
 
163
  }
164
  },
165
  "additional_special_tokens": [
166
+ "<fake_token_around_image>",
167
+ "<image>",
168
+ "<end_of_utterance>"
 
 
 
 
 
 
 
 
 
 
169
  ],
170
+ "bos_token": "<|im_start|>",
171
  "clean_up_tokenization_spaces": false,
172
+ "eos_token": "<end_of_utterance>",
 
173
  "extra_special_tokens": {},
174
+ "legacy": false,
175
+ "model_max_length": 16384,
176
+ "pad_token": "<|im_end|>",
177
+ "processor_class": "Idefics3Processor",
178
+ "tokenizer_class": "GPT2Tokenizer",
179
+ "truncation_side": "left",
180
+ "unk_token": "<|endoftext|>",
181
+ "vocab_size": 49152
182
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e37a39b2beabff1416eef7134bf6f8fde339ca2ea64fb41bfcb2dc6837e74f88
3
  size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fab74f982c315694a4543400e9618801b2cf892de4700dc8a940f07e84618bcd
3
  size 5624
vocab.json CHANGED
The diff for this file is too large to render. See raw diff