nrizwan committed on
Commit
2d07196
·
verified ·
1 Parent(s): 9c97082

Upload processor

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
chat_template.jinja ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {% for message in messages %}{{'<|im_start|>' + message['role'] + '
2
+ '}}{% if message['content'] is string %}{{ message['content'] }}{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' %}{{ '<IMG_CONTEXT>
3
+ ' }}{% elif content['type'] == 'video' %}{{ '<video>
4
+ ' }}{% elif content['type'] == 'text' %}{{ content['text'] }}{% endif %}{% endfor %}{% endif %}{{'<|im_end|>
5
+ '}}{% endfor %}{% if add_generation_prompt %}{{'<|im_start|>assistant
6
+ ' }}{% endif %}
processor_config.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "image_processor": {
3
+ "crop_to_patches": false,
4
+ "data_format": "channels_first",
5
+ "default_to_square": true,
6
+ "do_convert_rgb": true,
7
+ "do_normalize": true,
8
+ "do_rescale": true,
9
+ "do_resize": true,
10
+ "image_mean": [
11
+ 0.485,
12
+ 0.456,
13
+ 0.406
14
+ ],
15
+ "image_processor_type": "GotOcr2ImageProcessorFast",
16
+ "image_std": [
17
+ 0.229,
18
+ 0.224,
19
+ 0.225
20
+ ],
21
+ "max_patches": 12,
22
+ "min_patches": 1,
23
+ "resample": 3,
24
+ "rescale_factor": 0.00392156862745098,
25
+ "size": {
26
+ "height": 448,
27
+ "width": 448
28
+ }
29
+ },
30
+ "image_seq_length": 256,
31
+ "processor_class": "InternVLProcessor",
32
+ "video_processor": {
33
+ "data_format": "channels_first",
34
+ "default_to_square": true,
35
+ "do_convert_rgb": true,
36
+ "do_normalize": true,
37
+ "do_rescale": true,
38
+ "do_resize": true,
39
+ "do_sample_frames": false,
40
+ "image_mean": [
41
+ 0.48145466,
42
+ 0.4578275,
43
+ 0.40821073
44
+ ],
45
+ "image_std": [
46
+ 0.26862954,
47
+ 0.26130258,
48
+ 0.27577711
49
+ ],
50
+ "initial_shift": true,
51
+ "resample": 3,
52
+ "rescale_factor": 0.00392156862745098,
53
+ "return_metadata": false,
54
+ "size": {
55
+ "height": 384,
56
+ "width": 384
57
+ },
58
+ "video_processor_type": "InternVLVideoProcessor"
59
+ }
60
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14ee001cb526cf3fd358f671849ce7839ae2bf56b8b557bd7fbd259ade40f6ae
3
+ size 11424751
tokenizer_config.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": null,
5
+ "clean_up_tokenization_spaces": false,
6
+ "context_image_token": "<IMG_CONTEXT>",
7
+ "end_image_token": "</img>",
8
+ "eos_token": "<|im_end|>",
9
+ "errors": "replace",
10
+ "extra_special_tokens": [
11
+ "<|im_start|>",
12
+ "<|im_end|>",
13
+ "<|object_ref_start|>",
14
+ "<|object_ref_end|>",
15
+ "<|box_start|>",
16
+ "<|box_end|>",
17
+ "<|quad_start|>",
18
+ "<|quad_end|>",
19
+ "<|vision_start|>",
20
+ "<|vision_end|>",
21
+ "<|vision_pad|>",
22
+ "<|image_pad|>",
23
+ "<|video_pad|>",
24
+ "<img>",
25
+ "</img>",
26
+ "<IMG_CONTEXT>",
27
+ "<quad>",
28
+ "</quad>",
29
+ "<ref>",
30
+ "</ref>",
31
+ "<box>",
32
+ "</box>"
33
+ ],
34
+ "is_local": false,
35
+ "model_max_length": 40960,
36
+ "model_specific_special_tokens": {
37
+ "context_image_token": "<IMG_CONTEXT>",
38
+ "end_image_token": "</img>",
39
+ "start_image_token": "<img>",
40
+ "video_token": "<video>"
41
+ },
42
+ "pad_token": "<|endoftext|>",
43
+ "processor_class": "InternVLProcessor",
44
+ "split_special_tokens": false,
45
+ "start_image_token": "<img>",
46
+ "tokenizer_class": "Qwen2Tokenizer",
47
+ "unk_token": null,
48
+ "video_token": "<video>"
49
+ }