andito HF Staff committed on
Commit
40c845e
·
verified ·
1 Parent(s): b709208

Upload nanoVLM using push_to_hub

Browse files
Files changed (2) hide show
  1. config.json +3 -3
  2. model.safetensors +2 -2
config.json CHANGED
@@ -2,13 +2,13 @@
2
  "vit_hidden_dim": 768,
3
  "vit_inter_dim": 3072,
4
  "vit_patch_size": 16,
5
- "vit_img_size": 512,
6
  "vit_n_heads": 12,
7
  "vit_dropout": 0.0,
8
  "vit_n_blocks": 12,
9
  "vit_ln_eps": 1e-06,
10
  "vit_cls_flag": false,
11
- "vit_model_type": "google/siglip2-base-patch16-512",
12
  "lm_hidden_dim": 960,
13
  "lm_inter_dim": 2560,
14
  "lm_rms_eps": 1e-05,
@@ -29,7 +29,7 @@
29
  "lm_tokenizer": "HuggingFaceTB/SmolLM2-360M-Instruct",
30
  "lm_chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
31
  "lm_eos_token_id": 0,
32
- "mp_pixel_shuffle_factor": 4,
33
  "mp_image_token_length": 64,
34
  "vlm_extra_tokens": {
35
  "image_token": "<|image|>"
 
2
  "vit_hidden_dim": 768,
3
  "vit_inter_dim": 3072,
4
  "vit_patch_size": 16,
5
+ "vit_img_size": 256,
6
  "vit_n_heads": 12,
7
  "vit_dropout": 0.0,
8
  "vit_n_blocks": 12,
9
  "vit_ln_eps": 1e-06,
10
  "vit_cls_flag": false,
11
+ "vit_model_type": "google/siglip2-base-patch16-256",
12
  "lm_hidden_dim": 960,
13
  "lm_inter_dim": 2560,
14
  "lm_rms_eps": 1e-05,
 
29
  "lm_tokenizer": "HuggingFaceTB/SmolLM2-360M-Instruct",
30
  "lm_chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
31
  "lm_eos_token_id": 0,
32
+ "mp_pixel_shuffle_factor": 2,
33
  "mp_image_token_length": 64,
34
  "vlm_extra_tokens": {
35
  "image_token": "<|image|>"
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18d0df67f25cc65078214d3e7e241c3c71fadc637bd409be9fae02992bbe37eb
3
- size 1840254904
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a270f1eb5d3c832f762ae2f92225a56e4d68ffcff8e5b4f3ffc3efce01af9ac5
3
+ size 1802506128