h0witended committed on
Commit
f04681d
·
verified ·
1 Parent(s): cf72633

Upload folder using huggingface_hub

Browse files
Files changed (3) hide show
  1. config.json +8 -8
  2. modeling_minicpmo.py +1 -1
  3. pytorch_model.bin +2 -2
config.json CHANGED
@@ -146,20 +146,20 @@
146
  "drop_vision_last_layer": false,
147
  "eos_token_id": 151645,
148
  "hidden_act": "silu",
149
- "hidden_size": 256,
150
  "image_size": 448,
151
  "init_audio": false,
152
  "init_tts": false,
153
  "init_vision": true,
154
  "initializer_range": 0.02,
155
- "intermediate_size": 512,
156
  "listen_speak_type": "asr",
157
- "max_position_embeddings": 128,
158
  "max_window_layers": 28,
159
  "model_type": "minicpmo",
160
- "num_attention_heads": 4,
161
- "num_hidden_layers": 2,
162
- "num_key_value_heads": 4,
163
  "patch_size": 14,
164
  "query_num": 64,
165
  "rms_norm_eps": 1e-06,
@@ -172,7 +172,7 @@
172
  "slice_mode": true,
173
  "sliding_window": null,
174
  "stream_input": false,
175
- "tie_word_embeddings": false,
176
  "torch_dtype": "bfloat16",
177
  "transformers_version": "4.46.2",
178
  "tts_config": {
@@ -193,5 +193,5 @@
193
  "num_hidden_layers": 1,
194
  "patch_size": 14
195
  },
196
- "vocab_size": 320
197
  }
 
146
  "drop_vision_last_layer": false,
147
  "eos_token_id": 151645,
148
  "hidden_act": "silu",
149
+ "hidden_size": 16,
150
  "image_size": 448,
151
  "init_audio": false,
152
  "init_tts": false,
153
  "init_vision": true,
154
  "initializer_range": 0.02,
155
+ "intermediate_size": 32,
156
  "listen_speak_type": "asr",
157
+ "max_position_embeddings": 2048,
158
  "max_window_layers": 28,
159
  "model_type": "minicpmo",
160
+ "num_attention_heads": 2,
161
+ "num_hidden_layers": 1,
162
+ "num_key_value_heads": 2,
163
  "patch_size": 14,
164
  "query_num": 64,
165
  "rms_norm_eps": 1e-06,
 
172
  "slice_mode": true,
173
  "sliding_window": null,
174
  "stream_input": false,
175
+ "tie_word_embeddings": true,
176
  "torch_dtype": "bfloat16",
177
  "transformers_version": "4.46.2",
178
  "tts_config": {
 
193
  "num_hidden_layers": 1,
194
  "patch_size": 14
195
  },
196
+ "vocab_size": 151700
197
  }
modeling_minicpmo.py CHANGED
@@ -206,7 +206,7 @@ class MiniCPMO(MiniCPMOPreTrainedModel):
206
  return Resampler(
207
  num_queries=self.config.query_num,
208
  embed_dim=embed_dim,
209
- num_heads=embed_dim // 128,
210
  kv_dim=vision_dim,
211
  adaptive=True,
212
  )
 
206
  return Resampler(
207
  num_queries=self.config.query_num,
208
  embed_dim=embed_dim,
209
+ num_heads=max(1, embed_dim // 128),
210
  kv_dim=vision_dim,
211
  adaptive=True,
212
  )
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c91ebd65c3f39ed36a031a9eb5722a54facafece3b60bcc554b6e02d624cadc4
3
- size 3760638
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5d5eb21618db4f4f5c73a408cae4a9d842e334d4419a3b278a7ec5bdb1970a2
3
+ size 4968727