Tibron committed on
Commit
b6abd7b
·
verified ·
1 Parent(s): 7bb3b26

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +25 -14
config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "add_classification_head": false,
3
  "anyres_pooling_size": 2,
4
  "anyres_vit_max_image_size": null,
@@ -6,14 +7,14 @@
6
  "architectures": [
7
  "HunyuanImage3ForCausalMM"
8
  ],
 
 
 
 
 
9
  "attention_bias": false,
10
  "attention_dropout": 0.0,
11
  "attention_head_dim": 128,
12
- "auto_map": {
13
- "AutoConfig": "configuration_hunyuan.HunyuanImage3Config",
14
- "AutoModel": "hunyuan.HunyuanImage3Model",
15
- "AutoModelForCausalLM": "hunyuan.HunyuanImage3ForCausalMM"
16
- },
17
  "bos_token_id": 127958,
18
  "cla_share_factor": 2,
19
  "class_num": 0,
@@ -34,7 +35,7 @@
34
  "intermediate_size": 3072,
35
  "kv_lora_rank": null,
36
  "mask_init_id": 12,
37
- "max_position_embeddings": 12800,
38
  "mlp_bias": false,
39
  "model_type": "hunyuan_image_3_moe",
40
  "moe_drop_tokens": false,
@@ -194,15 +195,25 @@
194
  "vit_path": null,
195
  "vit_remove_prenorm": false,
196
  "vit_token": 64,
197
- "vit_type": null,
198
  "vit_used_rms_norm": false,
199
  "vocab_size": 133120,
200
  "xdrope_section": null,
201
  "head_dim": 128,
 
202
  "vae_downsample_factor": [
203
  16,
204
  16
205
  ],
 
 
 
 
 
 
 
 
 
206
  "vae": {
207
  "_class_name": "AutoencoderKLConv3D",
208
  "block_out_channels": [
@@ -247,15 +258,15 @@
247
  "do_rescale": true,
248
  "do_resize": true,
249
  "image_mean": [
250
- 0.5,
251
- 0.5,
252
- 0.5
253
  ],
254
  "image_processor_type": "Siglip2ImageProcessorFast",
255
  "image_std": [
256
- 0.5,
257
- 0.5,
258
- 0.5
259
  ],
260
  "max_num_patches": 1024,
261
  "patch_size": 16,
@@ -270,4 +281,4 @@
270
  "depth": 2,
271
  "torch_dtype": "float32"
272
  }
273
- }
 
1
  {
2
+ "model_version": "HunyuanImage-3.0",
3
  "add_classification_head": false,
4
  "anyres_pooling_size": 2,
5
  "anyres_vit_max_image_size": null,
 
7
  "architectures": [
8
  "HunyuanImage3ForCausalMM"
9
  ],
10
+ "auto_map": {
11
+ "AutoConfig": "configuration_hunyuan_image_3.HunyuanImage3Config",
12
+ "AutoModel": "modeling_hunyuan_image_3.HunyuanImage3Model",
13
+ "AutoModelForCausalLM": "modeling_hunyuan_image_3.HunyuanImage3ForCausalMM"
14
+ },
15
  "attention_bias": false,
16
  "attention_dropout": 0.0,
17
  "attention_head_dim": 128,
 
 
 
 
 
18
  "bos_token_id": 127958,
19
  "cla_share_factor": 2,
20
  "class_num": 0,
 
35
  "intermediate_size": 3072,
36
  "kv_lora_rank": null,
37
  "mask_init_id": 12,
38
+ "max_position_embeddings": 22800,
39
  "mlp_bias": false,
40
  "model_type": "hunyuan_image_3_moe",
41
  "moe_drop_tokens": false,
 
195
  "vit_path": null,
196
  "vit_remove_prenorm": false,
197
  "vit_token": 64,
198
+ "vit_type": "siglip2-so400m-patch16-naflex",
199
  "vit_used_rms_norm": false,
200
  "vocab_size": 133120,
201
  "xdrope_section": null,
202
  "head_dim": 128,
203
+ "rope_type": "2d",
204
  "vae_downsample_factor": [
205
  16,
206
  16
207
  ],
208
+ "vit_downsample_factor": [
209
+ 16,
210
+ 16
211
+ ],
212
+ "cond_token_attn_type": "joint_full",
213
+ "cond_image_type": "vae_vit",
214
+ "vae_type": "hunyuan-image-vae-v1",
215
+ "vae_dtype": "float32",
216
+ "vae_autocast_dtype": "float16",
217
  "vae": {
218
  "_class_name": "AutoencoderKLConv3D",
219
  "block_out_channels": [
 
258
  "do_rescale": true,
259
  "do_resize": true,
260
  "image_mean": [
261
+ 0.5,
262
+ 0.5,
263
+ 0.5
264
  ],
265
  "image_processor_type": "Siglip2ImageProcessorFast",
266
  "image_std": [
267
+ 0.5,
268
+ 0.5,
269
+ 0.5
270
  ],
271
  "max_num_patches": 1024,
272
  "patch_size": 16,
 
281
  "depth": 2,
282
  "torch_dtype": "float32"
283
  }
284
+ }