Update config.json
Browse files
- config.json +25 -14
config.json
CHANGED
|
@@ -1,4 +1,5 @@
|
|
| 1 |
{
|
|
|
|
| 2 |
"add_classification_head": false,
|
| 3 |
"anyres_pooling_size": 2,
|
| 4 |
"anyres_vit_max_image_size": null,
|
|
@@ -6,14 +7,14 @@
|
|
| 6 |
"architectures": [
|
| 7 |
"HunyuanImage3ForCausalMM"
|
| 8 |
],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 9 |
"attention_bias": false,
|
| 10 |
"attention_dropout": 0.0,
|
| 11 |
"attention_head_dim": 128,
|
| 12 |
-
"auto_map": {
|
| 13 |
-
"AutoConfig": "configuration_hunyuan.HunyuanImage3Config",
|
| 14 |
-
"AutoModel": "hunyuan.HunyuanImage3Model",
|
| 15 |
-
"AutoModelForCausalLM": "hunyuan.HunyuanImage3ForCausalMM"
|
| 16 |
-
},
|
| 17 |
"bos_token_id": 127958,
|
| 18 |
"cla_share_factor": 2,
|
| 19 |
"class_num": 0,
|
|
@@ -34,7 +35,7 @@
|
|
| 34 |
"intermediate_size": 3072,
|
| 35 |
"kv_lora_rank": null,
|
| 36 |
"mask_init_id": 12,
|
| 37 |
-
"max_position_embeddings":
|
| 38 |
"mlp_bias": false,
|
| 39 |
"model_type": "hunyuan_image_3_moe",
|
| 40 |
"moe_drop_tokens": false,
|
|
@@ -194,15 +195,25 @@
|
|
| 194 |
"vit_path": null,
|
| 195 |
"vit_remove_prenorm": false,
|
| 196 |
"vit_token": 64,
|
| 197 |
-
"vit_type":
|
| 198 |
"vit_used_rms_norm": false,
|
| 199 |
"vocab_size": 133120,
|
| 200 |
"xdrope_section": null,
|
| 201 |
"head_dim": 128,
|
|
|
|
| 202 |
"vae_downsample_factor": [
|
| 203 |
16,
|
| 204 |
16
|
| 205 |
],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 206 |
"vae": {
|
| 207 |
"_class_name": "AutoencoderKLConv3D",
|
| 208 |
"block_out_channels": [
|
|
@@ -247,15 +258,15 @@
|
|
| 247 |
"do_rescale": true,
|
| 248 |
"do_resize": true,
|
| 249 |
"image_mean": [
|
| 250 |
-
|
| 251 |
-
|
| 252 |
-
|
| 253 |
],
|
| 254 |
"image_processor_type": "Siglip2ImageProcessorFast",
|
| 255 |
"image_std": [
|
| 256 |
-
|
| 257 |
-
|
| 258 |
-
|
| 259 |
],
|
| 260 |
"max_num_patches": 1024,
|
| 261 |
"patch_size": 16,
|
|
@@ -270,4 +281,4 @@
|
|
| 270 |
"depth": 2,
|
| 271 |
"torch_dtype": "float32"
|
| 272 |
}
|
| 273 |
-
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"model_version": "HunyuanImage-3.0",
|
| 3 |
"add_classification_head": false,
|
| 4 |
"anyres_pooling_size": 2,
|
| 5 |
"anyres_vit_max_image_size": null,
|
|
|
|
| 7 |
"architectures": [
|
| 8 |
"HunyuanImage3ForCausalMM"
|
| 9 |
],
|
| 10 |
+
"auto_map": {
|
| 11 |
+
"AutoConfig": "configuration_hunyuan_image_3.HunyuanImage3Config",
|
| 12 |
+
"AutoModel": "modeling_hunyuan_image_3.HunyuanImage3Model",
|
| 13 |
+
"AutoModelForCausalLM": "modeling_hunyuan_image_3.HunyuanImage3ForCausalMM"
|
| 14 |
+
},
|
| 15 |
"attention_bias": false,
|
| 16 |
"attention_dropout": 0.0,
|
| 17 |
"attention_head_dim": 128,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 18 |
"bos_token_id": 127958,
|
| 19 |
"cla_share_factor": 2,
|
| 20 |
"class_num": 0,
|
|
|
|
| 35 |
"intermediate_size": 3072,
|
| 36 |
"kv_lora_rank": null,
|
| 37 |
"mask_init_id": 12,
|
| 38 |
+
"max_position_embeddings": 22800,
|
| 39 |
"mlp_bias": false,
|
| 40 |
"model_type": "hunyuan_image_3_moe",
|
| 41 |
"moe_drop_tokens": false,
|
|
|
|
| 195 |
"vit_path": null,
|
| 196 |
"vit_remove_prenorm": false,
|
| 197 |
"vit_token": 64,
|
| 198 |
+
"vit_type": "siglip2-so400m-patch16-naflex",
|
| 199 |
"vit_used_rms_norm": false,
|
| 200 |
"vocab_size": 133120,
|
| 201 |
"xdrope_section": null,
|
| 202 |
"head_dim": 128,
|
| 203 |
+
"rope_type": "2d",
|
| 204 |
"vae_downsample_factor": [
|
| 205 |
16,
|
| 206 |
16
|
| 207 |
],
|
| 208 |
+
"vit_downsample_factor": [
|
| 209 |
+
16,
|
| 210 |
+
16
|
| 211 |
+
],
|
| 212 |
+
"cond_token_attn_type": "joint_full",
|
| 213 |
+
"cond_image_type": "vae_vit",
|
| 214 |
+
"vae_type": "hunyuan-image-vae-v1",
|
| 215 |
+
"vae_dtype": "float32",
|
| 216 |
+
"vae_autocast_dtype": "float16",
|
| 217 |
"vae": {
|
| 218 |
"_class_name": "AutoencoderKLConv3D",
|
| 219 |
"block_out_channels": [
|
|
|
|
| 258 |
"do_rescale": true,
|
| 259 |
"do_resize": true,
|
| 260 |
"image_mean": [
|
| 261 |
+
0.5,
|
| 262 |
+
0.5,
|
| 263 |
+
0.5
|
| 264 |
],
|
| 265 |
"image_processor_type": "Siglip2ImageProcessorFast",
|
| 266 |
"image_std": [
|
| 267 |
+
0.5,
|
| 268 |
+
0.5,
|
| 269 |
+
0.5
|
| 270 |
],
|
| 271 |
"max_num_patches": 1024,
|
| 272 |
"patch_size": 16,
|
|
|
|
| 281 |
"depth": 2,
|
| 282 |
"torch_dtype": "float32"
|
| 283 |
}
|
| 284 |
+
}
|