Nucleus-Image / transformer /config.json
sippycoder's picture
Update transformer/config.json
6d4c738 verified
raw
history blame contribute delete
887 Bytes
{
"_class_name": "NucleusMoEImageTransformer2DModel",
"_diffusers_version": "0.38.0.dev0",
"patch_size": 2,
"in_channels": 64,
"out_channels": 16,
"num_layers": 32,
"attention_head_dim": 128,
"num_attention_heads": 16,
"num_key_value_heads": 4,
"joint_attention_dim": 4096,
"axes_dims_rope": [
16,
56,
56
],
"mlp_ratio": 4.0,
"moe_enabled": true,
"dense_moe_strategy": "leave_first_three_blocks_dense",
"num_experts": 64,
"moe_intermediate_dim": 1344,
"capacity_factors": [
0.0,
0.0,
0.0,
4.0,
4.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0,
2.0
],
"use_sigmoid": false,
"route_scale": 2.5,
"use_grouped_mm": true
}