muse-coyo-f8 / config.json
valhalla's picture
add model
cabf5e3
{
"_class_name": "MaskGiTUViT",
"_version": "0.0.1",
"add_cond_embeds": false,
"add_cross_attention": true,
"attention_dropout": 0.0,
"block_out_channels": [
384,
768
],
"codebook_size": 8192,
"cond_embed_dim": null,
"encoder_hidden_size": 768,
"hidden_dropout": 0.0,
"hidden_size": 1024,
"in_channels": 384,
"initializer_range": 0.02,
"intermediate_size": 4096,
"layer_norm_before_mlm": true,
"layer_norm_embedddings": true,
"layer_norm_eps": 1e-06,
"learn_uncond_embeds": false,
"ln_elementwise_affine": true,
"mask_token_id": 8255,
"max_position_embeddings": 256,
"norm_type": "rmsnorm",
"num_attention_heads": 16,
"num_classes": null,
"num_hidden_layers": 22,
"num_res_blocks": 3,
"num_vq_tokens": 1024,
"patch_size": 1,
"project_encoder_hidden_states": false,
"use_bias": false,
"use_codebook_size_for_output": true,
"use_empty_embeds_for_uncond": false,
"use_encoder_layernorm": true,
"use_normformer": false,
"use_position_embeddings": false,
"use_vannilla_resblock": false,
"vocab_size": 8256,
"xavier_init_embed": true
}