unified_vit_v40-vision-decoder / open_clip_config.json
Letian2003's picture
Upload standalone vision decoder: vit-only first commit
20c59d9 verified
{
"model_cfg": {
"embed_dim": 768,
"vision_cfg": {
"width": 768,
"layers": 12,
"patch_size": 1,
"image_size": 16,
"no_ln_pre": true,
"pool_type": "avg",
"final_ln_after_pool": true,
"norm_kwargs": {
"eps": 1e-06
},
"output_tokens": true,
"head_width": 64,
"in_channels": 1024
},
"text_cfg": {
"context_length": 77,
"vocab_size": 49408,
"width": 512,
"heads": 8,
"layers": 12
}
}
}