Letian2003 committed on
Commit
4e43ee1
·
verified ·
1 Parent(s): f1e4101

Upload standalone vision decoder: vit-only first commit

Browse files
open_clip_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_cfg": {
3
+ "embed_dim": 768,
4
+ "vision_cfg": {
5
+ "width": 768,
6
+ "layers": 12,
7
+ "patch_size": 1,
8
+ "image_size": 16,
9
+ "no_ln_pre": true,
10
+ "pool_type": "avg",
11
+ "final_ln_after_pool": true,
12
+ "norm_kwargs": {
13
+ "eps": 1e-06
14
+ },
15
+ "output_tokens": true,
16
+ "head_width": 64,
17
+ "in_channels": 768
18
+ },
19
+ "text_cfg": {
20
+ "context_length": 77,
21
+ "vocab_size": 49408,
22
+ "width": 512,
23
+ "heads": 8,
24
+ "layers": 12
25
+ }
26
+ }
27
+ }
open_clip_pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d533f5f95157903cecc2a9b3d380e8af47de71c7a11867108f8dfbcc15c4bde
3
+ size 345785299