Letian2003 committed on
Commit
5d2f844
·
verified ·
1 Parent(s): a96fa6f

Upload standalone vision decoder: vit-only first commit

Browse files
open_clip_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_cfg": {
3
+ "embed_dim": 512,
4
+ "vision_cfg": {
5
+ "width": 512,
6
+ "layers": 12,
7
+ "patch_size": 1,
8
+ "image_size": 16,
9
+ "no_ln_pre": true,
10
+ "pool_type": "avg",
11
+ "final_ln_after_pool": true,
12
+ "norm_kwargs": {
13
+ "eps": 1e-06
14
+ },
15
+ "output_tokens": true,
16
+ "head_width": 64,
17
+ "in_channels": 1024
18
+ },
19
+ "text_cfg": {
20
+ "context_length": 77,
21
+ "vocab_size": 49408,
22
+ "width": 512,
23
+ "heads": 8,
24
+ "layers": 12
25
+ }
26
+ }
27
+ }
open_clip_pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fb5e333c2856c25227aa43e43ae3a7dc6bb27d450f620a813c8b3309a8731ab
3
+ size 155042771