Letian2003 committed on
Commit
f9009f7
·
verified ·
1 Parent(s): 12f66a5

Upload standalone vision encoder: vit-only first commit

Browse files
open_clip_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_cfg": {
3
+ "embed_dim": 1024,
4
+ "vision_cfg": {
5
+ "layers": 24,
6
+ "width": 1024,
7
+ "patch_size": 2,
8
+ "image_size": 32,
9
+ "no_ln_pre": true,
10
+ "pool_type": "avg",
11
+ "final_ln_after_pool": true,
12
+ "norm_kwargs": {
13
+ "eps": 1e-06
14
+ },
15
+ "output_tokens": true,
16
+ "head_width": 64,
17
+ "in_channels": 16
18
+ },
19
+ "text_cfg": {
20
+ "context_length": 77,
21
+ "vocab_size": 49408,
22
+ "width": 512,
23
+ "heads": 8,
24
+ "layers": 12
25
+ }
26
+ }
27
+ }
open_clip_pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e08712b727e58f1e539f15a2eed96869972cd0f1cfe5baf9ef0b03207999eb69
3
+ size 1214856883