Yanqing0327 committed on
Commit
31d4f53
·
verified ·
1 Parent(s): e334466

Upload standalone vision encoder: vit-only first commit

Browse files
open_clip_config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_cfg": {
3
+ "embed_dim": 1024,
4
+ "vision_cfg": {
5
+ "layers": 24,
6
+ "width": 1024,
7
+ "patch_size": 14,
8
+ "image_size": 336,
9
+ "no_ln_pre": true,
10
+ "pool_type": "avg",
11
+ "final_ln_after_pool": true,
12
+ "norm_kwargs": {
13
+ "eps": 1e-06
14
+ },
15
+ "output_tokens": true,
16
+ "head_width": 64
17
+ },
18
+ "text_cfg": {
19
+ "context_length": 77,
20
+ "vocab_size": 49408,
21
+ "width": 512,
22
+ "heads": 8,
23
+ "layers": 12
24
+ }
25
+ }
26
+ }
open_clip_pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35dcc0fa28f26a88467b36c551806f91d983caab9be00366761613c8e909dc57
3
+ size 1218313907