Yanqing0327's picture
Upload standalone vision encoder: vit-only first commit
ed61fa3 verified
raw
history blame contribute delete
529 Bytes
{
"model_cfg": {
"embed_dim": 1408,
"vision_cfg": {
"layers": 40,
"width": 1408,
"patch_size": 14,
"image_size": 224,
"no_ln_pre": true,
"pool_type": "avg",
"final_ln_after_pool": true,
"mlp_ratio": 4.363636363636363,
"norm_kwargs": {
"eps": 1e-06
},
"output_tokens": true,
"head_width": 88
},
"text_cfg": {
"context_length": 77,
"vocab_size": 49408,
"width": 512,
"heads": 8,
"layers": 12
}
}
}