{
  "embed_dim": 768,
  "vision_cfg": {
    "image_size": 224,
    "layers": 24,
    "width": 1024,
    "patch_size": 14,
    "attentional_pool": true,
    "attn_pooler_heads": 8,
    "output_tokens": true
  },
  "text_cfg": {
    "context_length": 76,
    "vocab_size": 49408,
    "width": 768,
    "heads": 12,
    "layers": 12,
    "embed_cls": true,
    "output_tokens": true
  },
  "multimodal_cfg": {
    "context_length": 76,
    "vocab_size": 49408,
    "width": 768,
    "heads": 12,
    "layers": 12,
    "attn_pooler_heads": 12
  },
  "custom_text": true
}