{ "embed_dim": 256, "vision_cfg": { "image_size": 224, "layers": 12, "width": 384, "patch_size": 32 }, "text_cfg": { "context_length": 77, "vocab_size": 49408, "width": 256, "heads": 4, "layers": 10 } }