{
  "architectures": [
    "CLIPModel"
  ],
  "initializer_factor": 1.0,
  "logit_scale_init_value": 2.6592,
  "model_type": "clip",
  "projection_dim": 512,
  "text_config": {
    "eos_token_id": 1,
    "model_type": "clip_text_model",
    "pad_token_id": 0,
    "vocab_size": 32100
  },
  "torch_dtype": "float32",
  "transformers_version": "4.38.1",
  "vision_config": {
    "model_type": "clip_vision_model",
    "patch_size": 16
  }
}