Spaces:
Sleeping
Sleeping
Add VQA
Browse files
- prismer/model/modules/vit.py +2 -0
- prismer_model.py +1 -0
prismer/model/modules/vit.py
CHANGED
@@ -213,6 +213,8 @@ def load_encoder(name: str, experts: dict, image_resolution: int):
Before:
213 | vision_layers = len([k for k in state_dict.keys() if k.endswith(".attn.in_proj_weight")])
214 | vision_heads = vision_width // 64
215 |
216 | ViT = VisionTransformer(input_resolution=image_resolution,
217 | patch_size=vision_patch_size,
218 | width=vision_width,

After:
213 | vision_layers = len([k for k in state_dict.keys() if k.endswith(".attn.in_proj_weight")])
214 | vision_heads = vision_width // 64
215 |
216 | + print(vision_width, vision_patch_size, vision_layers, vision_heads)
217 | +
218 | ViT = VisionTransformer(input_resolution=image_resolution,
219 | patch_size=vision_patch_size,
220 | width=vision_width,
prismer_model.py
CHANGED
@@ -103,6 +103,7 @@ class Model:
Before:
103 | 'image_resolution': 480,
104 | 'prismer_model': model_name,
105 | 'freeze': 'freeze_vision',
106 | }
107 |
108 | model = PrismerVQA(config)

After:
103 | 'image_resolution': 480,
104 | 'prismer_model': model_name,
105 | 'freeze': 'freeze_vision',
106 | + 'prefix': '',
107 | }
108 |
109 | model = PrismerVQA(config)