shikunl committed on
Commit
539688d
•
1 Parent(s): 073a46b
Files changed (2) hide show
  1. prismer/model/modules/vit.py +2 -0
  2. prismer_model.py +1 -0
prismer/model/modules/vit.py CHANGED
@@ -213,6 +213,8 @@ def load_encoder(name: str, experts: dict, image_resolution: int):
213
  vision_layers = len([k for k in state_dict.keys() if k.endswith(".attn.in_proj_weight")])
214
  vision_heads = vision_width // 64
215
 
 
 
216
  ViT = VisionTransformer(input_resolution=image_resolution,
217
  patch_size=vision_patch_size,
218
  width=vision_width,
 
213
  vision_layers = len([k for k in state_dict.keys() if k.endswith(".attn.in_proj_weight")])
214
  vision_heads = vision_width // 64
215
 
216
+ print(vision_width, vision_patch_size, vision_layers, vision_heads)
217
+
218
  ViT = VisionTransformer(input_resolution=image_resolution,
219
  patch_size=vision_patch_size,
220
  width=vision_width,
prismer_model.py CHANGED
@@ -103,6 +103,7 @@ class Model:
103
  'image_resolution': 480,
104
  'prismer_model': model_name,
105
  'freeze': 'freeze_vision',
 
106
  }
107
 
108
  model = PrismerVQA(config)
 
103
  'image_resolution': 480,
104
  'prismer_model': model_name,
105
  'freeze': 'freeze_vision',
106
+ 'prefix': '',
107
  }
108
 
109
  model = PrismerVQA(config)