Spaces:
Runtime error
Runtime error
Add VQA
Browse files
- prismer/model/modules/vit.py +2 -0
- prismer_model.py +1 -0
prismer/model/modules/vit.py
CHANGED
|
@@ -213,6 +213,8 @@ def load_encoder(name: str, experts: dict, image_resolution: int):
|
|
| 213 |
vision_layers = len([k for k in state_dict.keys() if k.endswith(".attn.in_proj_weight")])
|
| 214 |
vision_heads = vision_width // 64
|
| 215 |
|
|
|
|
|
|
|
| 216 |
ViT = VisionTransformer(input_resolution=image_resolution,
|
| 217 |
patch_size=vision_patch_size,
|
| 218 |
width=vision_width,
|
|
|
|
| 213 |
vision_layers = len([k for k in state_dict.keys() if k.endswith(".attn.in_proj_weight")])
|
| 214 |
vision_heads = vision_width // 64
|
| 215 |
|
| 216 |
+
print(vision_width, vision_patch_size, vision_layers, vision_heads)
|
| 217 |
+
|
| 218 |
ViT = VisionTransformer(input_resolution=image_resolution,
|
| 219 |
patch_size=vision_patch_size,
|
| 220 |
width=vision_width,
|
prismer_model.py
CHANGED
|
@@ -103,6 +103,7 @@ class Model:
|
|
| 103 |
'image_resolution': 480,
|
| 104 |
'prismer_model': model_name,
|
| 105 |
'freeze': 'freeze_vision',
|
|
|
|
| 106 |
}
|
| 107 |
|
| 108 |
model = PrismerVQA(config)
|
|
|
|
| 103 |
'image_resolution': 480,
|
| 104 |
'prismer_model': model_name,
|
| 105 |
'freeze': 'freeze_vision',
|
| 106 |
+
'prefix': '',
|
| 107 |
}
|
| 108 |
|
| 109 |
model = PrismerVQA(config)
|