Spaces:
Sleeping
Sleeping
Add VQA
Browse files
prismer/model/modules/vit.py
CHANGED
@@ -213,8 +213,6 @@ def load_encoder(name: str, experts: dict, image_resolution: int):
|
|
213 |
vision_layers = len([k for k in state_dict.keys() if k.endswith(".attn.in_proj_weight")])
|
214 |
vision_heads = vision_width // 64
|
215 |
|
216 |
-
print(vision_width, vision_patch_size, vision_layers, vision_heads)
|
217 |
-
|
218 |
ViT = VisionTransformer(input_resolution=image_resolution,
|
219 |
patch_size=vision_patch_size,
|
220 |
width=vision_width,
|
|
|
213 |
vision_layers = len([k for k in state_dict.keys() if k.endswith(".attn.in_proj_weight")])
|
214 |
vision_heads = vision_width // 64
|
215 |
|
|
|
|
|
216 |
ViT = VisionTransformer(input_resolution=image_resolution,
|
217 |
patch_size=vision_patch_size,
|
218 |
width=vision_width,
|