abetlen committed on
Commit
3d55748
1 Parent(s): 095de53

Update mmproj conversion

Browse files
Phi-3.5-3.8B-vision-instruct-mmproj-F16.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a7383c19d46afba480b39fda2ed75bfb19e3ca68932105a85aa1286bd861dad
3
  size 652183008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab8449cc7527c21d7082a6ca8266f67a71b459019f67e814ae1683700e61f3f9
3
  size 652183008
convert_image_gguf.py CHANGED
@@ -59,14 +59,14 @@ def main():
59
  # initializer_range=0.02,
60
  # initializer_factor=1.0,
61
  clip_vision_config = {
62
- "hidden_size": 1024,
63
- "intermediate_size": 4096,
64
- "projection_dim": 1024,
65
- "num_hidden_layers": 24,
66
- "num_attention_heads": 16,
67
  "num_channels": 3,
68
  "image_size": 224,
69
- "patch_size": 14,
70
  "hidden_act": "quick_gelu",
71
  "layer_norm_eps": 1e-5,
72
  "attention_dropout": 0.0,
@@ -94,7 +94,7 @@ def main():
94
  dropout=0.0,
95
  hidden_act="quick_gelu",
96
  hidden_size=1024,
97
- image_size=224,
98
  initializer_factor=1.0,
99
  initializer_range=0.02,
100
  intermediate_size=4096,
@@ -103,7 +103,7 @@ def main():
103
  num_channels=3,
104
  num_hidden_layers=24,
105
  patch_size=14,
106
- projection_dim=1024
107
  ))
108
 
109
 
 
59
  # initializer_range=0.02,
60
  # initializer_factor=1.0,
61
  clip_vision_config = {
62
+ "hidden_size": 768,
63
+ "intermediate_size": 3072,
64
+ "projection_dim": 512,
65
+ "num_hidden_layers": 12,
66
+ "num_attention_heads": 12,
67
  "num_channels": 3,
68
  "image_size": 224,
69
+ "patch_size": 32,
70
  "hidden_act": "quick_gelu",
71
  "layer_norm_eps": 1e-5,
72
  "attention_dropout": 0.0,
 
94
  dropout=0.0,
95
  hidden_act="quick_gelu",
96
  hidden_size=1024,
97
+ image_size=336,
98
  initializer_factor=1.0,
99
  initializer_range=0.02,
100
  intermediate_size=4096,
 
103
  num_channels=3,
104
  num_hidden_layers=24,
105
  patch_size=14,
106
+ projection_dim=768
107
  ))
108
 
109