kobiakor15 committed on
Commit
d443538
·
verified ·
1 Parent(s): f214cd0

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +27 -26
config.json CHANGED
@@ -6,31 +6,33 @@
6
 
7
  "vision_encoders": {
8
  "dinov3": {
9
- "path": "vision_encoders/dinov2-large",
10
- "model_id": "facebook/dinov3-large",
11
- "hidden_size": 1024,
12
- "num_layers": 24,
13
- "num_heads": 16
 
 
14
  },
15
- "siglip": {
16
- "path": "vision_encoders/siglip-base",
17
- "model_id": "google/siglip-base-patch16-224",
18
- "hidden_size": 768,
19
- "num_layers": 12,
20
- "num_heads": 12
 
 
21
  }
22
  },
23
 
24
  "language_model": {
25
- "captioning": {
26
- "path": "language_model/blip-captioning",
27
- "model_id": "Salesforce/blip-image-captioning-base"
28
- },
29
- "vqa": {
30
- "path": "language_model/blip-vqa-finetuned",
31
- "base_model_id": "Salesforce/blip-vqa-base",
32
- "finetuned": true
33
- }
34
  },
35
 
36
  "trained_components": {
@@ -39,15 +41,14 @@
39
  },
40
 
41
  "projector_config": {
42
- "fused_vision_dim": 1792,
43
- "hidden_dim": 2048,
44
- "num_tokens": 64,
45
- "output_dim": 768
46
  },
47
 
48
  "task_heads": {
49
- "detection_classes": 80,
50
- "segmentation_classes": 150
51
  },
52
 
53
  "instruct_enabled": true,
 
6
 
7
  "vision_encoders": {
8
  "dinov3": {
9
+ "path": "vision_encoders/dinov3-large",
10
+ "model_id": "facebook/dinov3-vith16plus-pretrain-lvd1689m",
11
+ "hidden_size": 1280,
12
+ "num_layers": 32,
13
+ "num_heads": 16,
14
+ "image_size": 224,
15
+ "patch_size": 16
16
  },
17
+ "siglip2": {
18
+ "path": "vision_encoders/siglip2-so400m",
19
+ "model_id": "google/siglip2-so400m-patch16-naflex",
20
+ "hidden_size": 1152,
21
+ "num_layers": 27,
22
+ "num_heads": 16,
23
+ "image_size": 384,
24
+ "patch_size": 16
25
  }
26
  },
27
 
28
  "language_model": {
29
+ "path": "language_model/lfm2.5-1.2b",
30
+ "model_id": "LiquidAI/LFM2.5-1.2B-Base",
31
+ "hidden_size": 1536,
32
+ "num_layers": 16,
33
+ "num_heads": 24,
34
+ "vocab_size": 131072,
35
+ "max_position_embeddings": 32768
 
 
36
  },
37
 
38
  "trained_components": {
 
41
  },
42
 
43
  "projector_config": {
44
+ "fused_vision_dim": 2432,
45
+ "hidden_dim": 4864,
46
+ "output_dim": 1536
 
47
  },
48
 
49
  "task_heads": {
50
+ "segmentation_classes": 150,
51
+ "detection_classes": 80
52
  },
53
 
54
  "instruct_enabled": true,