kobiakor15 committed on
Commit
a26f847
·
verified ·
1 Parent(s): 57a52a8

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +6 -12
config.json CHANGED
@@ -1,21 +1,18 @@
1
  {
2
  "model_type": "oculus",
3
  "architectures": ["OculusForConditionalGeneration"],
4
- "variant": "Unified",
5
  "version": "0.1",
6
 
7
  "vision_encoders": {
8
  "dinov3": {
9
- "path": "vision_encoders/dinov3-large",
10
- "model_id": "facebook/dinov3-vith16plus-pretrain-lvd1689m",
11
- "hidden_size": 1280,
12
- "num_layers": 32,
13
  "num_heads": 16,
14
  "image_size": 224,
15
  "patch_size": 16
16
  },
17
  "siglip2": {
18
- "path": "vision_encoders/siglip2-so400m",
19
  "model_id": "google/siglip2-so400m-patch16-naflex",
20
  "hidden_size": 1152,
21
  "num_layers": 27,
@@ -26,7 +23,6 @@
26
  },
27
 
28
  "language_model": {
29
- "path": "language_model/lfm2.5-1.2b",
30
  "model_id": "LiquidAI/LFM2.5-1.2B-Base",
31
  "hidden_size": 1536,
32
  "num_layers": 16,
@@ -41,8 +37,8 @@
41
  },
42
 
43
  "projector_config": {
44
- "fused_vision_dim": 2432,
45
- "hidden_dim": 4864,
46
  "output_dim": 1536
47
  },
48
 
@@ -51,10 +47,8 @@
51
  "detection_classes": 80
52
  },
53
 
54
- "instruct_enabled": true,
55
  "reasoning_enabled": true,
56
  "thinking_token": "<think>",
57
  "thinking_end_token": "</think>",
58
- "max_thinking_tokens": 256,
59
- "standalone": true
60
  }
 
1
  {
2
  "model_type": "oculus",
3
  "architectures": ["OculusForConditionalGeneration"],
 
4
  "version": "0.1",
5
 
6
  "vision_encoders": {
7
  "dinov3": {
8
+ "model_id": "facebook/dinov3-vitl16-pretrain-lvd1689m",
9
+ "hidden_size": 1024,
10
+ "num_layers": 24,
 
11
  "num_heads": 16,
12
  "image_size": 224,
13
  "patch_size": 16
14
  },
15
  "siglip2": {
 
16
  "model_id": "google/siglip2-so400m-patch16-naflex",
17
  "hidden_size": 1152,
18
  "num_layers": 27,
 
23
  },
24
 
25
  "language_model": {
 
26
  "model_id": "LiquidAI/LFM2.5-1.2B-Base",
27
  "hidden_size": 1536,
28
  "num_layers": 16,
 
37
  },
38
 
39
  "projector_config": {
40
+ "fused_vision_dim": 2176,
41
+ "hidden_dim": 4352,
42
  "output_dim": 1536
43
  },
44
 
 
47
  "detection_classes": 80
48
  },
49
 
 
50
  "reasoning_enabled": true,
51
  "thinking_token": "<think>",
52
  "thinking_end_token": "</think>",
53
+ "max_thinking_tokens": 256
 
54
  }