{
  "model_type": "oculus",
  "architectures": ["OculusForConditionalGeneration"],
  "architecture_name": "Oceanir-Oculus OO1",
  "version": "0.1",

  "vision_config": {
    "hidden_size": 1024,
    "num_layers": 24,
    "num_heads": 16,
    "image_size": 224,
    "patch_size": 16
  },

  "language_config": {
    "hidden_size": 1536,
    "num_layers": 16,
    "num_heads": 24,
    "vocab_size": 131072,
    "max_position_embeddings": 32768
  },

  "trained_components": {
    "projector": "trained_components/projector.npz",
    "heads": "trained_components/heads.pth"
  },

  "projector_config": {
    "fused_vision_dim": 2176,
    "hidden_dim": 4352,
    "output_dim": 1536,
    "num_tokens": 64
  },

  "task_heads": {
    "segmentation_classes": 150,
    "detection_classes": 80,
    "ui_element_classes": 50
  },

  "reasoning": {
    "enabled": true,
    "thinking_token": "<think>",
    "thinking_end_token": "</think>",
    "max_thinking_tokens": 256,
    "style": "structured"
  },

  "focus_system": {
    "enabled": true,
    "focus_token": "<focus>",
    "focus_end_token": "</focus>",
    "max_regions": 4,
    "min_crop_size": 64,
    "auto_threshold": 0.7
  },

  "structured_output": {
    "enabled": true,
    "json_token": "<json>",
    "json_end_token": "</json>",
    "box_token": "<box>",
    "box_end_token": "</box>",
    "point_token": "<point>",
    "point_end_token": "</point>"
  },

  "ocr": {
    "enabled": true,
    "languages": ["en"],
    "confidence_threshold": 0.5
  },

  "ui_understanding": {
    "enabled": true,
    "element_classes": 50
  },

  "generation": {
    "max_new_tokens": 512,
    "temperature": 0.7,
    "top_p": 0.95
  }
}