File size: 1,769 Bytes
ece60a1
 
 
 
aab7dd7
ece60a1
 
 
 
aab7dd7
ece60a1
776e91c
ece60a1
2a6d098
ece60a1
 
 
 
2a6d098
 
ece60a1
 
 
 
2a6d098
a64ea3e
ece60a1
b0b2701
 
ece60a1
a64ea3e
ece60a1
 
 
 
2a6d098
ece60a1
 
2a6d098
ece60a1
a64ea3e
 
ece60a1
 
0342b92
c13e105
ece60a1
 
 
 
 
 
 
 
 
2a6d098
ece60a1
2a6d098
ece60a1
 
 
 
2a6d098
776e91c
ece60a1
 
2a6d098
ece60a1
2a6d098
ece60a1
 
1b6f2c8
 
a64ea3e
ece60a1
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
{
  "architectures": [
    "Qwen2_5_VLForConditionalGeneration"
  ],
  "dtype": "bfloat16",
  "image_token_id": 151655,
  "model_type": "qwen2_5_vl",
  "text_config": {
    "attention_dropout": 0.0,
    "dtype": "bfloat16",
    "hidden_act": "silu",
    "hidden_size": 16,
    "initializer_range": 0.02,
    "intermediate_size": 11008,
    "layer_types": [
      "full_attention",
      "full_attention"
    ],
    "max_position_embeddings": 128000,
    "max_window_layers": 70,
    "model_type": "qwen2_5_vl_text",
    "num_attention_heads": 4,
    "num_hidden_layers": 2,
    "num_key_value_heads": 2,
    "rms_norm_eps": 1e-06,
    "rope_parameters": {
      "mrope_section": [
        1,
        1
      ],
      "rope_theta": 1000000.0,
      "rope_type": "default",
      "type": "default"
    },
    "sliding_window": null,
    "tie_word_embeddings": true,
    "use_cache": true,
    "use_sliding_window": false,
    "vocab_size": 151936
  },
  "tie_word_embeddings": true,
  "transformers_version": "5.0.0.dev0",
  "video_token_id": 151656,
  "vision_config": {
    "depth": 32,
    "embed_dim": 64,
    "fullatt_block_indexes": [
      7,
      15,
      23,
      31
    ],
    "hidden_act": "silu",
    "hidden_size": 16,
    "in_channels": 3,
    "in_chans": 3,
    "initializer_range": 0.02,
    "intermediate_size": 3420,
    "model_type": "qwen2_5_vl",
    "num_attention_heads": 4,
    "num_heads": 16,
    "num_hidden_layers": 2,
    "num_key_value_heads": 2,
    "out_hidden_size": 16,
    "patch_size": 14,
    "spatial_merge_size": 2,
    "spatial_patch_size": 14,
    "temporal_patch_size": 2,
    "tokens_per_second": 2,
    "window_size": 112
  },
  "vision_end_token_id": 151653,
  "vision_start_token_id": 151652,
  "vision_token_id": 151654
}