File size: 1,360 Bytes
2a5e44b
 
 
 
956de1a
5899b79
2a5e44b
 
 
 
5899b79
2a5e44b
5899b79
2a5e44b
5899b79
 
2a5e44b
5899b79
2a5e44b
5899b79
2a5e44b
 
 
 
5899b79
 
2a5e44b
 
 
5899b79
2a5e44b
5899b79
2a5e44b
 
 
5899b79
2a5e44b
 
5899b79
 
 
2a5e44b
5899b79
2a5e44b
 
 
 
5899b79
2a5e44b
 
5899b79
 
2a5e44b
 
 
 
5899b79
 
2a5e44b
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
{
  "architectures": [
    "Qwen3VLForConditionalGeneration"
  ],
  "dtype": "float32",
  "image_token_id": 151655,
  "model_type": "qwen3_vl",
  "text_config": {
    "attention_bias": false,
    "attention_dropout": 0.0,
    "head_dim": 32,
    "hidden_act": "silu",
    "hidden_size": 8,
    "initializer_range": 0.02,
    "intermediate_size": 64,
    "max_position_embeddings": 262144,
    "model_type": "qwen3_vl_text",
    "num_attention_heads": 8,
    "num_hidden_layers": 2,
    "num_key_value_heads": 4,
    "rms_norm_eps": 1e-06,
    "rope_scaling": {
      "mrope_section": [
        8,
        4,
        4
      ],
      "rope_type": "default"
    },
    "rope_theta": 5000000,
    "use_cache": true,
    "vocab_size": 151936
  },
  "tie_word_embeddings": false,
  "transformers_version": "4.57.0.dev0",
  "video_token_id": 151656,
  "vision_config": {
    "deepstack_visual_indexes": [
      1,
      3,
      5
    ],
    "depth": 6,
    "hidden_act": "gelu_pytorch_tanh",
    "hidden_size": 128,
    "in_channels": 3,
    "initializer_range": 0.02,
    "intermediate_size": 64,
    "model_type": "qwen3_vl",
    "num_heads": 4,
    "num_position_embeddings": 2304,
    "out_hidden_size": 8,
    "patch_size": 16,
    "spatial_merge_size": 2,
    "temporal_patch_size": 2
  },
  "vision_end_token_id": 151653,
  "vision_start_token_id": 151652
}