kshitijthakkar committed on
Commit
19dae10
·
verified ·
1 Parent(s): a35eea5

Upload Qwen3.5 tiny test model (HF-aligned, random weights)

Browse files
config.json CHANGED
@@ -57,15 +57,15 @@
57
  }
58
  },
59
  "vision_config": {
60
- "depth": 27,
61
  "hidden_act": "gelu_pytorch_tanh",
62
- "hidden_size": 1152,
63
  "in_channels": 3,
64
  "initializer_range": 0.02,
65
- "intermediate_size": 4304,
66
  "model_type": "qwen3_5_moe",
67
- "num_heads": 16,
68
- "num_position_embeddings": 2304,
69
  "out_hidden_size": 256,
70
  "patch_size": 16,
71
  "spatial_merge_size": 2,
 
57
  }
58
  },
59
  "vision_config": {
60
+ "depth": 2,
61
  "hidden_act": "gelu_pytorch_tanh",
62
+ "hidden_size": 64,
63
  "in_channels": 3,
64
  "initializer_range": 0.02,
65
+ "intermediate_size": 128,
66
  "model_type": "qwen3_5_moe",
67
+ "num_heads": 4,
68
+ "num_position_embeddings": 64,
69
  "out_hidden_size": 256,
70
  "patch_size": 16,
71
  "spatial_merge_size": 2,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f2eb97338f4f89d7aadc264d9285423fbc4ffb74796a9afb62d5e9b2e02d660
3
  size 277156688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fb5a05ebf9a777cb65e697437df10f0ca90de994207c4c5443192765605e489
3
  size 277156688
preprocessor_config.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "size": {
3
+ "longest_edge": 16777216,
4
+ "shortest_edge": 65536
5
+ },
6
+ "patch_size": 16,
7
+ "temporal_patch_size": 2,
8
+ "merge_size": 2,
9
+ "image_mean": [
10
+ 0.5,
11
+ 0.5,
12
+ 0.5
13
+ ],
14
+ "image_std": [
15
+ 0.5,
16
+ 0.5,
17
+ 0.5
18
+ ],
19
+ "processor_class": "Qwen3VLProcessor",
20
+ "image_processor_type": "Qwen2VLImageProcessorFast"
21
+ }
video_preprocessor_config.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "size": {
3
+ "longest_edge": 25165824,
4
+ "shortest_edge": 4096
5
+ },
6
+ "patch_size": 16,
7
+ "temporal_patch_size": 2,
8
+ "merge_size": 2,
9
+ "image_mean": [
10
+ 0.5,
11
+ 0.5,
12
+ 0.5
13
+ ],
14
+ "image_std": [
15
+ 0.5,
16
+ 0.5,
17
+ 0.5
18
+ ],
19
+ "processor_class": "Qwen3VLProcessor",
20
+ "video_processor_type": "Qwen3VLVideoProcessor"
21
+ }