msluszniak committed on
Commit
1e50a8e
·
verified ·
1 Parent(s): 48c2dab

Add spec-compliant config.json files

Browse files
Files changed (2) hide show
  1. 0_8b/xnnpack/config.json +65 -1
  2. 2b/xnnpack/config.json +65 -1
0_8b/xnnpack/config.json CHANGED
@@ -12,7 +12,71 @@
12
  "file": "qwen_3_5_0_8b_xnnpack_8da4w.pte",
13
  "precision": "8da4w",
14
  "quantized": true,
15
- "default": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  }
17
  ],
18
  "size": "0_8b"
 
12
  "file": "qwen_3_5_0_8b_xnnpack_8da4w.pte",
13
  "precision": "8da4w",
14
  "quantized": true,
15
+ "default": true,
16
+ "methods": {
17
+ "enable_dynamic_shape": {
18
+ "inputs": [],
19
+ "outputs": []
20
+ },
21
+ "forward": {
22
+ "inputs": [
23
+ {
24
+ "shape": [
25
+ 1,
26
+ 1
27
+ ],
28
+ "dtype": "int64"
29
+ },
30
+ {
31
+ "shape": [
32
+ 1
33
+ ],
34
+ "dtype": "int64"
35
+ }
36
+ ],
37
+ "outputs": [
38
+ {
39
+ "shape": [
40
+ 1,
41
+ 248320
42
+ ],
43
+ "dtype": "float32"
44
+ }
45
+ ]
46
+ },
47
+ "get_bos_id": {
48
+ "inputs": [],
49
+ "outputs": []
50
+ },
51
+ "get_eos_ids": {
52
+ "inputs": [],
53
+ "outputs": []
54
+ },
55
+ "get_max_context_len": {
56
+ "inputs": [],
57
+ "outputs": []
58
+ },
59
+ "get_max_seq_len": {
60
+ "inputs": [],
61
+ "outputs": []
62
+ },
63
+ "get_n_layers": {
64
+ "inputs": [],
65
+ "outputs": []
66
+ },
67
+ "get_vocab_size": {
68
+ "inputs": [],
69
+ "outputs": []
70
+ },
71
+ "use_kv_cache": {
72
+ "inputs": [],
73
+ "outputs": []
74
+ },
75
+ "use_sdpa_with_kv_cache": {
76
+ "inputs": [],
77
+ "outputs": []
78
+ }
79
+ }
80
  }
81
  ],
82
  "size": "0_8b"
2b/xnnpack/config.json CHANGED
@@ -12,7 +12,71 @@
12
  "file": "qwen_3_5_2b_xnnpack_8da4w.pte",
13
  "precision": "8da4w",
14
  "quantized": true,
15
- "default": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  }
17
  ],
18
  "size": "2b"
 
12
  "file": "qwen_3_5_2b_xnnpack_8da4w.pte",
13
  "precision": "8da4w",
14
  "quantized": true,
15
+ "default": true,
16
+ "methods": {
17
+ "enable_dynamic_shape": {
18
+ "inputs": [],
19
+ "outputs": []
20
+ },
21
+ "forward": {
22
+ "inputs": [
23
+ {
24
+ "shape": [
25
+ 1,
26
+ 1
27
+ ],
28
+ "dtype": "int64"
29
+ },
30
+ {
31
+ "shape": [
32
+ 1
33
+ ],
34
+ "dtype": "int64"
35
+ }
36
+ ],
37
+ "outputs": [
38
+ {
39
+ "shape": [
40
+ 1,
41
+ 248320
42
+ ],
43
+ "dtype": "float32"
44
+ }
45
+ ]
46
+ },
47
+ "get_bos_id": {
48
+ "inputs": [],
49
+ "outputs": []
50
+ },
51
+ "get_eos_ids": {
52
+ "inputs": [],
53
+ "outputs": []
54
+ },
55
+ "get_max_context_len": {
56
+ "inputs": [],
57
+ "outputs": []
58
+ },
59
+ "get_max_seq_len": {
60
+ "inputs": [],
61
+ "outputs": []
62
+ },
63
+ "get_n_layers": {
64
+ "inputs": [],
65
+ "outputs": []
66
+ },
67
+ "get_vocab_size": {
68
+ "inputs": [],
69
+ "outputs": []
70
+ },
71
+ "use_kv_cache": {
72
+ "inputs": [],
73
+ "outputs": []
74
+ },
75
+ "use_sdpa_with_kv_cache": {
76
+ "inputs": [],
77
+ "outputs": []
78
+ }
79
+ }
80
  }
81
  ],
82
  "size": "2b"