3morixd committed on
Commit
a2ff38e
·
verified ·
1 Parent(s): 79dd298

Upload models.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. models.json +250 -0
models.json ADDED
@@ -0,0 +1,250 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "name": "SmolLM2-135M-Instruct-mobile",
4
+ "repo_id": "dispatchAI/SmolLM2-135M-Instruct-mobile",
5
+ "chat_format": "llama-3",
6
+ "cpu_tps": 59.7,
7
+ "phone_tps": 46.0,
8
+ "size_mb": 0
9
+ },
10
+ {
11
+ "name": "Qwen2.5-0.5B-Instruct-mobile-int4",
12
+ "repo_id": "dispatchAI/Qwen2.5-0.5B-Instruct-mobile-int4",
13
+ "chat_format": "chatml",
14
+ "cpu_tps": 12.5,
15
+ "phone_tps": 23.2,
16
+ "size_mb": 0
17
+ },
18
+ {
19
+ "name": "Llama-3.2-1B-Instruct-Q4-mobile",
20
+ "repo_id": "dispatchAI/Llama-3.2-1B-Instruct-Q4-mobile",
21
+ "chat_format": "chatml",
22
+ "cpu_tps": 11.3,
23
+ "phone_tps": 5.4,
24
+ "size_mb": 0
25
+ },
26
+ {
27
+ "name": "Gemma-2B-Arabic-mobile",
28
+ "repo_id": "dispatchAI/Gemma-2B-Arabic-mobile",
29
+ "chat_format": "gemma",
30
+ "cpu_tps": 14.8,
31
+ "phone_tps": null,
32
+ "size_mb": 1554.7
33
+ },
34
+ {
35
+ "name": "Llama-3.2-1B-FunctionCall-mobile",
36
+ "repo_id": "dispatchAI/Llama-3.2-1B-FunctionCall-mobile",
37
+ "chat_format": "chatml",
38
+ "cpu_tps": 8.9,
39
+ "phone_tps": null,
40
+ "size_mb": 1925.8
41
+ },
42
+ {
43
+ "name": "Qwen2.5-1.5B-Instruct-mobile-int4",
44
+ "repo_id": "dispatchAI/Qwen2.5-1.5B-Instruct-mobile-int4",
45
+ "chat_format": "chatml",
46
+ "cpu_tps": 7.7,
47
+ "phone_tps": null,
48
+ "size_mb": 1065.6
49
+ },
50
+ {
51
+ "name": "TinyLlama-1.1B-Chat-mobile-int4",
52
+ "repo_id": "dispatchAI/TinyLlama-1.1B-Chat-mobile-int4",
53
+ "chat_format": "chatml",
54
+ "cpu_tps": 17.6,
55
+ "phone_tps": null,
56
+ "size_mb": 637.8
57
+ },
58
+ {
59
+ "name": "Llama-3.2-1B-Instruct-mobile",
60
+ "repo_id": "dispatchAI/Llama-3.2-1B-Instruct-mobile",
61
+ "chat_format": "llama-3",
62
+ "cpu_tps": 4.9,
63
+ "phone_tps": null,
64
+ "size_mb": 1259.9
65
+ },
66
+ {
67
+ "name": "Llama-3.2-3B-Instruct-mobile",
68
+ "repo_id": "dispatchAI/Llama-3.2-3B-Instruct-mobile",
69
+ "chat_format": "llama-3",
70
+ "cpu_tps": 4.8,
71
+ "phone_tps": null,
72
+ "size_mb": 1925.8
73
+ },
74
+ {
75
+ "name": "SmolLM2-1.7B-Instruct-mobile",
76
+ "repo_id": "dispatchAI/SmolLM2-1.7B-Instruct-mobile",
77
+ "chat_format": "chatml",
78
+ "cpu_tps": 18.7,
79
+ "phone_tps": null,
80
+ "size_mb": 1006.7
81
+ },
82
+ {
83
+ "name": "Gemma-2-2B-IT-mobile",
84
+ "repo_id": "dispatchAI/Gemma-2-2B-IT-mobile",
85
+ "chat_format": "gemma",
86
+ "cpu_tps": 8.2,
87
+ "phone_tps": null,
88
+ "size_mb": 1629.4
89
+ },
90
+ {
91
+ "name": "Phi-3.5-mini-Instruct-mobile",
92
+ "repo_id": "dispatchAI/Phi-3.5-mini-Instruct-mobile",
93
+ "chat_format": "chatml",
94
+ "cpu_tps": 8.6,
95
+ "phone_tps": null,
96
+ "size_mb": 2282.4
97
+ },
98
+ {
99
+ "name": "MiniCPM5-1B-mobile",
100
+ "repo_id": "dispatchAI/MiniCPM5-1B-mobile",
101
+ "chat_format": null,
102
+ "cpu_tps": 18.1,
103
+ "phone_tps": null,
104
+ "size_mb": 656.2
105
+ },
106
+ {
107
+ "name": "MiniCPM-V-4.6-mobile",
108
+ "repo_id": "dispatchAI/MiniCPM-V-4.6-mobile",
109
+ "chat_format": "chatml",
110
+ "cpu_tps": 23.4,
111
+ "phone_tps": null,
112
+ "size_mb": 504.6
113
+ },
114
+ {
115
+ "name": "Qwen2.5-Coder-7B-mobile",
116
+ "repo_id": "dispatchAI/Qwen2.5-Coder-7B-mobile",
117
+ "chat_format": "chatml",
118
+ "cpu_tps": 3.0,
119
+ "phone_tps": null,
120
+ "size_mb": 4466.1
121
+ },
122
+ {
123
+ "name": "Llama-3.2-3B-FunctionCall-mobile",
124
+ "repo_id": "dispatchAI/Llama-3.2-3B-FunctionCall-mobile",
125
+ "chat_format": "llama-3",
126
+ "cpu_tps": 9.1,
127
+ "phone_tps": null,
128
+ "size_mb": 1925.8
129
+ },
130
+ {
131
+ "name": "Qwen2.5-0.5B-Coder-mobile",
132
+ "repo_id": "dispatchAI/Qwen2.5-0.5B-Coder-mobile",
133
+ "chat_format": "chatml",
134
+ "cpu_tps": 8.0,
135
+ "phone_tps": null,
136
+ "size_mb": 379.4
137
+ },
138
+ {
139
+ "name": "MiniCPM5-1B-multilingual-mobile",
140
+ "repo_id": "dispatchAI/MiniCPM5-1B-multilingual-mobile",
141
+ "chat_format": null,
142
+ "cpu_tps": 18.4,
143
+ "phone_tps": null,
144
+ "size_mb": 656.2
145
+ },
146
+ {
147
+ "name": "Qwen2.5-0.5B-Chinese-mobile",
148
+ "repo_id": "dispatchAI/Qwen2.5-0.5B-Chinese-mobile",
149
+ "chat_format": "chatml",
150
+ "cpu_tps": 16.4,
151
+ "phone_tps": null,
152
+ "size_mb": 400.6
153
+ },
154
+ {
155
+ "name": "Phi-3.5-mini-instruct-Q5-mobile",
156
+ "repo_id": "dispatchAI/Phi-3.5-mini-instruct-Q5-mobile",
157
+ "chat_format": "chatml",
158
+ "cpu_tps": 7.0,
159
+ "phone_tps": null,
160
+ "size_mb": 2684.9
161
+ },
162
+ {
163
+ "name": "Qwen2.5-0.5B-Instruct-Server-mobile",
164
+ "repo_id": "dispatchAI/Qwen2.5-0.5B-Instruct-Server-mobile",
165
+ "chat_format": "chatml",
166
+ "cpu_tps": 16.7,
167
+ "phone_tps": null,
168
+ "size_mb": 482.3
169
+ },
170
+ {
171
+ "name": "TinyLlama-1.1B-Chat-Q5-mobile",
172
+ "repo_id": "dispatchAI/TinyLlama-1.1B-Chat-Q5-mobile",
173
+ "chat_format": "chatml",
174
+ "cpu_tps": 10.9,
175
+ "phone_tps": null,
176
+ "size_mb": 746.7
177
+ },
178
+ {
179
+ "name": "Gemma-2-2B-IT-Q5-mobile",
180
+ "repo_id": "dispatchAI/Gemma-2-2B-IT-Q5-mobile",
181
+ "chat_format": "gemma",
182
+ "cpu_tps": 5.7,
183
+ "phone_tps": null,
184
+ "size_mb": 1834.2
185
+ },
186
+ {
187
+ "name": "Llama-3.2-1B-Instruct-Q6-mobile",
188
+ "repo_id": "dispatchAI/Llama-3.2-1B-Instruct-Q6-mobile",
189
+ "chat_format": "llama-3",
190
+ "cpu_tps": 5.0,
191
+ "phone_tps": null,
192
+ "size_mb": 974.5
193
+ },
194
+ {
195
+ "name": "SmolLM2-360M-Instruct-mobile",
196
+ "repo_id": "dispatchAI/SmolLM2-360M-Instruct-mobile",
197
+ "chat_format": "chatml",
198
+ "cpu_tps": 29.1,
199
+ "phone_tps": null,
200
+ "size_mb": 258.1
201
+ },
202
+ {
203
+ "name": "SmolLM2-1.7B-Instruct-Q5-mobile",
204
+ "repo_id": "dispatchAI/SmolLM2-1.7B-Instruct-Q5-mobile",
205
+ "chat_format": "chatml",
206
+ "cpu_tps": 10.8,
207
+ "phone_tps": null,
208
+ "size_mb": 1168.7
209
+ },
210
+ {
211
+ "name": "Qwen2.5-Coder-1.5B-mobile",
212
+ "repo_id": "dispatchAI/Qwen2.5-Coder-1.5B-mobile",
213
+ "chat_format": "chatml",
214
+ "cpu_tps": 7.8,
215
+ "phone_tps": null,
216
+ "size_mb": 940.4
217
+ },
218
+ {
219
+ "name": "Qwen2.5-Math-1.5B-mobile",
220
+ "repo_id": "dispatchAI/Qwen2.5-Math-1.5B-mobile",
221
+ "chat_format": "chatml",
222
+ "cpu_tps": 15.7,
223
+ "phone_tps": null,
224
+ "size_mb": 940.4
225
+ },
226
+ {
227
+ "name": "Qwen2.5-1.5B-Instruct-Q5-mobile",
228
+ "repo_id": "dispatchAI/Qwen2.5-1.5B-Instruct-Q5-mobile",
229
+ "chat_format": "chatml",
230
+ "cpu_tps": 4.4,
231
+ "phone_tps": null,
232
+ "size_mb": 1072.9
233
+ },
234
+ {
235
+ "name": "Qwen2.5-1.5B-Instruct-Q8-mobile",
236
+ "repo_id": "dispatchAI/Qwen2.5-1.5B-Instruct-Q8-mobile",
237
+ "chat_format": "chatml",
238
+ "cpu_tps": 8.7,
239
+ "phone_tps": null,
240
+ "size_mb": 1570.3
241
+ },
242
+ {
243
+ "name": "Llama-3.2-3B-Instruct-Q5-mobile",
244
+ "repo_id": "dispatchAI/Llama-3.2-3B-Instruct-Q5-mobile",
245
+ "chat_format": "llama-3",
246
+ "cpu_tps": 2.6,
247
+ "phone_tps": null,
248
+ "size_mb": 2214.6
249
+ }
250
+ ]