CrispStrobe commited on
Commit
131ab2f
·
1 Parent(s): 6f9105d

feat: add HF IDs and sizes for Voxtral and new Mistral models

Browse files
Files changed (2) hide show
  1. data/providers.json +712 -695
  2. scripts/fetch-providers.js +17 -0
data/providers.json CHANGED
@@ -378,8 +378,8 @@
378
  "capabilities": [
379
  "tools"
380
  ],
381
- "size_b": 675,
382
- "hf_id": "mistralai/Mistral-Large-Instruct-2411",
383
  "hf_private": false,
384
  "ollama_id": "mistral-large",
385
  "size_source": "manual"
@@ -1154,14 +1154,29 @@
1154
  "hf_private": false
1155
  },
1156
  {
1157
- "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
1158
  "type": "chat",
1159
  "input_price_per_1m": 0.05,
1160
- "output_price_per_1m": 0.05,
1161
  "currency": "USD",
1162
- "context_window": 8192,
1163
- "size_b": 8,
1164
- "hf_private": false
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1165
  },
1166
  {
1167
  "name": "novita/meta-llama/llama-3.1-8b-instruct",
@@ -1188,40 +1203,25 @@
1188
  "hf_private": false
1189
  },
1190
  {
1191
- "name": "azure/gpt-5-nano",
1192
  "type": "chat",
1193
  "input_price_per_1m": 0.05,
1194
- "output_price_per_1m": 0.4,
1195
  "currency": "USD",
1196
- "capabilities": [
1197
- "reasoning"
1198
- ],
1199
- "context_window": 200000,
1200
- "hf_private": true
1201
  },
1202
  {
1203
- "name": "alibaba/qwen-turbo",
1204
  "type": "chat",
1205
  "input_price_per_1m": 0.05,
1206
- "output_price_per_1m": 0.2,
1207
- "currency": "USD",
1208
- "context_window": 1000000,
1209
- "capabilities": [
1210
- "tools"
1211
- ],
1212
- "hf_private": true
1213
- },
1214
- {
1215
- "name": "openai-responses/gpt-5-nano",
1216
- "type": "vision",
1217
- "input_price_per_1m": 0.05,
1218
  "output_price_per_1m": 0.4,
1219
  "currency": "USD",
1220
  "capabilities": [
1221
- "vision",
1222
  "reasoning"
1223
  ],
1224
- "context_window": 400000,
1225
  "hf_private": true
1226
  },
1227
  {
@@ -1235,26 +1235,26 @@
1235
  "hf_private": false
1236
  },
1237
  {
1238
- "name": "deepinfra/microsoft/phi-4",
1239
  "type": "chat",
1240
  "input_price_per_1m": 0.07,
1241
- "output_price_per_1m": 0.14,
1242
  "currency": "USD",
1243
  "context_window": 16384,
1244
- "hf_private": false,
1245
- "size_b": 14,
1246
- "size_source": "manual",
1247
- "hf_id": "microsoft/phi-4"
1248
  },
1249
  {
1250
- "name": "deepinfra/Qwen/Qwen2.5-Coder-32B-Instruct",
1251
  "type": "chat",
1252
  "input_price_per_1m": 0.07,
1253
- "output_price_per_1m": 0.16,
1254
  "currency": "USD",
1255
  "context_window": 16384,
1256
- "size_b": 32,
1257
- "hf_private": false
 
 
1258
  },
1259
  {
1260
  "name": "novita/gryphe/mythomax-l2-13b",
@@ -1268,7 +1268,7 @@
1268
  "hf_private": false
1269
  },
1270
  {
1271
- "name": "openai/gpt-4.1-nano",
1272
  "type": "vision",
1273
  "input_price_per_1m": 0.1,
1274
  "output_price_per_1m": 0.4,
@@ -1280,22 +1280,19 @@
1280
  "hf_private": true
1281
  },
1282
  {
1283
- "name": "deepinfra/Qwen/Qwen3-32B",
1284
- "type": "chat",
1285
  "input_price_per_1m": 0.1,
1286
- "output_price_per_1m": 0.3,
1287
  "currency": "USD",
1288
- "context_window": 40000,
1289
- "size_b": 32,
1290
  "capabilities": [
1291
- "tools",
1292
- "reasoning"
1293
  ],
1294
- "hf_id": "Qwen/Qwen3-32B",
1295
- "hf_private": false
1296
  },
1297
  {
1298
- "name": "azure/gpt-4.1-nano",
1299
  "type": "vision",
1300
  "input_price_per_1m": 0.1,
1301
  "output_price_per_1m": 0.4,
@@ -1303,38 +1300,49 @@
1303
  "capabilities": [
1304
  "vision"
1305
  ],
1306
- "context_window": 1047576,
1307
  "hf_private": true
1308
  },
1309
  {
1310
- "name": "azure/openai-responses/gpt-4.1-nano",
1311
  "type": "vision",
1312
  "input_price_per_1m": 0.1,
1313
  "output_price_per_1m": 0.4,
1314
  "currency": "USD",
1315
  "capabilities": [
1316
- "vision"
 
1317
  ],
1318
- "context_window": 1047576,
1319
  "hf_private": true
1320
  },
1321
  {
1322
- "name": "groq/openai/gpt-oss-20b",
1323
  "type": "chat",
1324
  "input_price_per_1m": 0.1,
1325
- "output_price_per_1m": 0.5,
1326
  "currency": "USD",
1327
- "context_window": 131072,
1328
- "size_b": 20,
 
 
 
 
 
 
 
 
 
 
1329
  "capabilities": [
1330
  "tools",
1331
  "reasoning"
1332
  ],
1333
- "hf_id": "openai/gpt-oss-20b",
1334
  "hf_private": false
1335
  },
1336
  {
1337
- "name": "google/gemini-2.5-flash-lite",
1338
  "type": "vision",
1339
  "input_price_per_1m": 0.1,
1340
  "output_price_per_1m": 0.4,
@@ -1347,7 +1355,7 @@
1347
  "hf_private": true
1348
  },
1349
  {
1350
- "name": "google/gemini-2.0-flash-001",
1351
  "type": "vision",
1352
  "input_price_per_1m": 0.1,
1353
  "output_price_per_1m": 0.4,
@@ -1355,11 +1363,11 @@
1355
  "capabilities": [
1356
  "vision"
1357
  ],
1358
- "context_window": 1048576,
1359
  "hf_private": true
1360
  },
1361
  {
1362
- "name": "openai-responses/gpt-4.1-nano",
1363
  "type": "vision",
1364
  "input_price_per_1m": 0.1,
1365
  "output_price_per_1m": 0.4,
@@ -1371,29 +1379,22 @@
1371
  "hf_private": true
1372
  },
1373
  {
1374
- "name": "vertex/gemini-2.5-flash-lite",
1375
- "type": "vision",
1376
  "input_price_per_1m": 0.1,
1377
- "output_price_per_1m": 0.4,
1378
  "currency": "USD",
 
 
1379
  "capabilities": [
1380
- "vision",
1381
  "reasoning"
1382
  ],
1383
- "context_window": 1048576,
1384
- "hf_private": true
1385
- },
1386
- {
1387
- "name": "mistral/mistral-small-2503",
1388
- "type": "chat",
1389
- "input_price_per_1m": 0.1,
1390
- "output_price_per_1m": 0.3,
1391
- "currency": "USD",
1392
- "context_window": 32768,
1393
- "hf_private": true
1394
  },
1395
  {
1396
- "name": "mistral/devstral-small-latest",
1397
  "type": "chat",
1398
  "input_price_per_1m": 0.1,
1399
  "output_price_per_1m": 0.3,
@@ -1407,7 +1408,7 @@
1407
  "hf_private": false
1408
  },
1409
  {
1410
- "name": "mistral/devstral-small-2507",
1411
  "type": "chat",
1412
  "input_price_per_1m": 0.1,
1413
  "output_price_per_1m": 0.3,
@@ -1421,14 +1422,13 @@
1421
  "hf_private": false
1422
  },
1423
  {
1424
- "name": "together/meta-llama/Meta-Llama-3-8B-Instruct-Lite",
1425
  "type": "chat",
1426
  "input_price_per_1m": 0.1,
1427
- "output_price_per_1m": 0.1,
1428
  "currency": "USD",
1429
- "context_window": 8192,
1430
- "size_b": 8,
1431
- "hf_private": false
1432
  },
1433
  {
1434
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo",
@@ -1508,6 +1508,16 @@
1508
  "hf_id": "openai/gpt-oss-120b",
1509
  "hf_private": false
1510
  },
 
 
 
 
 
 
 
 
 
 
1511
  {
1512
  "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
1513
  "type": "chat",
@@ -1524,16 +1534,6 @@
1524
  "size_source": "manual",
1525
  "hf_private": false
1526
  },
1527
- {
1528
- "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1529
- "type": "chat",
1530
- "input_price_per_1m": 0.15,
1531
- "output_price_per_1m": 0.85,
1532
- "currency": "USD",
1533
- "context_window": 262144,
1534
- "size_b": 235,
1535
- "hf_private": false
1536
- },
1537
  {
1538
  "name": "groq/openai/gpt-oss-120b",
1539
  "type": "chat",
@@ -1550,7 +1550,7 @@
1550
  "hf_private": false
1551
  },
1552
  {
1553
- "name": "mistral/mistral-small-2603",
1554
  "type": "vision",
1555
  "input_price_per_1m": 0.15,
1556
  "output_price_per_1m": 0.6,
@@ -1560,12 +1560,10 @@
1560
  "reasoning"
1561
  ],
1562
  "context_window": 256000,
1563
- "size_b": 119,
1564
- "hf_id": "mistralai/Mistral-Small-4-119B-2603",
1565
- "hf_private": false
1566
  },
1567
  {
1568
- "name": "mistral/mistral-small-latest",
1569
  "type": "vision",
1570
  "input_price_per_1m": 0.15,
1571
  "output_price_per_1m": 0.6,
@@ -1575,7 +1573,9 @@
1575
  "reasoning"
1576
  ],
1577
  "context_window": 256000,
1578
- "hf_private": true
 
 
1579
  },
1580
  {
1581
  "name": "novita/mistralai/mistral-nemo",
@@ -1601,6 +1601,33 @@
1601
  "size_b": 8,
1602
  "hf_private": false
1603
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1604
  {
1605
  "name": "openai/gpt-5.4-nano",
1606
  "type": "vision",
@@ -1644,18 +1671,6 @@
1644
  "hf_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct",
1645
  "hf_private": false
1646
  },
1647
- {
1648
- "name": "xai/grok-code-fast-1",
1649
- "type": "vision",
1650
- "input_price_per_1m": 0.2,
1651
- "output_price_per_1m": 1.5,
1652
- "currency": "USD",
1653
- "capabilities": [
1654
- "vision"
1655
- ],
1656
- "context_window": 256000,
1657
- "hf_private": true
1658
- },
1659
  {
1660
  "name": "xai/grok-4-fast-non-reasoning",
1661
  "type": "chat",
@@ -1670,6 +1685,18 @@
1670
  ],
1671
  "hf_private": true
1672
  },
 
 
 
 
 
 
 
 
 
 
 
 
1673
  {
1674
  "name": "xai/grok-4-fast",
1675
  "type": "chat",
@@ -1709,18 +1736,13 @@
1709
  "hf_private": true
1710
  },
1711
  {
1712
- "name": "deepinfra/Qwen/Qwen3-235B-A22B",
1713
  "type": "chat",
1714
  "input_price_per_1m": 0.2,
1715
- "output_price_per_1m": 0.6,
1716
  "currency": "USD",
1717
- "context_window": 40000,
1718
- "size_b": 235,
1719
- "capabilities": [
1720
- "tools",
1721
- "reasoning"
1722
- ],
1723
- "hf_id": "Qwen/Qwen3-235B-A22B",
1724
  "hf_private": false
1725
  },
1726
  {
@@ -1739,78 +1761,46 @@
1739
  "hf_private": false
1740
  },
1741
  {
1742
- "name": "alibaba/qwen3-30b-a3b-instruct-2507",
1743
- "type": "vision",
1744
- "input_price_per_1m": 0.2,
1745
- "output_price_per_1m": 0.8,
1746
- "currency": "USD",
1747
- "capabilities": [
1748
- "vision"
1749
- ],
1750
- "context_window": 131072,
1751
- "size_b": 30,
1752
- "hf_id": "Qwen/Qwen3-30B-A3B-Instruct-2507",
1753
- "hf_private": false
1754
- },
1755
- {
1756
- "name": "openai-responses/gpt-5.4-nano",
1757
- "type": "vision",
1758
  "input_price_per_1m": 0.2,
1759
- "output_price_per_1m": 1.25,
1760
  "currency": "USD",
 
 
1761
  "capabilities": [
1762
- "vision",
1763
  "reasoning"
1764
  ],
1765
- "context_window": 400000,
1766
- "hf_private": true
1767
- },
1768
- {
1769
- "name": "together/meta-llama/LlamaGuard-2-8b",
1770
- "type": "chat",
1771
- "input_price_per_1m": 0.2,
1772
- "output_price_per_1m": 0.2,
1773
- "currency": "USD",
1774
- "context_window": 8192,
1775
- "size_b": 8,
1776
  "hf_private": false
1777
  },
1778
  {
1779
- "name": "deepinfra/Qwen/Qwen2.5-72B-Instruct",
1780
  "type": "chat",
1781
  "input_price_per_1m": 0.23,
1782
  "output_price_per_1m": 0.4,
1783
  "currency": "USD",
1784
  "context_window": 131072,
1785
- "size_b": 72,
1786
  "capabilities": [
1787
- "vision"
1788
  ],
1789
- "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
1790
- "hf_private": false
1791
- },
1792
- {
1793
- "name": "deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct",
1794
- "type": "chat",
1795
- "input_price_per_1m": 0.23,
1796
- "output_price_per_1m": 0.4,
1797
- "currency": "USD",
1798
- "context_window": 130815,
1799
- "size_b": 70,
1800
  "hf_private": false
1801
  },
1802
  {
1803
- "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct",
1804
  "type": "chat",
1805
  "input_price_per_1m": 0.23,
1806
  "output_price_per_1m": 0.4,
1807
  "currency": "USD",
1808
  "context_window": 131072,
1809
- "size_b": 70,
1810
  "capabilities": [
1811
- "tools"
1812
  ],
1813
- "hf_id": "meta-llama/Llama-3.3-70B-Instruct",
1814
  "hf_private": false
1815
  },
1816
  {
@@ -1828,15 +1818,26 @@
1828
  "hf_private": false
1829
  },
1830
  {
1831
- "name": "azure/gpt-5-mini",
1832
  "type": "chat",
 
 
 
 
 
 
 
 
 
 
1833
  "input_price_per_1m": 0.25,
1834
  "output_price_per_1m": 2,
1835
  "currency": "USD",
1836
  "capabilities": [
 
1837
  "reasoning"
1838
  ],
1839
- "context_window": 200000,
1840
  "hf_private": true
1841
  },
1842
  {
@@ -1852,28 +1853,27 @@
1852
  "hf_private": true
1853
  },
1854
  {
1855
- "name": "openai-responses/gpt-5-mini",
1856
  "type": "vision",
1857
  "input_price_per_1m": 0.25,
1858
- "output_price_per_1m": 2,
1859
  "currency": "USD",
1860
  "capabilities": [
1861
- "vision",
1862
- "reasoning"
1863
  ],
1864
- "context_window": 400000,
1865
  "hf_private": true
1866
  },
1867
  {
1868
- "name": "vertex/gemini-3.1-flash-lite-preview",
1869
- "type": "vision",
1870
  "input_price_per_1m": 0.25,
1871
- "output_price_per_1m": 1.5,
1872
  "currency": "USD",
1873
  "capabilities": [
1874
- "vision"
1875
  ],
1876
- "context_window": 1048576,
1877
  "hf_private": true
1878
  },
1879
  {
@@ -1924,6 +1924,18 @@
1924
  "context_window": 128000,
1925
  "hf_private": true
1926
  },
 
 
 
 
 
 
 
 
 
 
 
 
1927
  {
1928
  "name": "nebius/deepseek-ai/DeepSeek-V3.2",
1929
  "type": "chat",
@@ -1953,23 +1965,30 @@
1953
  "hf_private": false
1954
  },
1955
  {
1956
- "name": "novita/minimax-m2.7",
 
 
 
 
 
 
 
 
 
 
1957
  "type": "vision",
1958
  "input_price_per_1m": 0.3,
1959
- "output_price_per_1m": 1.2,
1960
  "currency": "USD",
1961
  "capabilities": [
1962
  "vision",
1963
  "reasoning"
1964
  ],
1965
- "context_window": 200000,
1966
- "hf_id": "MiniMaxAI/MiniMax-M2.7",
1967
- "hf_private": false,
1968
- "size_b": 230,
1969
- "size_source": "manual"
1970
  },
1971
  {
1972
- "name": "novita/MiniMax-M2.7",
1973
  "type": "vision",
1974
  "input_price_per_1m": 0.3,
1975
  "output_price_per_1m": 1.2,
@@ -1999,22 +2018,7 @@
1999
  "hf_private": false
2000
  },
2001
  {
2002
- "name": "minimaxi/MiniMax-M2.5",
2003
- "type": "vision",
2004
- "input_price_per_1m": 0.3,
2005
- "output_price_per_1m": 1.2,
2006
- "currency": "USD",
2007
- "capabilities": [
2008
- "vision",
2009
- "reasoning"
2010
- ],
2011
- "context_window": 200000,
2012
- "hf_id": "MiniMaxAI/MiniMax-M2.5",
2013
- "size_b": 228.7,
2014
- "hf_private": false
2015
- },
2016
- {
2017
- "name": "minimaxi/MiniMax-M2.7",
2018
  "type": "vision",
2019
  "input_price_per_1m": 0.3,
2020
  "output_price_per_1m": 1.2,
@@ -2030,31 +2034,26 @@
2030
  "size_source": "manual"
2031
  },
2032
  {
2033
- "name": "minimaxi/MiniMax-M2",
2034
  "type": "chat",
2035
  "input_price_per_1m": 0.3,
2036
- "output_price_per_1m": 1.2,
2037
  "currency": "USD",
2038
- "context_window": 200000,
2039
  "capabilities": [
2040
- "tools",
2041
  "reasoning"
2042
  ],
2043
- "hf_id": "MiniMaxAI/MiniMax-M2",
2044
- "size_b": 228.7,
2045
- "hf_private": false
2046
  },
2047
  {
2048
- "name": "xai/grok-3-mini",
2049
  "type": "chat",
2050
  "input_price_per_1m": 0.3,
2051
- "output_price_per_1m": 0.5,
2052
  "currency": "USD",
2053
- "capabilities": [
2054
- "reasoning"
2055
- ],
2056
- "context_window": 131072,
2057
- "hf_private": true
2058
  },
2059
  {
2060
  "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
@@ -2072,7 +2071,7 @@
2072
  "hf_private": false
2073
  },
2074
  {
2075
- "name": "coding/gemini-2.5-flash",
2076
  "type": "vision",
2077
  "input_price_per_1m": 0.3,
2078
  "output_price_per_1m": 2.5,
@@ -2085,29 +2084,20 @@
2085
  "hf_private": true
2086
  },
2087
  {
2088
- "name": "parasail/parasail-gemma3-27b-it",
2089
- "type": "chat",
2090
- "input_price_per_1m": 0.3,
2091
- "output_price_per_1m": 0.5,
2092
- "currency": "USD",
2093
- "context_window": 128000,
2094
- "size_b": 27,
2095
- "hf_private": false
2096
- },
2097
- {
2098
- "name": "alibaba/qwen3-coder-flash",
2099
  "type": "vision",
2100
  "input_price_per_1m": 0.3,
2101
- "output_price_per_1m": 1.5,
2102
  "currency": "USD",
2103
  "capabilities": [
2104
- "vision"
 
2105
  ],
2106
  "context_window": 1048576,
2107
  "hf_private": true
2108
  },
2109
  {
2110
- "name": "google/gemini-2.5-flash",
2111
  "type": "vision",
2112
  "input_price_per_1m": 0.3,
2113
  "output_price_per_1m": 2.5,
@@ -2120,48 +2110,58 @@
2120
  "hf_private": true
2121
  },
2122
  {
2123
- "name": "vertex/gemini-2.5-flash",
2124
- "type": "vision",
2125
  "input_price_per_1m": 0.3,
2126
- "output_price_per_1m": 2.5,
2127
  "currency": "USD",
2128
- "capabilities": [
2129
- "vision",
2130
- "reasoning"
2131
- ],
2132
- "context_window": 1048576,
2133
  "hf_private": true
2134
  },
2135
  {
2136
- "name": "vertex/gemini-2.5-flash-image",
2137
- "type": "vision",
2138
  "input_price_per_1m": 0.3,
2139
- "output_price_per_1m": 2.5,
2140
  "currency": "USD",
 
2141
  "capabilities": [
2142
- "vision",
2143
  "reasoning"
2144
  ],
2145
- "context_window": 1048576,
2146
- "hf_private": true
 
2147
  },
2148
  {
2149
- "name": "mistral/codestral-latest",
2150
- "type": "chat",
2151
  "input_price_per_1m": 0.3,
2152
- "output_price_per_1m": 0.9,
2153
  "currency": "USD",
2154
- "context_window": 131072,
2155
- "hf_private": true
 
 
 
 
 
 
 
2156
  },
2157
  {
2158
- "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
2159
- "type": "chat",
2160
  "input_price_per_1m": 0.3,
2161
- "output_price_per_1m": 0.3,
2162
  "currency": "USD",
2163
- "context_window": 32768,
2164
- "size_b": 7,
 
 
 
 
 
2165
  "hf_private": false
2166
  },
2167
  {
@@ -2203,7 +2203,19 @@
2203
  "hf_private": false
2204
  },
2205
  {
2206
- "name": "openai/gpt-4.1-mini",
 
 
 
 
 
 
 
 
 
 
 
 
2207
  "type": "vision",
2208
  "input_price_per_1m": 0.4,
2209
  "output_price_per_1m": 1.6,
@@ -2215,18 +2227,16 @@
2215
  "hf_private": true
2216
  },
2217
  {
2218
- "name": "nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2219
- "type": "chat",
2220
  "input_price_per_1m": 0.4,
2221
- "output_price_per_1m": 1.8,
2222
  "currency": "USD",
2223
- "context_window": 262000,
2224
- "size_b": 480,
2225
  "capabilities": [
2226
- "tools"
2227
  ],
2228
- "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
2229
- "hf_private": false
2230
  },
2231
  {
2232
  "name": "nebius/zai-org/GLM-4.7",
@@ -2243,18 +2253,17 @@
2243
  "hf_private": false
2244
  },
2245
  {
2246
- "name": "novita/deepseek/deepseek-v3-0324",
2247
  "type": "chat",
2248
  "input_price_per_1m": 0.4,
2249
- "output_price_per_1m": 1.3,
2250
  "currency": "USD",
2251
- "context_window": 128000,
 
2252
  "capabilities": [
2253
- "tools",
2254
- "reasoning"
2255
  ],
2256
- "size_b": 685,
2257
- "hf_id": "deepseek-ai/DeepSeek-V3-0324",
2258
  "hf_private": false
2259
  },
2260
  {
@@ -2266,6 +2275,21 @@
2266
  "context_window": 128000,
2267
  "hf_private": true
2268
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2269
  {
2270
  "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2271
  "type": "chat",
@@ -2305,27 +2329,24 @@
2305
  "hf_private": true
2306
  },
2307
  {
2308
- "name": "alibaba/qwen-plus",
2309
  "type": "chat",
2310
  "input_price_per_1m": 0.4,
2311
- "output_price_per_1m": 1.2,
2312
  "currency": "USD",
2313
  "context_window": 131072,
2314
- "capabilities": [
2315
- "tools"
2316
- ],
2317
  "hf_private": true
2318
  },
2319
  {
2320
- "name": "openai-responses/gpt-4.1-mini",
2321
- "type": "vision",
2322
  "input_price_per_1m": 0.4,
2323
- "output_price_per_1m": 1.6,
2324
  "currency": "USD",
 
2325
  "capabilities": [
2326
- "vision"
2327
  ],
2328
- "context_window": 1047576,
2329
  "hf_private": true
2330
  },
2331
  {
@@ -2338,25 +2359,19 @@
2338
  "hf_private": true
2339
  },
2340
  {
2341
- "name": "mistral/mistral-medium-latest",
2342
- "type": "chat",
2343
- "input_price_per_1m": 0.4,
2344
- "output_price_per_1m": 2,
2345
- "currency": "USD",
2346
- "context_window": 131072,
2347
- "hf_private": true
2348
- },
2349
- {
2350
- "name": "mistral/devstral-medium-2507",
2351
  "type": "chat",
2352
- "input_price_per_1m": 0.4,
2353
- "output_price_per_1m": 2,
2354
  "currency": "USD",
2355
- "context_window": 131072,
2356
  "capabilities": [
2357
- "tools"
 
2358
  ],
2359
- "hf_private": true
 
 
2360
  },
2361
  {
2362
  "name": "nebius/moonshotai/Kimi-K2-Instruct",
@@ -2369,22 +2384,7 @@
2369
  "tools"
2370
  ],
2371
  "hf_id": "moonshotai/Kimi-K2-Instruct",
2372
- "size_b": 1026.5,
2373
- "hf_private": false
2374
- },
2375
- {
2376
- "name": "nebius/deepseek-ai/DeepSeek-V3-0324",
2377
- "type": "chat",
2378
- "input_price_per_1m": 0.5,
2379
- "output_price_per_1m": 1.5,
2380
- "currency": "USD",
2381
- "context_window": 128000,
2382
- "capabilities": [
2383
- "tools",
2384
- "reasoning"
2385
- ],
2386
- "size_b": 685,
2387
- "hf_id": "deepseek-ai/DeepSeek-V3-0324",
2388
  "hf_private": false
2389
  },
2390
  {
@@ -2429,29 +2429,29 @@
2429
  "hf_private": true
2430
  },
2431
  {
2432
- "name": "vertex/gemini-3-flash-preview",
2433
  "type": "vision",
2434
  "input_price_per_1m": 0.5,
2435
- "output_price_per_1m": 3,
2436
  "currency": "USD",
2437
  "capabilities": [
2438
  "vision",
2439
  "reasoning"
2440
  ],
2441
- "context_window": 1048576,
2442
  "hf_private": true
2443
  },
2444
  {
2445
- "name": "vertex/gemini-3.1-flash-image-preview",
2446
  "type": "vision",
2447
  "input_price_per_1m": 0.5,
2448
- "output_price_per_1m": 2,
2449
  "currency": "USD",
2450
  "capabilities": [
2451
  "vision",
2452
  "reasoning"
2453
  ],
2454
- "context_window": 131072,
2455
  "hf_private": true
2456
  },
2457
  {
@@ -2521,6 +2521,21 @@
2521
  "size_b": 1026.5,
2522
  "hf_private": false
2523
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2524
  {
2525
  "name": "nebius/zai-org/GLM-4.5",
2526
  "type": "chat",
@@ -2567,48 +2582,45 @@
2567
  "hf_private": false
2568
  },
2569
  {
2570
- "name": "minimaxi/MiniMax-M2.5-highspeed",
2571
- "type": "vision",
2572
  "input_price_per_1m": 0.6,
2573
- "output_price_per_1m": 2.4,
2574
  "currency": "USD",
 
2575
  "capabilities": [
2576
- "vision",
2577
  "reasoning"
2578
  ],
2579
- "context_window": 200000,
2580
- "hf_id": "MiniMaxAI/MiniMax-M2.5",
2581
- "size_b": 228.7,
2582
  "hf_private": false
2583
  },
2584
  {
2585
- "name": "minimaxi/MiniMax-M2.7-highspeed",
2586
- "type": "vision",
2587
  "input_price_per_1m": 0.6,
2588
- "output_price_per_1m": 2.4,
2589
  "currency": "USD",
2590
  "capabilities": [
2591
- "vision",
2592
  "reasoning"
2593
  ],
2594
  "context_window": 200000,
2595
- "hf_id": "MiniMaxAI/MiniMax-M2.7",
2596
- "hf_private": false,
2597
- "size_b": 230,
2598
- "size_source": "manual"
2599
  },
2600
  {
2601
- "name": "deepinfra/zai-org/GLM-4.5",
2602
  "type": "chat",
2603
  "input_price_per_1m": 0.6,
2604
  "output_price_per_1m": 2.2,
2605
  "currency": "USD",
2606
- "context_window": 131072,
2607
  "capabilities": [
2608
- "tools",
2609
  "reasoning"
2610
  ],
2611
- "hf_id": "zai-org/GLM-4.5",
 
2612
  "size_b": 358.3,
2613
  "hf_private": false
2614
  },
@@ -2627,46 +2639,48 @@
2627
  "hf_private": false
2628
  },
2629
  {
2630
- "name": "zai/GLM-4.6",
2631
- "type": "chat",
2632
  "input_price_per_1m": 0.6,
2633
- "output_price_per_1m": 2.2,
2634
  "currency": "USD",
2635
  "capabilities": [
 
2636
  "reasoning"
2637
  ],
2638
  "context_window": 200000,
2639
- "hf_id": "zai-org/GLM-4.6",
2640
- "size_b": 356.8,
2641
- "hf_private": false
 
2642
  },
2643
  {
2644
- "name": "zai/GLM-4.7",
2645
- "type": "chat",
2646
  "input_price_per_1m": 0.6,
2647
- "output_price_per_1m": 2.2,
2648
  "currency": "USD",
2649
  "capabilities": [
 
2650
  "reasoning"
2651
  ],
2652
  "context_window": 200000,
2653
- "hf_id": "zai-org/GLM-4.7",
2654
- "size_b": 358.3,
2655
  "hf_private": false
2656
  },
2657
  {
2658
- "name": "alibaba/qwen3.5",
2659
- "type": "vision",
2660
  "input_price_per_1m": 0.6,
2661
- "output_price_per_1m": 3.6,
2662
  "currency": "USD",
 
2663
  "capabilities": [
2664
- "vision",
2665
- "reasoning"
2666
  ],
2667
- "context_window": 256000,
2668
- "size_b": 9,
2669
- "hf_id": "Qwen/Qwen3.5-9B",
2670
  "hf_private": false
2671
  },
2672
  {
@@ -2727,20 +2741,6 @@
2727
  "size_b": 1026.5,
2728
  "hf_private": false
2729
  },
2730
- {
2731
- "name": "moonshot/kimi-k2-thinking",
2732
- "type": "chat",
2733
- "input_price_per_1m": 0.6,
2734
- "output_price_per_1m": 2.5,
2735
- "currency": "USD",
2736
- "context_window": 131072,
2737
- "capabilities": [
2738
- "tools"
2739
- ],
2740
- "hf_id": "moonshotai/Kimi-K2-Instruct",
2741
- "size_b": 1026.5,
2742
- "hf_private": false
2743
- },
2744
  {
2745
  "name": "novita/microsoft/wizardlm-2-8x22b",
2746
  "type": "chat",
@@ -2765,6 +2765,19 @@
2765
  "context_window": 400000,
2766
  "hf_private": true
2767
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
2768
  {
2769
  "name": "novita/deepseek/deepseek-r1-turbo",
2770
  "type": "chat",
@@ -2792,20 +2805,7 @@
2792
  "hf_private": false
2793
  },
2794
  {
2795
- "name": "parasail/parasail-qwen25-vl-72b-instruct",
2796
- "type": "vision",
2797
- "input_price_per_1m": 0.7,
2798
- "output_price_per_1m": 0.7,
2799
- "currency": "USD",
2800
- "capabilities": [
2801
- "vision"
2802
- ],
2803
- "context_window": 32768,
2804
- "size_b": 72,
2805
- "hf_private": false
2806
- },
2807
- {
2808
- "name": "openai/gpt-5.4-mini",
2809
  "type": "vision",
2810
  "input_price_per_1m": 0.75,
2811
  "output_price_per_1m": 4.5,
@@ -2818,7 +2818,7 @@
2818
  "hf_private": true
2819
  },
2820
  {
2821
- "name": "openai-responses/gpt-5.4-mini",
2822
  "type": "vision",
2823
  "input_price_per_1m": 0.75,
2824
  "output_price_per_1m": 4.5,
@@ -2846,31 +2846,31 @@
2846
  "hf_private": false
2847
  },
2848
  {
2849
- "name": "novita/deepseek/deepseek-r1-distill-llama-70b",
2850
  "type": "chat",
2851
  "input_price_per_1m": 0.8,
2852
  "output_price_per_1m": 0.8,
2853
  "currency": "USD",
2854
- "context_window": 32000,
2855
- "size_b": 70,
2856
  "capabilities": [
2857
- "reasoning"
2858
  ],
2859
- "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
2860
  "hf_private": false
2861
  },
2862
  {
2863
- "name": "novita/qwen/qwen2.5-vl-72b-instruct",
2864
  "type": "chat",
2865
  "input_price_per_1m": 0.8,
2866
  "output_price_per_1m": 0.8,
2867
  "currency": "USD",
2868
- "context_window": 96000,
2869
- "size_b": 72,
2870
  "capabilities": [
2871
- "vision"
2872
  ],
2873
- "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
2874
  "hf_private": false
2875
  },
2876
  {
@@ -2884,34 +2884,34 @@
2884
  "hf_private": false
2885
  },
2886
  {
2887
- "name": "deepinfra/deepseek-ai/DeepSeek-R1",
2888
  "type": "chat",
2889
  "input_price_per_1m": 0.85,
2890
- "output_price_per_1m": 2.5,
2891
  "currency": "USD",
2892
- "context_window": 64000,
2893
  "capabilities": [
2894
  "tools",
2895
  "reasoning"
2896
  ],
2897
- "hf_id": "deepseek-ai/DeepSeek-R1",
2898
  "size_b": 671,
2899
- "size_source": "manual",
2900
  "hf_private": false
2901
  },
2902
  {
2903
- "name": "deepinfra/deepseek-ai/DeepSeek-V3",
2904
  "type": "chat",
2905
  "input_price_per_1m": 0.85,
2906
- "output_price_per_1m": 0.9,
2907
  "currency": "USD",
2908
- "context_window": 128000,
2909
  "capabilities": [
2910
  "tools",
2911
  "reasoning"
2912
  ],
2913
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2914
  "size_b": 671,
 
2915
  "hf_private": false
2916
  },
2917
  {
@@ -2927,27 +2927,27 @@
2927
  "hf_private": true
2928
  },
2929
  {
2930
- "name": "together/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
2931
  "type": "chat",
2932
  "input_price_per_1m": 0.88,
2933
  "output_price_per_1m": 0.88,
2934
  "currency": "USD",
2935
  "context_window": 131072,
2936
  "size_b": 70,
 
 
 
 
2937
  "hf_private": false
2938
  },
2939
  {
2940
- "name": "together/meta-llama/Llama-3.3-70B-Instruct-Turbo",
2941
  "type": "chat",
2942
  "input_price_per_1m": 0.88,
2943
  "output_price_per_1m": 0.88,
2944
  "currency": "USD",
2945
  "context_window": 131072,
2946
  "size_b": 70,
2947
- "capabilities": [
2948
- "tools"
2949
- ],
2950
- "hf_id": "meta-llama/Llama-3.3-70B-Instruct",
2951
  "hf_private": false
2952
  },
2953
  {
@@ -2974,6 +2974,18 @@
2974
  "context_window": 131072,
2975
  "hf_private": true
2976
  },
 
 
 
 
 
 
 
 
 
 
 
 
2977
  {
2978
  "name": "openai/o3",
2979
  "type": "vision",
@@ -2988,36 +3000,31 @@
2988
  "hf_private": true
2989
  },
2990
  {
2991
- "name": "novita/GLM-5",
2992
  "type": "chat",
2993
  "input_price_per_1m": 1,
2994
- "output_price_per_1m": 3.2,
2995
  "currency": "USD",
 
2996
  "capabilities": [
2997
- "reasoning"
2998
  ],
2999
- "context_window": 202800,
3000
- "hf_id": "zai-org/GLM-5",
3001
- "size_b": 753.9,
3002
- "hf_private": false
3003
  },
3004
  {
3005
- "name": "zai/GLM-5",
3006
  "type": "vision",
3007
  "input_price_per_1m": 1,
3008
- "output_price_per_1m": 3.2,
3009
  "currency": "USD",
3010
  "capabilities": [
3011
- "vision",
3012
- "reasoning"
3013
  ],
3014
  "context_window": 200000,
3015
- "hf_id": "zai-org/GLM-5",
3016
- "size_b": 753.9,
3017
- "hf_private": false
3018
  },
3019
  {
3020
- "name": "bedrock/claude-haiku-4-5",
3021
  "type": "vision",
3022
  "input_price_per_1m": 1,
3023
  "output_price_per_1m": 5,
@@ -3029,7 +3036,21 @@
3029
  "hf_private": true
3030
  },
3031
  {
3032
- "name": "alibaba/qwen3-coder-plus",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3033
  "type": "vision",
3034
  "input_price_per_1m": 1,
3035
  "output_price_per_1m": 5,
@@ -3037,21 +3058,22 @@
3037
  "capabilities": [
3038
  "vision"
3039
  ],
3040
- "context_window": 1048576,
3041
  "hf_private": true
3042
  },
3043
  {
3044
- "name": "groq/moonshotai/kimi-k2-instruct",
3045
- "type": "chat",
3046
  "input_price_per_1m": 1,
3047
- "output_price_per_1m": 3,
3048
  "currency": "USD",
3049
- "context_window": 131072,
3050
  "capabilities": [
3051
- "tools"
 
3052
  ],
3053
- "hf_id": "moonshotai/Kimi-K2-Instruct",
3054
- "size_b": 1026.5,
 
3055
  "hf_private": false
3056
  },
3057
  {
@@ -3069,43 +3091,21 @@
3069
  "hf_private": false
3070
  },
3071
  {
3072
- "name": "perplexity/sonar",
3073
  "type": "chat",
3074
  "input_price_per_1m": 1,
3075
- "output_price_per_1m": 1,
3076
  "currency": "USD",
3077
  "context_window": 131072,
3078
  "capabilities": [
3079
- "vision"
3080
- ],
3081
- "hf_private": true
3082
- },
3083
- {
3084
- "name": "vertex/claude-haiku-4-5",
3085
- "type": "vision",
3086
- "input_price_per_1m": 1,
3087
- "output_price_per_1m": 5,
3088
- "currency": "USD",
3089
- "capabilities": [
3090
- "vision"
3091
- ],
3092
- "context_window": 200000,
3093
- "hf_private": true
3094
- },
3095
- {
3096
- "name": "anthropic/claude-haiku-4-5",
3097
- "type": "vision",
3098
- "input_price_per_1m": 1,
3099
- "output_price_per_1m": 5,
3100
- "currency": "USD",
3101
- "capabilities": [
3102
- "vision"
3103
  ],
3104
- "context_window": 200000,
3105
- "hf_private": true
 
3106
  },
3107
  {
3108
- "name": "openai/o3-mini",
3109
  "type": "chat",
3110
  "input_price_per_1m": 1.1,
3111
  "output_price_per_1m": 4.4,
@@ -3117,7 +3117,7 @@
3117
  "hf_private": true
3118
  },
3119
  {
3120
- "name": "azure/o4-mini",
3121
  "type": "chat",
3122
  "input_price_per_1m": 1.1,
3123
  "output_price_per_1m": 4.4,
@@ -3129,7 +3129,7 @@
3129
  "hf_private": true
3130
  },
3131
  {
3132
- "name": "openai-responses/o4-mini",
3133
  "type": "chat",
3134
  "input_price_per_1m": 1.1,
3135
  "output_price_per_1m": 4.4,
@@ -3141,7 +3141,7 @@
3141
  "hf_private": true
3142
  },
3143
  {
3144
- "name": "openai-responses/o3-mini",
3145
  "type": "chat",
3146
  "input_price_per_1m": 1.1,
3147
  "output_price_per_1m": 4.4,
@@ -3152,6 +3152,16 @@
3152
  "context_window": 200000,
3153
  "hf_private": true
3154
  },
 
 
 
 
 
 
 
 
 
 
3155
  {
3156
  "name": "moonshot/kimi-k2-turbo-preview",
3157
  "type": "chat",
@@ -3167,17 +3177,7 @@
3167
  "hf_private": false
3168
  },
3169
  {
3170
- "name": "together/Qwen/Qwen2.5-72B-Instruct-Turbo",
3171
- "type": "chat",
3172
- "input_price_per_1m": 1.2,
3173
- "output_price_per_1m": 1.2,
3174
- "currency": "USD",
3175
- "context_window": 32768,
3176
- "size_b": 72,
3177
- "hf_private": false
3178
- },
3179
- {
3180
- "name": "openai/gpt-5.1-chat",
3181
  "type": "vision",
3182
  "input_price_per_1m": 1.25,
3183
  "output_price_per_1m": 10,
@@ -3186,11 +3186,11 @@
3186
  "vision",
3187
  "reasoning"
3188
  ],
3189
- "context_window": 128000,
3190
  "hf_private": true
3191
  },
3192
  {
3193
- "name": "openai/gpt-5.1",
3194
  "type": "vision",
3195
  "input_price_per_1m": 1.25,
3196
  "output_price_per_1m": 10,
@@ -3203,7 +3203,7 @@
3203
  "hf_private": true
3204
  },
3205
  {
3206
- "name": "openai/gpt-5-chat",
3207
  "type": "vision",
3208
  "input_price_per_1m": 1.25,
3209
  "output_price_per_1m": 10,
@@ -3212,35 +3212,37 @@
3212
  "vision",
3213
  "reasoning"
3214
  ],
3215
- "context_window": 128000,
3216
  "hf_private": true
3217
  },
3218
  {
3219
- "name": "azure/gpt-5",
3220
- "type": "chat",
3221
  "input_price_per_1m": 1.25,
3222
  "output_price_per_1m": 10,
3223
  "currency": "USD",
3224
  "capabilities": [
 
3225
  "reasoning"
3226
  ],
3227
- "context_window": 200000,
3228
  "hf_private": true
3229
  },
3230
  {
3231
- "name": "azure/gpt-5.1",
3232
- "type": "chat",
3233
  "input_price_per_1m": 1.25,
3234
  "output_price_per_1m": 10,
3235
  "currency": "USD",
3236
  "capabilities": [
 
3237
  "reasoning"
3238
  ],
3239
- "context_window": 200000,
3240
  "hf_private": true
3241
  },
3242
  {
3243
- "name": "coding/gemini-2.5-pro",
3244
  "type": "vision",
3245
  "input_price_per_1m": 1.25,
3246
  "output_price_per_1m": 10,
@@ -3249,11 +3251,11 @@
3249
  "vision",
3250
  "reasoning"
3251
  ],
3252
- "context_window": 1048576,
3253
  "hf_private": true
3254
  },
3255
  {
3256
- "name": "google/gemini-2.5-pro",
3257
  "type": "vision",
3258
  "input_price_per_1m": 1.25,
3259
  "output_price_per_1m": 10,
@@ -3262,11 +3264,11 @@
3262
  "vision",
3263
  "reasoning"
3264
  ],
3265
- "context_window": 1048576,
3266
  "hf_private": true
3267
  },
3268
  {
3269
- "name": "openai-responses/gpt-5-codex",
3270
  "type": "vision",
3271
  "input_price_per_1m": 1.25,
3272
  "output_price_per_1m": 10,
@@ -3275,24 +3277,26 @@
3275
  "vision",
3276
  "reasoning"
3277
  ],
3278
- "context_window": 400000,
3279
  "hf_private": true
3280
  },
3281
  {
3282
- "name": "openai-responses/gpt-5.1-codex",
3283
- "type": "vision",
3284
  "input_price_per_1m": 1.25,
3285
- "output_price_per_1m": 10,
3286
  "currency": "USD",
 
3287
  "capabilities": [
3288
- "vision",
3289
  "reasoning"
3290
  ],
3291
- "context_window": 400000,
3292
- "hf_private": true
 
3293
  },
3294
  {
3295
- "name": "openai-responses/gpt-5",
3296
  "type": "vision",
3297
  "input_price_per_1m": 1.25,
3298
  "output_price_per_1m": 10,
@@ -3301,52 +3305,48 @@
3301
  "vision",
3302
  "reasoning"
3303
  ],
3304
- "context_window": 400000,
3305
  "hf_private": true
3306
  },
3307
  {
3308
- "name": "openai-responses/gpt-5.1",
3309
- "type": "vision",
3310
  "input_price_per_1m": 1.25,
3311
  "output_price_per_1m": 10,
3312
  "currency": "USD",
3313
  "capabilities": [
3314
- "vision",
3315
  "reasoning"
3316
  ],
3317
- "context_window": 400000,
3318
  "hf_private": true
3319
  },
3320
  {
3321
- "name": "vertex/gemini-2.5-pro",
3322
- "type": "vision",
3323
  "input_price_per_1m": 1.25,
3324
  "output_price_per_1m": 10,
3325
  "currency": "USD",
3326
  "capabilities": [
3327
- "vision",
3328
  "reasoning"
3329
  ],
3330
- "context_window": 1048576,
3331
  "hf_private": true
3332
  },
3333
  {
3334
- "name": "together/deepseek-ai/DeepSeek-V3",
3335
- "type": "chat",
3336
  "input_price_per_1m": 1.25,
3337
- "output_price_per_1m": 1.25,
3338
  "currency": "USD",
3339
- "context_window": 131072,
3340
  "capabilities": [
3341
- "tools",
3342
  "reasoning"
3343
  ],
3344
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3345
- "size_b": 671,
3346
- "hf_private": false
3347
  },
3348
  {
3349
- "name": "novita/sao10k/l31-70b-euryale-v2.2",
3350
  "type": "chat",
3351
  "input_price_per_1m": 1.48,
3352
  "output_price_per_1m": 1.48,
@@ -3356,7 +3356,7 @@
3356
  "hf_private": false
3357
  },
3358
  {
3359
- "name": "novita/sao10k/l3-70b-euryale-v2.1",
3360
  "type": "chat",
3361
  "input_price_per_1m": 1.48,
3362
  "output_price_per_1m": 1.48,
@@ -3378,7 +3378,7 @@
3378
  "hf_private": true
3379
  },
3380
  {
3381
- "name": "openai/gpt-5.2-chat",
3382
  "type": "vision",
3383
  "input_price_per_1m": 1.75,
3384
  "output_price_per_1m": 14,
@@ -3387,11 +3387,11 @@
3387
  "vision",
3388
  "reasoning"
3389
  ],
3390
- "context_window": 128000,
3391
  "hf_private": true
3392
  },
3393
  {
3394
- "name": "openai/gpt-5.2",
3395
  "type": "vision",
3396
  "input_price_per_1m": 1.75,
3397
  "output_price_per_1m": 14,
@@ -3404,7 +3404,7 @@
3404
  "hf_private": true
3405
  },
3406
  {
3407
- "name": "openai/gpt-5.3-chat",
3408
  "type": "vision",
3409
  "input_price_per_1m": 1.75,
3410
  "output_price_per_1m": 14,
@@ -3417,19 +3417,20 @@
3417
  "hf_private": true
3418
  },
3419
  {
3420
- "name": "azure/gpt-5.2",
3421
- "type": "chat",
3422
  "input_price_per_1m": 1.75,
3423
  "output_price_per_1m": 14,
3424
  "currency": "USD",
3425
  "capabilities": [
 
3426
  "reasoning"
3427
  ],
3428
- "context_window": 200000,
3429
  "hf_private": true
3430
  },
3431
  {
3432
- "name": "azure/gpt-5.3-codex",
3433
  "type": "vision",
3434
  "input_price_per_1m": 1.75,
3435
  "output_price_per_1m": 14,
@@ -3438,11 +3439,11 @@
3438
  "vision",
3439
  "reasoning"
3440
  ],
3441
- "context_window": 400000,
3442
  "hf_private": true
3443
  },
3444
  {
3445
- "name": "azure/openai-responses/gpt-5.2-codex",
3446
  "type": "vision",
3447
  "input_price_per_1m": 1.75,
3448
  "output_price_per_1m": 14,
@@ -3455,7 +3456,7 @@
3455
  "hf_private": true
3456
  },
3457
  {
3458
- "name": "openai-responses/gpt-5.3-codex",
3459
  "type": "vision",
3460
  "input_price_per_1m": 1.75,
3461
  "output_price_per_1m": 14,
@@ -3464,24 +3465,23 @@
3464
  "vision",
3465
  "reasoning"
3466
  ],
3467
- "context_window": 400000,
3468
  "hf_private": true
3469
  },
3470
  {
3471
- "name": "openai-responses/gpt-5.2-codex",
3472
- "type": "vision",
3473
  "input_price_per_1m": 1.75,
3474
  "output_price_per_1m": 14,
3475
  "currency": "USD",
3476
  "capabilities": [
3477
- "vision",
3478
  "reasoning"
3479
  ],
3480
- "context_window": 400000,
3481
  "hf_private": true
3482
  },
3483
  {
3484
- "name": "openai-responses/gpt-5.3-chat",
3485
  "type": "vision",
3486
  "input_price_per_1m": 1.75,
3487
  "output_price_per_1m": 14,
@@ -3490,11 +3490,11 @@
3490
  "vision",
3491
  "reasoning"
3492
  ],
3493
- "context_window": 128000,
3494
  "hf_private": true
3495
  },
3496
  {
3497
- "name": "openai-responses/gpt-5.2",
3498
  "type": "vision",
3499
  "input_price_per_1m": 1.75,
3500
  "output_price_per_1m": 14,
@@ -3506,6 +3506,18 @@
3506
  "context_window": 400000,
3507
  "hf_private": true
3508
  },
 
 
 
 
 
 
 
 
 
 
 
 
3509
  {
3510
  "name": "openai/o4-mini-deep-research",
3511
  "type": "vision",
@@ -3541,62 +3553,29 @@
3541
  "hf_private": true
3542
  },
3543
  {
3544
- "name": "xai/grok-4.2-beta",
3545
- "type": "vision",
3546
- "input_price_per_1m": 2,
3547
- "output_price_per_1m": 6,
3548
- "currency": "USD",
3549
- "capabilities": [
3550
- "vision",
3551
- "reasoning"
3552
- ],
3553
- "context_window": 2000000,
3554
- "hf_private": true
3555
- },
3556
- {
3557
- "name": "xai/grok-2-1212",
3558
  "type": "chat",
3559
  "input_price_per_1m": 2,
3560
- "output_price_per_1m": 10,
3561
- "currency": "USD",
3562
- "context_window": 131072,
3563
- "hf_private": true
3564
- },
3565
- {
3566
- "name": "azure/openai-responses/gpt-4.1",
3567
- "type": "vision",
3568
- "input_price_per_1m": 2,
3569
  "output_price_per_1m": 8,
3570
  "currency": "USD",
 
3571
  "capabilities": [
3572
- "vision"
 
3573
  ],
3574
- "context_window": 1047576,
3575
  "hf_private": true
3576
  },
3577
  {
3578
- "name": "azure/gpt-4.1",
3579
  "type": "vision",
3580
  "input_price_per_1m": 2,
3581
- "output_price_per_1m": 8,
3582
- "currency": "USD",
3583
- "capabilities": [
3584
- "vision"
3585
- ],
3586
- "context_window": 1047576,
3587
- "hf_private": true
3588
- },
3589
- {
3590
- "name": "perplexity/sonar-reasoning-pro",
3591
- "type": "chat",
3592
- "input_price_per_1m": 2,
3593
- "output_price_per_1m": 8,
3594
  "currency": "USD",
3595
- "context_window": 131072,
3596
  "capabilities": [
3597
  "vision",
3598
  "reasoning"
3599
  ],
 
3600
  "hf_private": true
3601
  },
3602
  {
@@ -3613,28 +3592,25 @@
3613
  "hf_private": true
3614
  },
3615
  {
3616
- "name": "google/gemini-3.1-pro-preview",
3617
  "type": "vision",
3618
  "input_price_per_1m": 2,
3619
- "output_price_per_1m": 12,
3620
  "currency": "USD",
3621
  "capabilities": [
3622
  "vision",
3623
  "reasoning"
3624
  ],
3625
- "context_window": 1048576,
3626
  "hf_private": true
3627
  },
3628
  {
3629
- "name": "openai-responses/gpt-4.1",
3630
- "type": "vision",
3631
  "input_price_per_1m": 2,
3632
- "output_price_per_1m": 8,
3633
  "currency": "USD",
3634
- "capabilities": [
3635
- "vision"
3636
- ],
3637
- "context_window": 1047576,
3638
  "hf_private": true
3639
  },
3640
  {
@@ -3676,6 +3652,30 @@
3676
  "context_window": 1048576,
3677
  "hf_private": true
3678
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3679
  {
3680
  "name": "mistral/pixtral-large-latest",
3681
  "type": "chat",
@@ -3686,7 +3686,7 @@
3686
  "hf_private": true
3687
  },
3688
  {
3689
- "name": "openai/gpt-5.4",
3690
  "type": "vision",
3691
  "input_price_per_1m": 2.5,
3692
  "output_price_per_1m": 15,
@@ -3699,7 +3699,7 @@
3699
  "hf_private": true
3700
  },
3701
  {
3702
- "name": "openai/gpt-4o-2024-11-20",
3703
  "type": "vision",
3704
  "input_price_per_1m": 2.5,
3705
  "output_price_per_1m": 10,
@@ -3711,19 +3711,20 @@
3711
  "hf_private": true
3712
  },
3713
  {
3714
- "name": "openai/gpt-4o-2024-08-06",
3715
  "type": "vision",
3716
  "input_price_per_1m": 2.5,
3717
- "output_price_per_1m": 10,
3718
  "currency": "USD",
3719
  "capabilities": [
3720
- "vision"
 
3721
  ],
3722
- "context_window": 128000,
3723
  "hf_private": true
3724
  },
3725
  {
3726
- "name": "openai/gpt-4o-2024-05-13",
3727
  "type": "vision",
3728
  "input_price_per_1m": 2.5,
3729
  "output_price_per_1m": 10,
@@ -3735,7 +3736,7 @@
3735
  "hf_private": true
3736
  },
3737
  {
3738
- "name": "openai/gpt-4o",
3739
  "type": "vision",
3740
  "input_price_per_1m": 2.5,
3741
  "output_price_per_1m": 10,
@@ -3747,20 +3748,19 @@
3747
  "hf_private": true
3748
  },
3749
  {
3750
- "name": "azure/openai-responses/gpt-5.4",
3751
  "type": "vision",
3752
  "input_price_per_1m": 2.5,
3753
- "output_price_per_1m": 15,
3754
  "currency": "USD",
3755
  "capabilities": [
3756
- "vision",
3757
- "reasoning"
3758
  ],
3759
- "context_window": 1050000,
3760
  "hf_private": true
3761
  },
3762
  {
3763
- "name": "openai-responses/gpt-5.4",
3764
  "type": "vision",
3765
  "input_price_per_1m": 2.5,
3766
  "output_price_per_1m": 15,
@@ -3773,19 +3773,19 @@
3773
  "hf_private": true
3774
  },
3775
  {
3776
- "name": "xai/grok-4",
3777
- "type": "vision",
3778
  "input_price_per_1m": 3,
3779
  "output_price_per_1m": 15,
3780
  "currency": "USD",
 
3781
  "capabilities": [
3782
  "vision"
3783
  ],
3784
- "context_window": 256000,
3785
  "hf_private": true
3786
  },
3787
  {
3788
- "name": "bedrock/claude-sonnet-4-6",
3789
  "type": "vision",
3790
  "input_price_per_1m": 3,
3791
  "output_price_per_1m": 15,
@@ -3794,11 +3794,11 @@
3794
  "vision",
3795
  "reasoning"
3796
  ],
3797
- "context_window": 1000000,
3798
  "hf_private": true
3799
  },
3800
  {
3801
- "name": "bedrock/claude-sonnet-4",
3802
  "type": "vision",
3803
  "input_price_per_1m": 3,
3804
  "output_price_per_1m": 15,
@@ -3807,7 +3807,7 @@
3807
  "vision",
3808
  "reasoning"
3809
  ],
3810
- "context_window": 200000,
3811
  "hf_private": true
3812
  },
3813
  {
@@ -3824,7 +3824,7 @@
3824
  "hf_private": true
3825
  },
3826
  {
3827
- "name": "bedrock/claude-3-7-sonnet",
3828
  "type": "vision",
3829
  "input_price_per_1m": 3,
3830
  "output_price_per_1m": 15,
@@ -3837,7 +3837,7 @@
3837
  "hf_private": true
3838
  },
3839
  {
3840
- "name": "coding/claude-sonnet-4-20250514",
3841
  "type": "vision",
3842
  "input_price_per_1m": 3,
3843
  "output_price_per_1m": 15,
@@ -3846,23 +3846,24 @@
3846
  "vision",
3847
  "reasoning"
3848
  ],
3849
- "context_window": 200000,
3850
  "hf_private": true
3851
  },
3852
  {
3853
- "name": "perplexity/sonar-pro",
3854
- "type": "chat",
3855
  "input_price_per_1m": 3,
3856
  "output_price_per_1m": 15,
3857
  "currency": "USD",
3858
- "context_window": 204800,
3859
  "capabilities": [
3860
- "vision"
 
3861
  ],
 
3862
  "hf_private": true
3863
  },
3864
  {
3865
- "name": "vertex/claude-3-7-sonnet",
3866
  "type": "vision",
3867
  "input_price_per_1m": 3,
3868
  "output_price_per_1m": 15,
@@ -3871,11 +3872,11 @@
3871
  "vision",
3872
  "reasoning"
3873
  ],
3874
- "context_window": 200000,
3875
  "hf_private": true
3876
  },
3877
  {
3878
- "name": "vertex/claude-3-5-sonnet",
3879
  "type": "vision",
3880
  "input_price_per_1m": 3,
3881
  "output_price_per_1m": 15,
@@ -3883,37 +3884,39 @@
3883
  "capabilities": [
3884
  "vision"
3885
  ],
3886
- "context_window": 200000,
3887
  "hf_private": true
3888
  },
3889
  {
3890
- "name": "vertex/claude-sonnet-4-5",
3891
- "type": "vision",
3892
  "input_price_per_1m": 3,
3893
- "output_price_per_1m": 15,
3894
  "currency": "USD",
 
3895
  "capabilities": [
3896
- "vision",
3897
  "reasoning"
3898
  ],
3899
- "context_window": 200000,
3900
- "hf_private": true
 
 
3901
  },
3902
  {
3903
- "name": "vertex/claude-sonnet-4",
3904
  "type": "vision",
3905
  "input_price_per_1m": 3,
3906
  "output_price_per_1m": 15,
3907
  "currency": "USD",
3908
  "capabilities": [
3909
- "vision",
3910
- "reasoning"
3911
  ],
3912
  "context_window": 200000,
3913
  "hf_private": true
3914
  },
3915
  {
3916
- "name": "anthropic/claude-sonnet-4",
3917
  "type": "vision",
3918
  "input_price_per_1m": 3,
3919
  "output_price_per_1m": 15,
@@ -3922,11 +3925,11 @@
3922
  "vision",
3923
  "reasoning"
3924
  ],
3925
- "context_window": 1000000,
3926
  "hf_private": true
3927
  },
3928
  {
3929
- "name": "anthropic/claude-sonnet-4-5",
3930
  "type": "vision",
3931
  "input_price_per_1m": 3,
3932
  "output_price_per_1m": 15,
@@ -3935,11 +3938,11 @@
3935
  "vision",
3936
  "reasoning"
3937
  ],
3938
- "context_window": 1000000,
3939
  "hf_private": true
3940
  },
3941
  {
3942
- "name": "anthropic/claude-sonnet-4-6",
3943
  "type": "vision",
3944
  "input_price_per_1m": 3,
3945
  "output_price_per_1m": 15,
@@ -3948,24 +3951,21 @@
3948
  "vision",
3949
  "reasoning"
3950
  ],
3951
- "context_window": 1000000,
3952
  "hf_private": true
3953
  },
3954
  {
3955
- "name": "together/deepseek-ai/DeepSeek-R1",
3956
- "type": "chat",
3957
  "input_price_per_1m": 3,
3958
- "output_price_per_1m": 7,
3959
  "currency": "USD",
3960
- "context_window": 64000,
3961
  "capabilities": [
3962
- "tools",
3963
  "reasoning"
3964
  ],
3965
- "hf_id": "deepseek-ai/DeepSeek-R1",
3966
- "size_b": 671,
3967
- "size_source": "manual",
3968
- "hf_private": false
3969
  },
3970
  {
3971
  "name": "novita/deepseek/deepseek-r1",
@@ -3995,18 +3995,6 @@
3995
  "context_window": 128000,
3996
  "hf_private": true
3997
  },
3998
- {
3999
- "name": "xai/grok-3",
4000
- "type": "chat",
4001
- "input_price_per_1m": 5,
4002
- "output_price_per_1m": 25,
4003
- "currency": "USD",
4004
- "context_window": 131072,
4005
- "capabilities": [
4006
- "tools"
4007
- ],
4008
- "hf_private": true
4009
- },
4010
  {
4011
  "name": "bedrock/claude-opus-4-5",
4012
  "type": "vision",
@@ -4034,7 +4022,7 @@
4034
  "hf_private": true
4035
  },
4036
  {
4037
- "name": "vertex/claude-opus-4-6",
4038
  "type": "vision",
4039
  "input_price_per_1m": 5,
4040
  "output_price_per_1m": 25,
@@ -4047,7 +4035,7 @@
4047
  "hf_private": true
4048
  },
4049
  {
4050
- "name": "vertex/claude-opus-4-5",
4051
  "type": "vision",
4052
  "input_price_per_1m": 5,
4053
  "output_price_per_1m": 25,
@@ -4060,7 +4048,19 @@
4060
  "hf_private": true
4061
  },
4062
  {
4063
- "name": "anthropic/claude-opus-4-6",
 
 
 
 
 
 
 
 
 
 
 
 
4064
  "type": "vision",
4065
  "input_price_per_1m": 5,
4066
  "output_price_per_1m": 25,
@@ -4069,11 +4069,11 @@
4069
  "vision",
4070
  "reasoning"
4071
  ],
4072
- "context_window": 1000000,
4073
  "hf_private": true
4074
  },
4075
  {
4076
- "name": "anthropic/claude-opus-4-5",
4077
  "type": "vision",
4078
  "input_price_per_1m": 5,
4079
  "output_price_per_1m": 25,
@@ -4082,7 +4082,7 @@
4082
  "vision",
4083
  "reasoning"
4084
  ],
4085
- "context_window": 200000,
4086
  "hf_private": true
4087
  },
4088
  {
@@ -4099,23 +4099,23 @@
4099
  "hf_private": true
4100
  },
4101
  {
4102
- "name": "openai/o1",
4103
  "type": "vision",
4104
  "input_price_per_1m": 15,
4105
- "output_price_per_1m": 60,
4106
  "currency": "USD",
4107
  "capabilities": [
4108
  "vision",
4109
  "reasoning"
4110
  ],
4111
- "context_window": 200000,
4112
  "hf_private": true
4113
  },
4114
  {
4115
- "name": "bedrock/claude-opus-4",
4116
  "type": "vision",
4117
  "input_price_per_1m": 15,
4118
- "output_price_per_1m": 75,
4119
  "currency": "USD",
4120
  "capabilities": [
4121
  "vision",
@@ -4125,7 +4125,7 @@
4125
  "hf_private": true
4126
  },
4127
  {
4128
- "name": "coding/claude-opus-4-20250514",
4129
  "type": "vision",
4130
  "input_price_per_1m": 15,
4131
  "output_price_per_1m": 75,
@@ -4138,20 +4138,20 @@
4138
  "hf_private": true
4139
  },
4140
  {
4141
- "name": "openai-responses/gpt-5-pro",
4142
  "type": "vision",
4143
  "input_price_per_1m": 15,
4144
- "output_price_per_1m": 120,
4145
  "currency": "USD",
4146
  "capabilities": [
4147
  "vision",
4148
  "reasoning"
4149
  ],
4150
- "context_window": 400000,
4151
  "hf_private": true
4152
  },
4153
  {
4154
- "name": "vertex/claude-opus-4-1",
4155
  "type": "vision",
4156
  "input_price_per_1m": 15,
4157
  "output_price_per_1m": 75,
@@ -4177,7 +4177,7 @@
4177
  "hf_private": true
4178
  },
4179
  {
4180
- "name": "anthropic/claude-opus-4",
4181
  "type": "vision",
4182
  "input_price_per_1m": 15,
4183
  "output_price_per_1m": 75,
@@ -4190,7 +4190,7 @@
4190
  "hf_private": true
4191
  },
4192
  {
4193
- "name": "anthropic/claude-opus-4-1",
4194
  "type": "vision",
4195
  "input_price_per_1m": 15,
4196
  "output_price_per_1m": 75,
@@ -4216,7 +4216,7 @@
4216
  "hf_private": true
4217
  },
4218
  {
4219
- "name": "openai/gpt-5.4-pro",
4220
  "type": "vision",
4221
  "input_price_per_1m": 30,
4222
  "output_price_per_1m": 180,
@@ -4229,7 +4229,7 @@
4229
  "hf_private": true
4230
  },
4231
  {
4232
- "name": "azure/openai-responses/gpt-5.4-pro",
4233
  "type": "vision",
4234
  "input_price_per_1m": 30,
4235
  "output_price_per_1m": 180,
@@ -4242,7 +4242,7 @@
4242
  "hf_private": true
4243
  },
4244
  {
4245
- "name": "openai-responses/gpt-5.4-pro",
4246
  "type": "vision",
4247
  "input_price_per_1m": 30,
4248
  "output_price_per_1m": 180,
@@ -5091,7 +5091,8 @@
5091
  ],
5092
  "hf_id": "mistralai/Voxtral-Small-24B-2507",
5093
  "hf_private": false,
5094
- "price_per_minute": 0.15
 
5095
  },
5096
  {
5097
  "name": "gemma-3-27b-it",
@@ -5175,8 +5176,8 @@
5175
  "capabilities": [
5176
  "tools"
5177
  ],
5178
- "size_b": 675,
5179
- "hf_id": "mistralai/Mistral-Large-Instruct-2411",
5180
  "hf_private": false,
5181
  "ollama_id": "mistral-large",
5182
  "size_source": "manual"
@@ -5221,9 +5222,13 @@
5221
  "currency": "USD",
5222
  "api_endpoint": "devstral-medium-latest",
5223
  "ollama_id": "devstral-2",
5224
- "size_b": 7.242,
5225
- "hf_id": "mistralai/Mistral-7B-v0.1",
5226
- "hf_private": false
 
 
 
 
5227
  },
5228
  {
5229
  "name": "Devstral Small 2",
@@ -5332,24 +5337,30 @@
5332
  "type": "audio",
5333
  "currency": "USD",
5334
  "api_endpoint": "voxtral-mini-latest",
5335
- "hf_private": true,
5336
  "price_per_minute": 0.003,
5337
  "capabilities": [
5338
  "audio",
5339
  "tools"
5340
- ]
 
 
 
5341
  },
5342
  {
5343
  "name": "Voxtral Realtime",
5344
  "type": "audio",
5345
  "currency": "USD",
5346
  "api_endpoint": "voxtral-mini-latest",
5347
- "hf_private": true,
5348
  "price_per_minute": 0.006,
5349
  "capabilities": [
5350
  "audio",
5351
  "tools"
5352
- ]
 
 
 
5353
  },
5354
  {
5355
  "name": "Voxtral Small",
@@ -5364,7 +5375,8 @@
5364
  ],
5365
  "size_b": 24,
5366
  "hf_id": "mistralai/Voxtral-Small-24B-2507",
5367
- "hf_private": false
 
5368
  },
5369
  {
5370
  "name": "Voxtral Mini",
@@ -5373,11 +5385,14 @@
5373
  "output_price_per_1m": 0.04,
5374
  "currency": "USD",
5375
  "api_endpoint": "voxtral-mini-latest",
5376
- "hf_private": true,
5377
  "capabilities": [
5378
  "audio",
5379
  "tools"
5380
- ]
 
 
 
5381
  },
5382
  {
5383
  "name": "Classifier API model 8B",
@@ -6329,7 +6344,8 @@
6329
  ],
6330
  "size_b": 24,
6331
  "hf_private": false,
6332
- "audio_price_per_1m": 100
 
6333
  },
6334
  {
6335
  "name": "nvidia/llama-3.3-nemotron-super-49b-v1.5",
@@ -7728,7 +7744,8 @@
7728
  "tools"
7729
  ],
7730
  "size_b": 123,
7731
- "hf_private": false
 
7732
  },
7733
  {
7734
  "name": "deepseek/deepseek-v3.2-speciale",
 
378
  "capabilities": [
379
  "tools"
380
  ],
381
+ "size_b": 123,
382
+ "hf_id": "mistralai/Mistral-Large-Instruct-2407",
383
  "hf_private": false,
384
  "ollama_id": "mistral-large",
385
  "size_source": "manual"
 
1154
  "hf_private": false
1155
  },
1156
  {
1157
+ "name": "alibaba/qwen-turbo",
1158
  "type": "chat",
1159
  "input_price_per_1m": 0.05,
1160
+ "output_price_per_1m": 0.2,
1161
  "currency": "USD",
1162
+ "context_window": 1000000,
1163
+ "capabilities": [
1164
+ "tools"
1165
+ ],
1166
+ "hf_private": true
1167
+ },
1168
+ {
1169
+ "name": "openai-responses/gpt-5-nano",
1170
+ "type": "vision",
1171
+ "input_price_per_1m": 0.05,
1172
+ "output_price_per_1m": 0.4,
1173
+ "currency": "USD",
1174
+ "capabilities": [
1175
+ "vision",
1176
+ "reasoning"
1177
+ ],
1178
+ "context_window": 400000,
1179
+ "hf_private": true
1180
  },
1181
  {
1182
  "name": "novita/meta-llama/llama-3.1-8b-instruct",
 
1203
  "hf_private": false
1204
  },
1205
  {
1206
+ "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
1207
  "type": "chat",
1208
  "input_price_per_1m": 0.05,
1209
+ "output_price_per_1m": 0.05,
1210
  "currency": "USD",
1211
+ "context_window": 8192,
1212
+ "size_b": 8,
1213
+ "hf_private": false
 
 
1214
  },
1215
  {
1216
+ "name": "azure/gpt-5-nano",
1217
  "type": "chat",
1218
  "input_price_per_1m": 0.05,
 
 
 
 
 
 
 
 
 
 
 
 
1219
  "output_price_per_1m": 0.4,
1220
  "currency": "USD",
1221
  "capabilities": [
 
1222
  "reasoning"
1223
  ],
1224
+ "context_window": 200000,
1225
  "hf_private": true
1226
  },
1227
  {
 
1235
  "hf_private": false
1236
  },
1237
  {
1238
+ "name": "deepinfra/Qwen/Qwen2.5-Coder-32B-Instruct",
1239
  "type": "chat",
1240
  "input_price_per_1m": 0.07,
1241
+ "output_price_per_1m": 0.16,
1242
  "currency": "USD",
1243
  "context_window": 16384,
1244
+ "size_b": 32,
1245
+ "hf_private": false
 
 
1246
  },
1247
  {
1248
+ "name": "deepinfra/microsoft/phi-4",
1249
  "type": "chat",
1250
  "input_price_per_1m": 0.07,
1251
+ "output_price_per_1m": 0.14,
1252
  "currency": "USD",
1253
  "context_window": 16384,
1254
+ "hf_private": false,
1255
+ "size_b": 14,
1256
+ "size_source": "manual",
1257
+ "hf_id": "microsoft/phi-4"
1258
  },
1259
  {
1260
  "name": "novita/gryphe/mythomax-l2-13b",
 
1268
  "hf_private": false
1269
  },
1270
  {
1271
+ "name": "openai-responses/gpt-4.1-nano",
1272
  "type": "vision",
1273
  "input_price_per_1m": 0.1,
1274
  "output_price_per_1m": 0.4,
 
1280
  "hf_private": true
1281
  },
1282
  {
1283
+ "name": "openai/gpt-4.1-nano",
1284
+ "type": "vision",
1285
  "input_price_per_1m": 0.1,
1286
+ "output_price_per_1m": 0.4,
1287
  "currency": "USD",
 
 
1288
  "capabilities": [
1289
+ "vision"
 
1290
  ],
1291
+ "context_window": 1047576,
1292
+ "hf_private": true
1293
  },
1294
  {
1295
+ "name": "google/gemini-2.0-flash-001",
1296
  "type": "vision",
1297
  "input_price_per_1m": 0.1,
1298
  "output_price_per_1m": 0.4,
 
1300
  "capabilities": [
1301
  "vision"
1302
  ],
1303
+ "context_window": 1048576,
1304
  "hf_private": true
1305
  },
1306
  {
1307
+ "name": "google/gemini-2.5-flash-lite",
1308
  "type": "vision",
1309
  "input_price_per_1m": 0.1,
1310
  "output_price_per_1m": 0.4,
1311
  "currency": "USD",
1312
  "capabilities": [
1313
+ "vision",
1314
+ "reasoning"
1315
  ],
1316
+ "context_window": 1048576,
1317
  "hf_private": true
1318
  },
1319
  {
1320
+ "name": "together/meta-llama/Meta-Llama-3-8B-Instruct-Lite",
1321
  "type": "chat",
1322
  "input_price_per_1m": 0.1,
1323
+ "output_price_per_1m": 0.1,
1324
  "currency": "USD",
1325
+ "context_window": 8192,
1326
+ "size_b": 8,
1327
+ "hf_private": false
1328
+ },
1329
+ {
1330
+ "name": "deepinfra/Qwen/Qwen3-32B",
1331
+ "type": "chat",
1332
+ "input_price_per_1m": 0.1,
1333
+ "output_price_per_1m": 0.3,
1334
+ "currency": "USD",
1335
+ "context_window": 40000,
1336
+ "size_b": 32,
1337
  "capabilities": [
1338
  "tools",
1339
  "reasoning"
1340
  ],
1341
+ "hf_id": "Qwen/Qwen3-32B",
1342
  "hf_private": false
1343
  },
1344
  {
1345
+ "name": "vertex/gemini-2.5-flash-lite",
1346
  "type": "vision",
1347
  "input_price_per_1m": 0.1,
1348
  "output_price_per_1m": 0.4,
 
1355
  "hf_private": true
1356
  },
1357
  {
1358
+ "name": "azure/openai-responses/gpt-4.1-nano",
1359
  "type": "vision",
1360
  "input_price_per_1m": 0.1,
1361
  "output_price_per_1m": 0.4,
 
1363
  "capabilities": [
1364
  "vision"
1365
  ],
1366
+ "context_window": 1047576,
1367
  "hf_private": true
1368
  },
1369
  {
1370
+ "name": "azure/gpt-4.1-nano",
1371
  "type": "vision",
1372
  "input_price_per_1m": 0.1,
1373
  "output_price_per_1m": 0.4,
 
1379
  "hf_private": true
1380
  },
1381
  {
1382
+ "name": "groq/openai/gpt-oss-20b",
1383
+ "type": "chat",
1384
  "input_price_per_1m": 0.1,
1385
+ "output_price_per_1m": 0.5,
1386
  "currency": "USD",
1387
+ "context_window": 131072,
1388
+ "size_b": 20,
1389
  "capabilities": [
1390
+ "tools",
1391
  "reasoning"
1392
  ],
1393
+ "hf_id": "openai/gpt-oss-20b",
1394
+ "hf_private": false
 
 
 
 
 
 
 
 
 
1395
  },
1396
  {
1397
+ "name": "mistral/devstral-small-2507",
1398
  "type": "chat",
1399
  "input_price_per_1m": 0.1,
1400
  "output_price_per_1m": 0.3,
 
1408
  "hf_private": false
1409
  },
1410
  {
1411
+ "name": "mistral/devstral-small-latest",
1412
  "type": "chat",
1413
  "input_price_per_1m": 0.1,
1414
  "output_price_per_1m": 0.3,
 
1422
  "hf_private": false
1423
  },
1424
  {
1425
+ "name": "mistral/mistral-small-2503",
1426
  "type": "chat",
1427
  "input_price_per_1m": 0.1,
1428
+ "output_price_per_1m": 0.3,
1429
  "currency": "USD",
1430
+ "context_window": 32768,
1431
+ "hf_private": true
 
1432
  },
1433
  {
1434
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo",
 
1508
  "hf_id": "openai/gpt-oss-120b",
1509
  "hf_private": false
1510
  },
1511
+ {
1512
+ "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1513
+ "type": "chat",
1514
+ "input_price_per_1m": 0.15,
1515
+ "output_price_per_1m": 0.85,
1516
+ "currency": "USD",
1517
+ "context_window": 262144,
1518
+ "size_b": 235,
1519
+ "hf_private": false
1520
+ },
1521
  {
1522
  "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
1523
  "type": "chat",
 
1534
  "size_source": "manual",
1535
  "hf_private": false
1536
  },
 
 
 
 
 
 
 
 
 
 
1537
  {
1538
  "name": "groq/openai/gpt-oss-120b",
1539
  "type": "chat",
 
1550
  "hf_private": false
1551
  },
1552
  {
1553
+ "name": "mistral/mistral-small-latest",
1554
  "type": "vision",
1555
  "input_price_per_1m": 0.15,
1556
  "output_price_per_1m": 0.6,
 
1560
  "reasoning"
1561
  ],
1562
  "context_window": 256000,
1563
+ "hf_private": true
 
 
1564
  },
1565
  {
1566
+ "name": "mistral/mistral-small-2603",
1567
  "type": "vision",
1568
  "input_price_per_1m": 0.15,
1569
  "output_price_per_1m": 0.6,
 
1573
  "reasoning"
1574
  ],
1575
  "context_window": 256000,
1576
+ "size_b": 119,
1577
+ "hf_id": "mistralai/Mistral-Small-4-119B-2603",
1578
+ "hf_private": false
1579
  },
1580
  {
1581
  "name": "novita/mistralai/mistral-nemo",
 
1601
  "size_b": 8,
1602
  "hf_private": false
1603
  },
1604
+ {
1605
+ "name": "alibaba/qwen3-30b-a3b-instruct-2507",
1606
+ "type": "vision",
1607
+ "input_price_per_1m": 0.2,
1608
+ "output_price_per_1m": 0.8,
1609
+ "currency": "USD",
1610
+ "capabilities": [
1611
+ "vision"
1612
+ ],
1613
+ "context_window": 131072,
1614
+ "size_b": 30,
1615
+ "hf_id": "Qwen/Qwen3-30B-A3B-Instruct-2507",
1616
+ "hf_private": false
1617
+ },
1618
+ {
1619
+ "name": "openai-responses/gpt-5.4-nano",
1620
+ "type": "vision",
1621
+ "input_price_per_1m": 0.2,
1622
+ "output_price_per_1m": 1.25,
1623
+ "currency": "USD",
1624
+ "capabilities": [
1625
+ "vision",
1626
+ "reasoning"
1627
+ ],
1628
+ "context_window": 400000,
1629
+ "hf_private": true
1630
+ },
1631
  {
1632
  "name": "openai/gpt-5.4-nano",
1633
  "type": "vision",
 
1671
  "hf_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct",
1672
  "hf_private": false
1673
  },
 
 
 
 
 
 
 
 
 
 
 
 
1674
  {
1675
  "name": "xai/grok-4-fast-non-reasoning",
1676
  "type": "chat",
 
1685
  ],
1686
  "hf_private": true
1687
  },
1688
+ {
1689
+ "name": "xai/grok-code-fast-1",
1690
+ "type": "vision",
1691
+ "input_price_per_1m": 0.2,
1692
+ "output_price_per_1m": 1.5,
1693
+ "currency": "USD",
1694
+ "capabilities": [
1695
+ "vision"
1696
+ ],
1697
+ "context_window": 256000,
1698
+ "hf_private": true
1699
+ },
1700
  {
1701
  "name": "xai/grok-4-fast",
1702
  "type": "chat",
 
1736
  "hf_private": true
1737
  },
1738
  {
1739
+ "name": "together/meta-llama/LlamaGuard-2-8b",
1740
  "type": "chat",
1741
  "input_price_per_1m": 0.2,
1742
+ "output_price_per_1m": 0.2,
1743
  "currency": "USD",
1744
+ "context_window": 8192,
1745
+ "size_b": 8,
 
 
 
 
 
1746
  "hf_private": false
1747
  },
1748
  {
 
1761
  "hf_private": false
1762
  },
1763
  {
1764
+ "name": "deepinfra/Qwen/Qwen3-235B-A22B",
1765
+ "type": "chat",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1766
  "input_price_per_1m": 0.2,
1767
+ "output_price_per_1m": 0.6,
1768
  "currency": "USD",
1769
+ "context_window": 40000,
1770
+ "size_b": 235,
1771
  "capabilities": [
1772
+ "tools",
1773
  "reasoning"
1774
  ],
1775
+ "hf_id": "Qwen/Qwen3-235B-A22B",
 
 
 
 
 
 
 
 
 
 
1776
  "hf_private": false
1777
  },
1778
  {
1779
+ "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct",
1780
  "type": "chat",
1781
  "input_price_per_1m": 0.23,
1782
  "output_price_per_1m": 0.4,
1783
  "currency": "USD",
1784
  "context_window": 131072,
1785
+ "size_b": 70,
1786
  "capabilities": [
1787
+ "tools"
1788
  ],
1789
+ "hf_id": "meta-llama/Llama-3.3-70B-Instruct",
 
 
 
 
 
 
 
 
 
 
1790
  "hf_private": false
1791
  },
1792
  {
1793
+ "name": "deepinfra/Qwen/Qwen2.5-72B-Instruct",
1794
  "type": "chat",
1795
  "input_price_per_1m": 0.23,
1796
  "output_price_per_1m": 0.4,
1797
  "currency": "USD",
1798
  "context_window": 131072,
1799
+ "size_b": 72,
1800
  "capabilities": [
1801
+ "vision"
1802
  ],
1803
+ "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
1804
  "hf_private": false
1805
  },
1806
  {
 
1818
  "hf_private": false
1819
  },
1820
  {
1821
+ "name": "deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct",
1822
  "type": "chat",
1823
+ "input_price_per_1m": 0.23,
1824
+ "output_price_per_1m": 0.4,
1825
+ "currency": "USD",
1826
+ "context_window": 130815,
1827
+ "size_b": 70,
1828
+ "hf_private": false
1829
+ },
1830
+ {
1831
+ "name": "openai-responses/gpt-5-mini",
1832
+ "type": "vision",
1833
  "input_price_per_1m": 0.25,
1834
  "output_price_per_1m": 2,
1835
  "currency": "USD",
1836
  "capabilities": [
1837
+ "vision",
1838
  "reasoning"
1839
  ],
1840
+ "context_window": 400000,
1841
  "hf_private": true
1842
  },
1843
  {
 
1853
  "hf_private": true
1854
  },
1855
  {
1856
+ "name": "vertex/gemini-3.1-flash-lite-preview",
1857
  "type": "vision",
1858
  "input_price_per_1m": 0.25,
1859
+ "output_price_per_1m": 1.5,
1860
  "currency": "USD",
1861
  "capabilities": [
1862
+ "vision"
 
1863
  ],
1864
+ "context_window": 1048576,
1865
  "hf_private": true
1866
  },
1867
  {
1868
+ "name": "azure/gpt-5-mini",
1869
+ "type": "chat",
1870
  "input_price_per_1m": 0.25,
1871
+ "output_price_per_1m": 2,
1872
  "currency": "USD",
1873
  "capabilities": [
1874
+ "reasoning"
1875
  ],
1876
+ "context_window": 200000,
1877
  "hf_private": true
1878
  },
1879
  {
 
1924
  "context_window": 128000,
1925
  "hf_private": true
1926
  },
1927
+ {
1928
+ "name": "alibaba/qwen3-coder-flash",
1929
+ "type": "vision",
1930
+ "input_price_per_1m": 0.3,
1931
+ "output_price_per_1m": 1.5,
1932
+ "currency": "USD",
1933
+ "capabilities": [
1934
+ "vision"
1935
+ ],
1936
+ "context_window": 1048576,
1937
+ "hf_private": true
1938
+ },
1939
  {
1940
  "name": "nebius/deepseek-ai/DeepSeek-V3.2",
1941
  "type": "chat",
 
1965
  "hf_private": false
1966
  },
1967
  {
1968
+ "name": "parasail/parasail-gemma3-27b-it",
1969
+ "type": "chat",
1970
+ "input_price_per_1m": 0.3,
1971
+ "output_price_per_1m": 0.5,
1972
+ "currency": "USD",
1973
+ "context_window": 128000,
1974
+ "size_b": 27,
1975
+ "hf_private": false
1976
+ },
1977
+ {
1978
+ "name": "google/gemini-2.5-flash",
1979
  "type": "vision",
1980
  "input_price_per_1m": 0.3,
1981
+ "output_price_per_1m": 2.5,
1982
  "currency": "USD",
1983
  "capabilities": [
1984
  "vision",
1985
  "reasoning"
1986
  ],
1987
+ "context_window": 1048576,
1988
+ "hf_private": true
 
 
 
1989
  },
1990
  {
1991
+ "name": "novita/minimax-m2.7",
1992
  "type": "vision",
1993
  "input_price_per_1m": 0.3,
1994
  "output_price_per_1m": 1.2,
 
2018
  "hf_private": false
2019
  },
2020
  {
2021
+ "name": "novita/MiniMax-M2.7",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2022
  "type": "vision",
2023
  "input_price_per_1m": 0.3,
2024
  "output_price_per_1m": 1.2,
 
2034
  "size_source": "manual"
2035
  },
2036
  {
2037
+ "name": "xai/grok-3-mini",
2038
  "type": "chat",
2039
  "input_price_per_1m": 0.3,
2040
+ "output_price_per_1m": 0.5,
2041
  "currency": "USD",
 
2042
  "capabilities": [
 
2043
  "reasoning"
2044
  ],
2045
+ "context_window": 131072,
2046
+ "hf_private": true
 
2047
  },
2048
  {
2049
+ "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
2050
  "type": "chat",
2051
  "input_price_per_1m": 0.3,
2052
+ "output_price_per_1m": 0.3,
2053
  "currency": "USD",
2054
+ "context_window": 32768,
2055
+ "size_b": 7,
2056
+ "hf_private": false
 
 
2057
  },
2058
  {
2059
  "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
 
2071
  "hf_private": false
2072
  },
2073
  {
2074
+ "name": "vertex/gemini-2.5-flash",
2075
  "type": "vision",
2076
  "input_price_per_1m": 0.3,
2077
  "output_price_per_1m": 2.5,
 
2084
  "hf_private": true
2085
  },
2086
  {
2087
+ "name": "vertex/gemini-2.5-flash-image",
 
 
 
 
 
 
 
 
 
 
2088
  "type": "vision",
2089
  "input_price_per_1m": 0.3,
2090
+ "output_price_per_1m": 2.5,
2091
  "currency": "USD",
2092
  "capabilities": [
2093
+ "vision",
2094
+ "reasoning"
2095
  ],
2096
  "context_window": 1048576,
2097
  "hf_private": true
2098
  },
2099
  {
2100
+ "name": "coding/gemini-2.5-flash",
2101
  "type": "vision",
2102
  "input_price_per_1m": 0.3,
2103
  "output_price_per_1m": 2.5,
 
2110
  "hf_private": true
2111
  },
2112
  {
2113
+ "name": "mistral/codestral-latest",
2114
+ "type": "chat",
2115
  "input_price_per_1m": 0.3,
2116
+ "output_price_per_1m": 0.9,
2117
  "currency": "USD",
2118
+ "context_window": 131072,
 
 
 
 
2119
  "hf_private": true
2120
  },
2121
  {
2122
+ "name": "minimaxi/MiniMax-M2",
2123
+ "type": "chat",
2124
  "input_price_per_1m": 0.3,
2125
+ "output_price_per_1m": 1.2,
2126
  "currency": "USD",
2127
+ "context_window": 200000,
2128
  "capabilities": [
2129
+ "tools",
2130
  "reasoning"
2131
  ],
2132
+ "hf_id": "MiniMaxAI/MiniMax-M2",
2133
+ "size_b": 228.7,
2134
+ "hf_private": false
2135
  },
2136
  {
2137
+ "name": "minimaxi/MiniMax-M2.7",
2138
+ "type": "vision",
2139
  "input_price_per_1m": 0.3,
2140
+ "output_price_per_1m": 1.2,
2141
  "currency": "USD",
2142
+ "capabilities": [
2143
+ "vision",
2144
+ "reasoning"
2145
+ ],
2146
+ "context_window": 200000,
2147
+ "hf_id": "MiniMaxAI/MiniMax-M2.7",
2148
+ "hf_private": false,
2149
+ "size_b": 230,
2150
+ "size_source": "manual"
2151
  },
2152
  {
2153
+ "name": "minimaxi/MiniMax-M2.5",
2154
+ "type": "vision",
2155
  "input_price_per_1m": 0.3,
2156
+ "output_price_per_1m": 1.2,
2157
  "currency": "USD",
2158
+ "capabilities": [
2159
+ "vision",
2160
+ "reasoning"
2161
+ ],
2162
+ "context_window": 200000,
2163
+ "hf_id": "MiniMaxAI/MiniMax-M2.5",
2164
+ "size_b": 228.7,
2165
  "hf_private": false
2166
  },
2167
  {
 
2203
  "hf_private": false
2204
  },
2205
  {
2206
+ "name": "alibaba/qwen-plus",
2207
+ "type": "chat",
2208
+ "input_price_per_1m": 0.4,
2209
+ "output_price_per_1m": 1.2,
2210
+ "currency": "USD",
2211
+ "context_window": 131072,
2212
+ "capabilities": [
2213
+ "tools"
2214
+ ],
2215
+ "hf_private": true
2216
+ },
2217
+ {
2218
+ "name": "openai-responses/gpt-4.1-mini",
2219
  "type": "vision",
2220
  "input_price_per_1m": 0.4,
2221
  "output_price_per_1m": 1.6,
 
2227
  "hf_private": true
2228
  },
2229
  {
2230
+ "name": "openai/gpt-4.1-mini",
2231
+ "type": "vision",
2232
  "input_price_per_1m": 0.4,
2233
+ "output_price_per_1m": 1.6,
2234
  "currency": "USD",
 
 
2235
  "capabilities": [
2236
+ "vision"
2237
  ],
2238
+ "context_window": 1047576,
2239
+ "hf_private": true
2240
  },
2241
  {
2242
  "name": "nebius/zai-org/GLM-4.7",
 
2253
  "hf_private": false
2254
  },
2255
  {
2256
+ "name": "nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2257
  "type": "chat",
2258
  "input_price_per_1m": 0.4,
2259
+ "output_price_per_1m": 1.8,
2260
  "currency": "USD",
2261
+ "context_window": 262000,
2262
+ "size_b": 480,
2263
  "capabilities": [
2264
+ "tools"
 
2265
  ],
2266
+ "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
 
2267
  "hf_private": false
2268
  },
2269
  {
 
2275
  "context_window": 128000,
2276
  "hf_private": true
2277
  },
2278
+ {
2279
+ "name": "novita/deepseek/deepseek-v3-0324",
2280
+ "type": "chat",
2281
+ "input_price_per_1m": 0.4,
2282
+ "output_price_per_1m": 1.3,
2283
+ "currency": "USD",
2284
+ "context_window": 128000,
2285
+ "capabilities": [
2286
+ "tools",
2287
+ "reasoning"
2288
+ ],
2289
+ "size_b": 685,
2290
+ "hf_id": "deepseek-ai/DeepSeek-V3-0324",
2291
+ "hf_private": false
2292
+ },
2293
  {
2294
  "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2295
  "type": "chat",
 
2329
  "hf_private": true
2330
  },
2331
  {
2332
+ "name": "mistral/mistral-medium-latest",
2333
  "type": "chat",
2334
  "input_price_per_1m": 0.4,
2335
+ "output_price_per_1m": 2,
2336
  "currency": "USD",
2337
  "context_window": 131072,
 
 
 
2338
  "hf_private": true
2339
  },
2340
  {
2341
+ "name": "mistral/devstral-medium-2507",
2342
+ "type": "chat",
2343
  "input_price_per_1m": 0.4,
2344
+ "output_price_per_1m": 2,
2345
  "currency": "USD",
2346
+ "context_window": 131072,
2347
  "capabilities": [
2348
+ "tools"
2349
  ],
 
2350
  "hf_private": true
2351
  },
2352
  {
 
2359
  "hf_private": true
2360
  },
2361
  {
2362
+ "name": "nebius/deepseek-ai/DeepSeek-V3-0324",
 
 
 
 
 
 
 
 
 
2363
  "type": "chat",
2364
+ "input_price_per_1m": 0.5,
2365
+ "output_price_per_1m": 1.5,
2366
  "currency": "USD",
2367
+ "context_window": 128000,
2368
  "capabilities": [
2369
+ "tools",
2370
+ "reasoning"
2371
  ],
2372
+ "size_b": 685,
2373
+ "hf_id": "deepseek-ai/DeepSeek-V3-0324",
2374
+ "hf_private": false
2375
  },
2376
  {
2377
  "name": "nebius/moonshotai/Kimi-K2-Instruct",
 
2384
  "tools"
2385
  ],
2386
  "hf_id": "moonshotai/Kimi-K2-Instruct",
2387
+ "size_b": 1026.5,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2388
  "hf_private": false
2389
  },
2390
  {
 
2429
  "hf_private": true
2430
  },
2431
  {
2432
+ "name": "vertex/gemini-3.1-flash-image-preview",
2433
  "type": "vision",
2434
  "input_price_per_1m": 0.5,
2435
+ "output_price_per_1m": 2,
2436
  "currency": "USD",
2437
  "capabilities": [
2438
  "vision",
2439
  "reasoning"
2440
  ],
2441
+ "context_window": 131072,
2442
  "hf_private": true
2443
  },
2444
  {
2445
+ "name": "vertex/gemini-3-flash-preview",
2446
  "type": "vision",
2447
  "input_price_per_1m": 0.5,
2448
+ "output_price_per_1m": 3,
2449
  "currency": "USD",
2450
  "capabilities": [
2451
  "vision",
2452
  "reasoning"
2453
  ],
2454
+ "context_window": 1048576,
2455
  "hf_private": true
2456
  },
2457
  {
 
2521
  "size_b": 1026.5,
2522
  "hf_private": false
2523
  },
2524
+ {
2525
+ "name": "alibaba/qwen3.5",
2526
+ "type": "vision",
2527
+ "input_price_per_1m": 0.6,
2528
+ "output_price_per_1m": 3.6,
2529
+ "currency": "USD",
2530
+ "capabilities": [
2531
+ "vision",
2532
+ "reasoning"
2533
+ ],
2534
+ "context_window": 256000,
2535
+ "size_b": 9,
2536
+ "hf_id": "Qwen/Qwen3.5-9B",
2537
+ "hf_private": false
2538
+ },
2539
  {
2540
  "name": "nebius/zai-org/GLM-4.5",
2541
  "type": "chat",
 
2582
  "hf_private": false
2583
  },
2584
  {
2585
+ "name": "deepinfra/zai-org/GLM-4.5",
2586
+ "type": "chat",
2587
  "input_price_per_1m": 0.6,
2588
+ "output_price_per_1m": 2.2,
2589
  "currency": "USD",
2590
+ "context_window": 131072,
2591
  "capabilities": [
2592
+ "tools",
2593
  "reasoning"
2594
  ],
2595
+ "hf_id": "zai-org/GLM-4.5",
2596
+ "size_b": 358.3,
 
2597
  "hf_private": false
2598
  },
2599
  {
2600
+ "name": "zai/GLM-4.6",
2601
+ "type": "chat",
2602
  "input_price_per_1m": 0.6,
2603
+ "output_price_per_1m": 2.2,
2604
  "currency": "USD",
2605
  "capabilities": [
 
2606
  "reasoning"
2607
  ],
2608
  "context_window": 200000,
2609
+ "hf_id": "zai-org/GLM-4.6",
2610
+ "size_b": 356.8,
2611
+ "hf_private": false
 
2612
  },
2613
  {
2614
+ "name": "zai/GLM-4.7",
2615
  "type": "chat",
2616
  "input_price_per_1m": 0.6,
2617
  "output_price_per_1m": 2.2,
2618
  "currency": "USD",
 
2619
  "capabilities": [
 
2620
  "reasoning"
2621
  ],
2622
+ "context_window": 200000,
2623
+ "hf_id": "zai-org/GLM-4.7",
2624
  "size_b": 358.3,
2625
  "hf_private": false
2626
  },
 
2639
  "hf_private": false
2640
  },
2641
  {
2642
+ "name": "minimaxi/MiniMax-M2.7-highspeed",
2643
+ "type": "vision",
2644
  "input_price_per_1m": 0.6,
2645
+ "output_price_per_1m": 2.4,
2646
  "currency": "USD",
2647
  "capabilities": [
2648
+ "vision",
2649
  "reasoning"
2650
  ],
2651
  "context_window": 200000,
2652
+ "hf_id": "MiniMaxAI/MiniMax-M2.7",
2653
+ "hf_private": false,
2654
+ "size_b": 230,
2655
+ "size_source": "manual"
2656
  },
2657
  {
2658
+ "name": "minimaxi/MiniMax-M2.5-highspeed",
2659
+ "type": "vision",
2660
  "input_price_per_1m": 0.6,
2661
+ "output_price_per_1m": 2.4,
2662
  "currency": "USD",
2663
  "capabilities": [
2664
+ "vision",
2665
  "reasoning"
2666
  ],
2667
  "context_window": 200000,
2668
+ "hf_id": "MiniMaxAI/MiniMax-M2.5",
2669
+ "size_b": 228.7,
2670
  "hf_private": false
2671
  },
2672
  {
2673
+ "name": "moonshot/kimi-k2-thinking",
2674
+ "type": "chat",
2675
  "input_price_per_1m": 0.6,
2676
+ "output_price_per_1m": 2.5,
2677
  "currency": "USD",
2678
+ "context_window": 131072,
2679
  "capabilities": [
2680
+ "tools"
 
2681
  ],
2682
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2683
+ "size_b": 1026.5,
 
2684
  "hf_private": false
2685
  },
2686
  {
 
2741
  "size_b": 1026.5,
2742
  "hf_private": false
2743
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2744
  {
2745
  "name": "novita/microsoft/wizardlm-2-8x22b",
2746
  "type": "chat",
 
2765
  "context_window": 400000,
2766
  "hf_private": true
2767
  },
2768
+ {
2769
+ "name": "parasail/parasail-qwen25-vl-72b-instruct",
2770
+ "type": "vision",
2771
+ "input_price_per_1m": 0.7,
2772
+ "output_price_per_1m": 0.7,
2773
+ "currency": "USD",
2774
+ "capabilities": [
2775
+ "vision"
2776
+ ],
2777
+ "context_window": 32768,
2778
+ "size_b": 72,
2779
+ "hf_private": false
2780
+ },
2781
  {
2782
  "name": "novita/deepseek/deepseek-r1-turbo",
2783
  "type": "chat",
 
2805
  "hf_private": false
2806
  },
2807
  {
2808
+ "name": "openai-responses/gpt-5.4-mini",
 
 
 
 
 
 
 
 
 
 
 
 
 
2809
  "type": "vision",
2810
  "input_price_per_1m": 0.75,
2811
  "output_price_per_1m": 4.5,
 
2818
  "hf_private": true
2819
  },
2820
  {
2821
+ "name": "openai/gpt-5.4-mini",
2822
  "type": "vision",
2823
  "input_price_per_1m": 0.75,
2824
  "output_price_per_1m": 4.5,
 
2846
  "hf_private": false
2847
  },
2848
  {
2849
+ "name": "novita/qwen/qwen2.5-vl-72b-instruct",
2850
  "type": "chat",
2851
  "input_price_per_1m": 0.8,
2852
  "output_price_per_1m": 0.8,
2853
  "currency": "USD",
2854
+ "context_window": 96000,
2855
+ "size_b": 72,
2856
  "capabilities": [
2857
+ "vision"
2858
  ],
2859
+ "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
2860
  "hf_private": false
2861
  },
2862
  {
2863
+ "name": "novita/deepseek/deepseek-r1-distill-llama-70b",
2864
  "type": "chat",
2865
  "input_price_per_1m": 0.8,
2866
  "output_price_per_1m": 0.8,
2867
  "currency": "USD",
2868
+ "context_window": 32000,
2869
+ "size_b": 70,
2870
  "capabilities": [
2871
+ "reasoning"
2872
  ],
2873
+ "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
2874
  "hf_private": false
2875
  },
2876
  {
 
2884
  "hf_private": false
2885
  },
2886
  {
2887
+ "name": "deepinfra/deepseek-ai/DeepSeek-V3",
2888
  "type": "chat",
2889
  "input_price_per_1m": 0.85,
2890
+ "output_price_per_1m": 0.9,
2891
  "currency": "USD",
2892
+ "context_window": 128000,
2893
  "capabilities": [
2894
  "tools",
2895
  "reasoning"
2896
  ],
2897
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2898
  "size_b": 671,
 
2899
  "hf_private": false
2900
  },
2901
  {
2902
+ "name": "deepinfra/deepseek-ai/DeepSeek-R1",
2903
  "type": "chat",
2904
  "input_price_per_1m": 0.85,
2905
+ "output_price_per_1m": 2.5,
2906
  "currency": "USD",
2907
+ "context_window": 64000,
2908
  "capabilities": [
2909
  "tools",
2910
  "reasoning"
2911
  ],
2912
+ "hf_id": "deepseek-ai/DeepSeek-R1",
2913
  "size_b": 671,
2914
+ "size_source": "manual",
2915
  "hf_private": false
2916
  },
2917
  {
 
2927
  "hf_private": true
2928
  },
2929
  {
2930
+ "name": "together/meta-llama/Llama-3.3-70B-Instruct-Turbo",
2931
  "type": "chat",
2932
  "input_price_per_1m": 0.88,
2933
  "output_price_per_1m": 0.88,
2934
  "currency": "USD",
2935
  "context_window": 131072,
2936
  "size_b": 70,
2937
+ "capabilities": [
2938
+ "tools"
2939
+ ],
2940
+ "hf_id": "meta-llama/Llama-3.3-70B-Instruct",
2941
  "hf_private": false
2942
  },
2943
  {
2944
+ "name": "together/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
2945
  "type": "chat",
2946
  "input_price_per_1m": 0.88,
2947
  "output_price_per_1m": 0.88,
2948
  "currency": "USD",
2949
  "context_window": 131072,
2950
  "size_b": 70,
 
 
 
 
2951
  "hf_private": false
2952
  },
2953
  {
 
2974
  "context_window": 131072,
2975
  "hf_private": true
2976
  },
2977
+ {
2978
+ "name": "alibaba/qwen3-coder-plus",
2979
+ "type": "vision",
2980
+ "input_price_per_1m": 1,
2981
+ "output_price_per_1m": 5,
2982
+ "currency": "USD",
2983
+ "capabilities": [
2984
+ "vision"
2985
+ ],
2986
+ "context_window": 1048576,
2987
+ "hf_private": true
2988
+ },
2989
  {
2990
  "name": "openai/o3",
2991
  "type": "vision",
 
3000
  "hf_private": true
3001
  },
3002
  {
3003
+ "name": "perplexity/sonar",
3004
  "type": "chat",
3005
  "input_price_per_1m": 1,
3006
+ "output_price_per_1m": 1,
3007
  "currency": "USD",
3008
+ "context_window": 131072,
3009
  "capabilities": [
3010
+ "vision"
3011
  ],
3012
+ "hf_private": true
 
 
 
3013
  },
3014
  {
3015
+ "name": "bedrock/claude-haiku-4-5",
3016
  "type": "vision",
3017
  "input_price_per_1m": 1,
3018
+ "output_price_per_1m": 5,
3019
  "currency": "USD",
3020
  "capabilities": [
3021
+ "vision"
 
3022
  ],
3023
  "context_window": 200000,
3024
+ "hf_private": true
 
 
3025
  },
3026
  {
3027
+ "name": "anthropic/claude-haiku-4-5",
3028
  "type": "vision",
3029
  "input_price_per_1m": 1,
3030
  "output_price_per_1m": 5,
 
3036
  "hf_private": true
3037
  },
3038
  {
3039
+ "name": "novita/GLM-5",
3040
+ "type": "chat",
3041
+ "input_price_per_1m": 1,
3042
+ "output_price_per_1m": 3.2,
3043
+ "currency": "USD",
3044
+ "capabilities": [
3045
+ "reasoning"
3046
+ ],
3047
+ "context_window": 202800,
3048
+ "hf_id": "zai-org/GLM-5",
3049
+ "size_b": 753.9,
3050
+ "hf_private": false
3051
+ },
3052
+ {
3053
+ "name": "vertex/claude-haiku-4-5",
3054
  "type": "vision",
3055
  "input_price_per_1m": 1,
3056
  "output_price_per_1m": 5,
 
3058
  "capabilities": [
3059
  "vision"
3060
  ],
3061
+ "context_window": 200000,
3062
  "hf_private": true
3063
  },
3064
  {
3065
+ "name": "zai/GLM-5",
3066
+ "type": "vision",
3067
  "input_price_per_1m": 1,
3068
+ "output_price_per_1m": 3.2,
3069
  "currency": "USD",
 
3070
  "capabilities": [
3071
+ "vision",
3072
+ "reasoning"
3073
  ],
3074
+ "context_window": 200000,
3075
+ "hf_id": "zai-org/GLM-5",
3076
+ "size_b": 753.9,
3077
  "hf_private": false
3078
  },
3079
  {
 
3091
  "hf_private": false
3092
  },
3093
  {
3094
+ "name": "groq/moonshotai/kimi-k2-instruct",
3095
  "type": "chat",
3096
  "input_price_per_1m": 1,
3097
+ "output_price_per_1m": 3,
3098
  "currency": "USD",
3099
  "context_window": 131072,
3100
  "capabilities": [
3101
+ "tools"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3102
  ],
3103
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
3104
+ "size_b": 1026.5,
3105
+ "hf_private": false
3106
  },
3107
  {
3108
+ "name": "openai-responses/o3-mini",
3109
  "type": "chat",
3110
  "input_price_per_1m": 1.1,
3111
  "output_price_per_1m": 4.4,
 
3117
  "hf_private": true
3118
  },
3119
  {
3120
+ "name": "openai-responses/o4-mini",
3121
  "type": "chat",
3122
  "input_price_per_1m": 1.1,
3123
  "output_price_per_1m": 4.4,
 
3129
  "hf_private": true
3130
  },
3131
  {
3132
+ "name": "openai/o3-mini",
3133
  "type": "chat",
3134
  "input_price_per_1m": 1.1,
3135
  "output_price_per_1m": 4.4,
 
3141
  "hf_private": true
3142
  },
3143
  {
3144
+ "name": "azure/o4-mini",
3145
  "type": "chat",
3146
  "input_price_per_1m": 1.1,
3147
  "output_price_per_1m": 4.4,
 
3152
  "context_window": 200000,
3153
  "hf_private": true
3154
  },
3155
+ {
3156
+ "name": "together/Qwen/Qwen2.5-72B-Instruct-Turbo",
3157
+ "type": "chat",
3158
+ "input_price_per_1m": 1.2,
3159
+ "output_price_per_1m": 1.2,
3160
+ "currency": "USD",
3161
+ "context_window": 32768,
3162
+ "size_b": 72,
3163
+ "hf_private": false
3164
+ },
3165
  {
3166
  "name": "moonshot/kimi-k2-turbo-preview",
3167
  "type": "chat",
 
3177
  "hf_private": false
3178
  },
3179
  {
3180
+ "name": "openai-responses/gpt-5.1-codex",
 
 
 
 
 
 
 
 
 
 
3181
  "type": "vision",
3182
  "input_price_per_1m": 1.25,
3183
  "output_price_per_1m": 10,
 
3186
  "vision",
3187
  "reasoning"
3188
  ],
3189
+ "context_window": 400000,
3190
  "hf_private": true
3191
  },
3192
  {
3193
+ "name": "openai-responses/gpt-5",
3194
  "type": "vision",
3195
  "input_price_per_1m": 1.25,
3196
  "output_price_per_1m": 10,
 
3203
  "hf_private": true
3204
  },
3205
  {
3206
+ "name": "openai-responses/gpt-5-codex",
3207
  "type": "vision",
3208
  "input_price_per_1m": 1.25,
3209
  "output_price_per_1m": 10,
 
3212
  "vision",
3213
  "reasoning"
3214
  ],
3215
+ "context_window": 400000,
3216
  "hf_private": true
3217
  },
3218
  {
3219
+ "name": "openai-responses/gpt-5.1",
3220
+ "type": "vision",
3221
  "input_price_per_1m": 1.25,
3222
  "output_price_per_1m": 10,
3223
  "currency": "USD",
3224
  "capabilities": [
3225
+ "vision",
3226
  "reasoning"
3227
  ],
3228
+ "context_window": 400000,
3229
  "hf_private": true
3230
  },
3231
  {
3232
+ "name": "openai/gpt-5.1",
3233
+ "type": "vision",
3234
  "input_price_per_1m": 1.25,
3235
  "output_price_per_1m": 10,
3236
  "currency": "USD",
3237
  "capabilities": [
3238
+ "vision",
3239
  "reasoning"
3240
  ],
3241
+ "context_window": 400000,
3242
  "hf_private": true
3243
  },
3244
  {
3245
+ "name": "openai/gpt-5.1-chat",
3246
  "type": "vision",
3247
  "input_price_per_1m": 1.25,
3248
  "output_price_per_1m": 10,
 
3251
  "vision",
3252
  "reasoning"
3253
  ],
3254
+ "context_window": 128000,
3255
  "hf_private": true
3256
  },
3257
  {
3258
+ "name": "openai/gpt-5-chat",
3259
  "type": "vision",
3260
  "input_price_per_1m": 1.25,
3261
  "output_price_per_1m": 10,
 
3264
  "vision",
3265
  "reasoning"
3266
  ],
3267
+ "context_window": 128000,
3268
  "hf_private": true
3269
  },
3270
  {
3271
+ "name": "google/gemini-2.5-pro",
3272
  "type": "vision",
3273
  "input_price_per_1m": 1.25,
3274
  "output_price_per_1m": 10,
 
3277
  "vision",
3278
  "reasoning"
3279
  ],
3280
+ "context_window": 1048576,
3281
  "hf_private": true
3282
  },
3283
  {
3284
+ "name": "together/deepseek-ai/DeepSeek-V3",
3285
+ "type": "chat",
3286
  "input_price_per_1m": 1.25,
3287
+ "output_price_per_1m": 1.25,
3288
  "currency": "USD",
3289
+ "context_window": 131072,
3290
  "capabilities": [
3291
+ "tools",
3292
  "reasoning"
3293
  ],
3294
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3295
+ "size_b": 671,
3296
+ "hf_private": false
3297
  },
3298
  {
3299
+ "name": "vertex/gemini-2.5-pro",
3300
  "type": "vision",
3301
  "input_price_per_1m": 1.25,
3302
  "output_price_per_1m": 10,
 
3305
  "vision",
3306
  "reasoning"
3307
  ],
3308
+ "context_window": 1048576,
3309
  "hf_private": true
3310
  },
3311
  {
3312
+ "name": "azure/gpt-5.1",
3313
+ "type": "chat",
3314
  "input_price_per_1m": 1.25,
3315
  "output_price_per_1m": 10,
3316
  "currency": "USD",
3317
  "capabilities": [
 
3318
  "reasoning"
3319
  ],
3320
+ "context_window": 200000,
3321
  "hf_private": true
3322
  },
3323
  {
3324
+ "name": "azure/gpt-5",
3325
+ "type": "chat",
3326
  "input_price_per_1m": 1.25,
3327
  "output_price_per_1m": 10,
3328
  "currency": "USD",
3329
  "capabilities": [
 
3330
  "reasoning"
3331
  ],
3332
+ "context_window": 200000,
3333
  "hf_private": true
3334
  },
3335
  {
3336
+ "name": "coding/gemini-2.5-pro",
3337
+ "type": "vision",
3338
  "input_price_per_1m": 1.25,
3339
+ "output_price_per_1m": 10,
3340
  "currency": "USD",
 
3341
  "capabilities": [
3342
+ "vision",
3343
  "reasoning"
3344
  ],
3345
+ "context_window": 1048576,
3346
+ "hf_private": true
 
3347
  },
3348
  {
3349
+ "name": "novita/sao10k/l3-70b-euryale-v2.1",
3350
  "type": "chat",
3351
  "input_price_per_1m": 1.48,
3352
  "output_price_per_1m": 1.48,
 
3356
  "hf_private": false
3357
  },
3358
  {
3359
+ "name": "novita/sao10k/l31-70b-euryale-v2.2",
3360
  "type": "chat",
3361
  "input_price_per_1m": 1.48,
3362
  "output_price_per_1m": 1.48,
 
3378
  "hf_private": true
3379
  },
3380
  {
3381
+ "name": "openai-responses/gpt-5.2",
3382
  "type": "vision",
3383
  "input_price_per_1m": 1.75,
3384
  "output_price_per_1m": 14,
 
3387
  "vision",
3388
  "reasoning"
3389
  ],
3390
+ "context_window": 400000,
3391
  "hf_private": true
3392
  },
3393
  {
3394
+ "name": "openai-responses/gpt-5.3-codex",
3395
  "type": "vision",
3396
  "input_price_per_1m": 1.75,
3397
  "output_price_per_1m": 14,
 
3404
  "hf_private": true
3405
  },
3406
  {
3407
+ "name": "openai-responses/gpt-5.3-chat",
3408
  "type": "vision",
3409
  "input_price_per_1m": 1.75,
3410
  "output_price_per_1m": 14,
 
3417
  "hf_private": true
3418
  },
3419
  {
3420
+ "name": "openai-responses/gpt-5.2-codex",
3421
+ "type": "vision",
3422
  "input_price_per_1m": 1.75,
3423
  "output_price_per_1m": 14,
3424
  "currency": "USD",
3425
  "capabilities": [
3426
+ "vision",
3427
  "reasoning"
3428
  ],
3429
+ "context_window": 400000,
3430
  "hf_private": true
3431
  },
3432
  {
3433
+ "name": "openai/gpt-5.3-chat",
3434
  "type": "vision",
3435
  "input_price_per_1m": 1.75,
3436
  "output_price_per_1m": 14,
 
3439
  "vision",
3440
  "reasoning"
3441
  ],
3442
+ "context_window": 128000,
3443
  "hf_private": true
3444
  },
3445
  {
3446
+ "name": "openai/gpt-5.2",
3447
  "type": "vision",
3448
  "input_price_per_1m": 1.75,
3449
  "output_price_per_1m": 14,
 
3456
  "hf_private": true
3457
  },
3458
  {
3459
+ "name": "openai/gpt-5.2-chat",
3460
  "type": "vision",
3461
  "input_price_per_1m": 1.75,
3462
  "output_price_per_1m": 14,
 
3465
  "vision",
3466
  "reasoning"
3467
  ],
3468
+ "context_window": 128000,
3469
  "hf_private": true
3470
  },
3471
  {
3472
+ "name": "azure/gpt-5.2",
3473
+ "type": "chat",
3474
  "input_price_per_1m": 1.75,
3475
  "output_price_per_1m": 14,
3476
  "currency": "USD",
3477
  "capabilities": [
 
3478
  "reasoning"
3479
  ],
3480
+ "context_window": 200000,
3481
  "hf_private": true
3482
  },
3483
  {
3484
+ "name": "azure/gpt-5.3-codex",
3485
  "type": "vision",
3486
  "input_price_per_1m": 1.75,
3487
  "output_price_per_1m": 14,
 
3490
  "vision",
3491
  "reasoning"
3492
  ],
3493
+ "context_window": 400000,
3494
  "hf_private": true
3495
  },
3496
  {
3497
+ "name": "azure/openai-responses/gpt-5.2-codex",
3498
  "type": "vision",
3499
  "input_price_per_1m": 1.75,
3500
  "output_price_per_1m": 14,
 
3506
  "context_window": 400000,
3507
  "hf_private": true
3508
  },
3509
+ {
3510
+ "name": "openai-responses/gpt-4.1",
3511
+ "type": "vision",
3512
+ "input_price_per_1m": 2,
3513
+ "output_price_per_1m": 8,
3514
+ "currency": "USD",
3515
+ "capabilities": [
3516
+ "vision"
3517
+ ],
3518
+ "context_window": 1047576,
3519
+ "hf_private": true
3520
+ },
3521
  {
3522
  "name": "openai/o4-mini-deep-research",
3523
  "type": "vision",
 
3553
  "hf_private": true
3554
  },
3555
  {
3556
+ "name": "perplexity/sonar-reasoning-pro",
 
 
 
 
 
 
 
 
 
 
 
 
 
3557
  "type": "chat",
3558
  "input_price_per_1m": 2,
 
 
 
 
 
 
 
 
 
3559
  "output_price_per_1m": 8,
3560
  "currency": "USD",
3561
+ "context_window": 131072,
3562
  "capabilities": [
3563
+ "vision",
3564
+ "reasoning"
3565
  ],
 
3566
  "hf_private": true
3567
  },
3568
  {
3569
+ "name": "google/gemini-3.1-pro-preview",
3570
  "type": "vision",
3571
  "input_price_per_1m": 2,
3572
+ "output_price_per_1m": 12,
 
 
 
 
 
 
 
 
 
 
 
 
3573
  "currency": "USD",
 
3574
  "capabilities": [
3575
  "vision",
3576
  "reasoning"
3577
  ],
3578
+ "context_window": 1048576,
3579
  "hf_private": true
3580
  },
3581
  {
 
3592
  "hf_private": true
3593
  },
3594
  {
3595
+ "name": "xai/grok-4.2-beta",
3596
  "type": "vision",
3597
  "input_price_per_1m": 2,
3598
+ "output_price_per_1m": 6,
3599
  "currency": "USD",
3600
  "capabilities": [
3601
  "vision",
3602
  "reasoning"
3603
  ],
3604
+ "context_window": 2000000,
3605
  "hf_private": true
3606
  },
3607
  {
3608
+ "name": "xai/grok-2-1212",
3609
+ "type": "chat",
3610
  "input_price_per_1m": 2,
3611
+ "output_price_per_1m": 10,
3612
  "currency": "USD",
3613
+ "context_window": 131072,
 
 
 
3614
  "hf_private": true
3615
  },
3616
  {
 
3652
  "context_window": 1048576,
3653
  "hf_private": true
3654
  },
3655
+ {
3656
+ "name": "azure/gpt-4.1",
3657
+ "type": "vision",
3658
+ "input_price_per_1m": 2,
3659
+ "output_price_per_1m": 8,
3660
+ "currency": "USD",
3661
+ "capabilities": [
3662
+ "vision"
3663
+ ],
3664
+ "context_window": 1047576,
3665
+ "hf_private": true
3666
+ },
3667
+ {
3668
+ "name": "azure/openai-responses/gpt-4.1",
3669
+ "type": "vision",
3670
+ "input_price_per_1m": 2,
3671
+ "output_price_per_1m": 8,
3672
+ "currency": "USD",
3673
+ "capabilities": [
3674
+ "vision"
3675
+ ],
3676
+ "context_window": 1047576,
3677
+ "hf_private": true
3678
+ },
3679
  {
3680
  "name": "mistral/pixtral-large-latest",
3681
  "type": "chat",
 
3686
  "hf_private": true
3687
  },
3688
  {
3689
+ "name": "openai-responses/gpt-5.4",
3690
  "type": "vision",
3691
  "input_price_per_1m": 2.5,
3692
  "output_price_per_1m": 15,
 
3699
  "hf_private": true
3700
  },
3701
  {
3702
+ "name": "openai/gpt-4o-2024-08-06",
3703
  "type": "vision",
3704
  "input_price_per_1m": 2.5,
3705
  "output_price_per_1m": 10,
 
3711
  "hf_private": true
3712
  },
3713
  {
3714
+ "name": "openai/gpt-5.4",
3715
  "type": "vision",
3716
  "input_price_per_1m": 2.5,
3717
+ "output_price_per_1m": 15,
3718
  "currency": "USD",
3719
  "capabilities": [
3720
+ "vision",
3721
+ "reasoning"
3722
  ],
3723
+ "context_window": 1050000,
3724
  "hf_private": true
3725
  },
3726
  {
3727
+ "name": "openai/gpt-4o",
3728
  "type": "vision",
3729
  "input_price_per_1m": 2.5,
3730
  "output_price_per_1m": 10,
 
3736
  "hf_private": true
3737
  },
3738
  {
3739
+ "name": "openai/gpt-4o-2024-11-20",
3740
  "type": "vision",
3741
  "input_price_per_1m": 2.5,
3742
  "output_price_per_1m": 10,
 
3748
  "hf_private": true
3749
  },
3750
  {
3751
+ "name": "openai/gpt-4o-2024-05-13",
3752
  "type": "vision",
3753
  "input_price_per_1m": 2.5,
3754
+ "output_price_per_1m": 10,
3755
  "currency": "USD",
3756
  "capabilities": [
3757
+ "vision"
 
3758
  ],
3759
+ "context_window": 128000,
3760
  "hf_private": true
3761
  },
3762
  {
3763
+ "name": "azure/openai-responses/gpt-5.4",
3764
  "type": "vision",
3765
  "input_price_per_1m": 2.5,
3766
  "output_price_per_1m": 15,
 
3773
  "hf_private": true
3774
  },
3775
  {
3776
+ "name": "perplexity/sonar-pro",
3777
+ "type": "chat",
3778
  "input_price_per_1m": 3,
3779
  "output_price_per_1m": 15,
3780
  "currency": "USD",
3781
+ "context_window": 204800,
3782
  "capabilities": [
3783
  "vision"
3784
  ],
 
3785
  "hf_private": true
3786
  },
3787
  {
3788
+ "name": "bedrock/claude-3-7-sonnet",
3789
  "type": "vision",
3790
  "input_price_per_1m": 3,
3791
  "output_price_per_1m": 15,
 
3794
  "vision",
3795
  "reasoning"
3796
  ],
3797
+ "context_window": 200000,
3798
  "hf_private": true
3799
  },
3800
  {
3801
+ "name": "bedrock/claude-sonnet-4-6",
3802
  "type": "vision",
3803
  "input_price_per_1m": 3,
3804
  "output_price_per_1m": 15,
 
3807
  "vision",
3808
  "reasoning"
3809
  ],
3810
+ "context_window": 1000000,
3811
  "hf_private": true
3812
  },
3813
  {
 
3824
  "hf_private": true
3825
  },
3826
  {
3827
+ "name": "bedrock/claude-sonnet-4",
3828
  "type": "vision",
3829
  "input_price_per_1m": 3,
3830
  "output_price_per_1m": 15,
 
3837
  "hf_private": true
3838
  },
3839
  {
3840
+ "name": "anthropic/claude-sonnet-4-6",
3841
  "type": "vision",
3842
  "input_price_per_1m": 3,
3843
  "output_price_per_1m": 15,
 
3846
  "vision",
3847
  "reasoning"
3848
  ],
3849
+ "context_window": 1000000,
3850
  "hf_private": true
3851
  },
3852
  {
3853
+ "name": "anthropic/claude-sonnet-4-5",
3854
+ "type": "vision",
3855
  "input_price_per_1m": 3,
3856
  "output_price_per_1m": 15,
3857
  "currency": "USD",
 
3858
  "capabilities": [
3859
+ "vision",
3860
+ "reasoning"
3861
  ],
3862
+ "context_window": 1000000,
3863
  "hf_private": true
3864
  },
3865
  {
3866
+ "name": "anthropic/claude-sonnet-4",
3867
  "type": "vision",
3868
  "input_price_per_1m": 3,
3869
  "output_price_per_1m": 15,
 
3872
  "vision",
3873
  "reasoning"
3874
  ],
3875
+ "context_window": 1000000,
3876
  "hf_private": true
3877
  },
3878
  {
3879
+ "name": "xai/grok-4",
3880
  "type": "vision",
3881
  "input_price_per_1m": 3,
3882
  "output_price_per_1m": 15,
 
3884
  "capabilities": [
3885
  "vision"
3886
  ],
3887
+ "context_window": 256000,
3888
  "hf_private": true
3889
  },
3890
  {
3891
+ "name": "together/deepseek-ai/DeepSeek-R1",
3892
+ "type": "chat",
3893
  "input_price_per_1m": 3,
3894
+ "output_price_per_1m": 7,
3895
  "currency": "USD",
3896
+ "context_window": 64000,
3897
  "capabilities": [
3898
+ "tools",
3899
  "reasoning"
3900
  ],
3901
+ "hf_id": "deepseek-ai/DeepSeek-R1",
3902
+ "size_b": 671,
3903
+ "size_source": "manual",
3904
+ "hf_private": false
3905
  },
3906
  {
3907
+ "name": "vertex/claude-3-5-sonnet",
3908
  "type": "vision",
3909
  "input_price_per_1m": 3,
3910
  "output_price_per_1m": 15,
3911
  "currency": "USD",
3912
  "capabilities": [
3913
+ "vision"
 
3914
  ],
3915
  "context_window": 200000,
3916
  "hf_private": true
3917
  },
3918
  {
3919
+ "name": "vertex/claude-sonnet-4",
3920
  "type": "vision",
3921
  "input_price_per_1m": 3,
3922
  "output_price_per_1m": 15,
 
3925
  "vision",
3926
  "reasoning"
3927
  ],
3928
+ "context_window": 200000,
3929
  "hf_private": true
3930
  },
3931
  {
3932
+ "name": "vertex/claude-sonnet-4-5",
3933
  "type": "vision",
3934
  "input_price_per_1m": 3,
3935
  "output_price_per_1m": 15,
 
3938
  "vision",
3939
  "reasoning"
3940
  ],
3941
+ "context_window": 200000,
3942
  "hf_private": true
3943
  },
3944
  {
3945
+ "name": "vertex/claude-3-7-sonnet",
3946
  "type": "vision",
3947
  "input_price_per_1m": 3,
3948
  "output_price_per_1m": 15,
 
3951
  "vision",
3952
  "reasoning"
3953
  ],
3954
+ "context_window": 200000,
3955
  "hf_private": true
3956
  },
3957
  {
3958
+ "name": "coding/claude-sonnet-4-20250514",
3959
+ "type": "vision",
3960
  "input_price_per_1m": 3,
3961
+ "output_price_per_1m": 15,
3962
  "currency": "USD",
 
3963
  "capabilities": [
3964
+ "vision",
3965
  "reasoning"
3966
  ],
3967
+ "context_window": 200000,
3968
+ "hf_private": true
 
 
3969
  },
3970
  {
3971
  "name": "novita/deepseek/deepseek-r1",
 
3995
  "context_window": 128000,
3996
  "hf_private": true
3997
  },
 
 
 
 
 
 
 
 
 
 
 
 
3998
  {
3999
  "name": "bedrock/claude-opus-4-5",
4000
  "type": "vision",
 
4022
  "hf_private": true
4023
  },
4024
  {
4025
+ "name": "anthropic/claude-opus-4-6",
4026
  "type": "vision",
4027
  "input_price_per_1m": 5,
4028
  "output_price_per_1m": 25,
 
4035
  "hf_private": true
4036
  },
4037
  {
4038
+ "name": "anthropic/claude-opus-4-5",
4039
  "type": "vision",
4040
  "input_price_per_1m": 5,
4041
  "output_price_per_1m": 25,
 
4048
  "hf_private": true
4049
  },
4050
  {
4051
+ "name": "xai/grok-3",
4052
+ "type": "chat",
4053
+ "input_price_per_1m": 5,
4054
+ "output_price_per_1m": 25,
4055
+ "currency": "USD",
4056
+ "context_window": 131072,
4057
+ "capabilities": [
4058
+ "tools"
4059
+ ],
4060
+ "hf_private": true
4061
+ },
4062
+ {
4063
+ "name": "vertex/claude-opus-4-5",
4064
  "type": "vision",
4065
  "input_price_per_1m": 5,
4066
  "output_price_per_1m": 25,
 
4069
  "vision",
4070
  "reasoning"
4071
  ],
4072
+ "context_window": 200000,
4073
  "hf_private": true
4074
  },
4075
  {
4076
+ "name": "vertex/claude-opus-4-6",
4077
  "type": "vision",
4078
  "input_price_per_1m": 5,
4079
  "output_price_per_1m": 25,
 
4082
  "vision",
4083
  "reasoning"
4084
  ],
4085
+ "context_window": 1000000,
4086
  "hf_private": true
4087
  },
4088
  {
 
4099
  "hf_private": true
4100
  },
4101
  {
4102
+ "name": "openai-responses/gpt-5-pro",
4103
  "type": "vision",
4104
  "input_price_per_1m": 15,
4105
+ "output_price_per_1m": 120,
4106
  "currency": "USD",
4107
  "capabilities": [
4108
  "vision",
4109
  "reasoning"
4110
  ],
4111
+ "context_window": 400000,
4112
  "hf_private": true
4113
  },
4114
  {
4115
+ "name": "openai/o1",
4116
  "type": "vision",
4117
  "input_price_per_1m": 15,
4118
+ "output_price_per_1m": 60,
4119
  "currency": "USD",
4120
  "capabilities": [
4121
  "vision",
 
4125
  "hf_private": true
4126
  },
4127
  {
4128
+ "name": "bedrock/claude-opus-4",
4129
  "type": "vision",
4130
  "input_price_per_1m": 15,
4131
  "output_price_per_1m": 75,
 
4138
  "hf_private": true
4139
  },
4140
  {
4141
+ "name": "anthropic/claude-opus-4",
4142
  "type": "vision",
4143
  "input_price_per_1m": 15,
4144
+ "output_price_per_1m": 75,
4145
  "currency": "USD",
4146
  "capabilities": [
4147
  "vision",
4148
  "reasoning"
4149
  ],
4150
+ "context_window": 200000,
4151
  "hf_private": true
4152
  },
4153
  {
4154
+ "name": "anthropic/claude-opus-4-1",
4155
  "type": "vision",
4156
  "input_price_per_1m": 15,
4157
  "output_price_per_1m": 75,
 
4177
  "hf_private": true
4178
  },
4179
  {
4180
+ "name": "vertex/claude-opus-4-1",
4181
  "type": "vision",
4182
  "input_price_per_1m": 15,
4183
  "output_price_per_1m": 75,
 
4190
  "hf_private": true
4191
  },
4192
  {
4193
+ "name": "coding/claude-opus-4-20250514",
4194
  "type": "vision",
4195
  "input_price_per_1m": 15,
4196
  "output_price_per_1m": 75,
 
4216
  "hf_private": true
4217
  },
4218
  {
4219
+ "name": "openai-responses/gpt-5.4-pro",
4220
  "type": "vision",
4221
  "input_price_per_1m": 30,
4222
  "output_price_per_1m": 180,
 
4229
  "hf_private": true
4230
  },
4231
  {
4232
+ "name": "openai/gpt-5.4-pro",
4233
  "type": "vision",
4234
  "input_price_per_1m": 30,
4235
  "output_price_per_1m": 180,
 
4242
  "hf_private": true
4243
  },
4244
  {
4245
+ "name": "azure/openai-responses/gpt-5.4-pro",
4246
  "type": "vision",
4247
  "input_price_per_1m": 30,
4248
  "output_price_per_1m": 180,
 
5091
  ],
5092
  "hf_id": "mistralai/Voxtral-Small-24B-2507",
5093
  "hf_private": false,
5094
+ "price_per_minute": 0.15,
5095
+ "size_source": "manual"
5096
  },
5097
  {
5098
  "name": "gemma-3-27b-it",
 
5176
  "capabilities": [
5177
  "tools"
5178
  ],
5179
+ "size_b": 123,
5180
+ "hf_id": "mistralai/Mistral-Large-Instruct-2407",
5181
  "hf_private": false,
5182
  "ollama_id": "mistral-large",
5183
  "size_source": "manual"
 
5222
  "currency": "USD",
5223
  "api_endpoint": "devstral-medium-latest",
5224
  "ollama_id": "devstral-2",
5225
+ "size_b": 123,
5226
+ "hf_id": "mistralai/Devstral-2-123B-Instruct-2512",
5227
+ "hf_private": false,
5228
+ "size_source": "manual",
5229
+ "capabilities": [
5230
+ "tools"
5231
+ ]
5232
  },
5233
  {
5234
  "name": "Devstral Small 2",
 
5337
  "type": "audio",
5338
  "currency": "USD",
5339
  "api_endpoint": "voxtral-mini-latest",
5340
+ "hf_private": false,
5341
  "price_per_minute": 0.003,
5342
  "capabilities": [
5343
  "audio",
5344
  "tools"
5345
+ ],
5346
+ "size_b": 3,
5347
+ "size_source": "manual",
5348
+ "hf_id": "mistralai/Voxtral-Mini-3B-2507"
5349
  },
5350
  {
5351
  "name": "Voxtral Realtime",
5352
  "type": "audio",
5353
  "currency": "USD",
5354
  "api_endpoint": "voxtral-mini-latest",
5355
+ "hf_private": false,
5356
  "price_per_minute": 0.006,
5357
  "capabilities": [
5358
  "audio",
5359
  "tools"
5360
+ ],
5361
+ "size_b": 4,
5362
+ "size_source": "manual",
5363
+ "hf_id": "mistralai/Voxtral-Mini-4B-Realtime-2602"
5364
  },
5365
  {
5366
  "name": "Voxtral Small",
 
5375
  ],
5376
  "size_b": 24,
5377
  "hf_id": "mistralai/Voxtral-Small-24B-2507",
5378
+ "hf_private": false,
5379
+ "size_source": "manual"
5380
  },
5381
  {
5382
  "name": "Voxtral Mini",
 
5385
  "output_price_per_1m": 0.04,
5386
  "currency": "USD",
5387
  "api_endpoint": "voxtral-mini-latest",
5388
+ "hf_private": false,
5389
  "capabilities": [
5390
  "audio",
5391
  "tools"
5392
+ ],
5393
+ "size_b": 3,
5394
+ "size_source": "manual",
5395
+ "hf_id": "mistralai/Voxtral-Mini-3B-2507"
5396
  },
5397
  {
5398
  "name": "Classifier API model 8B",
 
6344
  ],
6345
  "size_b": 24,
6346
  "hf_private": false,
6347
+ "audio_price_per_1m": 100,
6348
+ "size_source": "manual"
6349
  },
6350
  {
6351
  "name": "nvidia/llama-3.3-nemotron-super-49b-v1.5",
 
7744
  "tools"
7745
  ],
7746
  "size_b": 123,
7747
+ "hf_private": false,
7748
+ "size_source": "manual"
7749
  },
7750
  {
7751
  "name": "deepseek/deepseek-v3.2-speciale",
scripts/fetch-providers.js CHANGED
@@ -207,6 +207,15 @@ const MANUAL_HF_ID_MAP = {
207
  'gemini 3.1 pro': 'google/gemini-3.1-pro-preview',
208
  'gemini 3.1 flash lite': 'google/gemini-3.1-flash-lite-preview',
209
  'gemini 3 flash': 'google/gemini-3-flash-preview',
 
 
 
 
 
 
 
 
 
210
  };
211
 
212
  const MANUAL_OLLAMA_ID_MAP = {
@@ -238,6 +247,14 @@ const MANUAL_SIZE_MAP = {
238
  'google/gemini-3.1-flash-lite-preview': 371,
239
  'google/gemini-3-flash-preview': 1000,
240
  'xiaomi/mimo-v2-omni': 186,
 
 
 
 
 
 
 
 
241
  };
242
 
243
  const PROPRIETARY_KEYWORDS = [
 
207
  'gemini 3.1 pro': 'google/gemini-3.1-pro-preview',
208
  'gemini 3.1 flash lite': 'google/gemini-3.1-flash-lite-preview',
209
  'gemini 3 flash': 'google/gemini-3-flash-preview',
210
+ 'voxtral mini': 'mistralai/Voxtral-Mini-3B-2507',
211
+ 'voxtral realtime': 'mistralai/Voxtral-Mini-4B-Realtime-2602',
212
+ 'voxtral mini transcribe 2': 'mistralai/Voxtral-Mini-3B-2507',
213
+ 'voxtral small': 'mistralai/Voxtral-Small-24B-2507',
214
+ 'mistral large 3': 'mistralai/Mistral-Large-Instruct-2407',
215
+ 'mistral small 3': 'mistralai/Mistral-Small-Instruct-2409',
216
+ 'ministral 3 - 3b': 'mistralai/Ministral-3b-instruct-2410',
217
+ 'ministral 3 - 8b': 'mistralai/Ministral-8b-instruct-2410',
218
+ 'devstral 2': 'mistralai/Devstral-2-123B-Instruct-2512',
219
  };
220
 
221
  const MANUAL_OLLAMA_ID_MAP = {
 
247
  'google/gemini-3.1-flash-lite-preview': 371,
248
  'google/gemini-3-flash-preview': 1000,
249
  'xiaomi/mimo-v2-omni': 186,
250
+ 'mistralai/Voxtral-Mini-3B-2507': 3,
251
+ 'mistralai/Voxtral-Mini-4B-Realtime-2602': 4,
252
+ 'mistralai/Voxtral-Small-24B-2507': 24,
253
+ 'mistralai/Mistral-Large-Instruct-2407': 123,
254
+ 'mistralai/Mistral-Small-Instruct-2409': 22,
255
+ 'mistralai/Ministral-3b-instruct-2410': 3,
256
+ 'mistralai/Ministral-8b-instruct-2410': 8,
257
+ 'mistralai/Devstral-2-123B-Instruct-2512': 123,
258
  };
259
 
260
  const PROPRIETARY_KEYWORDS = [