CrispStrobe commited on
Commit
83eb519
·
1 Parent(s): b6e26aa

fix: correctly map Magistral, Pixtral Large, and Hermes 3 405B repositories

Browse files
Files changed (2) hide show
  1. data/providers.json +733 -725
  2. scripts/fetch-providers.js +3 -0
data/providers.json CHANGED
@@ -1242,16 +1242,24 @@
1242
  "hf_private": true
1243
  },
1244
  {
1245
- "name": "alibaba/qwen-turbo",
1246
  "type": "chat",
1247
  "input_price_per_1m": 0.05,
1248
- "output_price_per_1m": 0.2,
1249
  "currency": "USD",
1250
- "context_window": 1000000,
1251
- "capabilities": [
1252
- "tools"
1253
- ],
1254
- "hf_private": true
 
 
 
 
 
 
 
 
1255
  },
1256
  {
1257
  "name": "novita/meta-llama/llama-3.1-8b-instruct",
@@ -1270,24 +1278,16 @@
1270
  "hf_status": 200
1271
  },
1272
  {
1273
- "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
1274
- "type": "chat",
1275
- "input_price_per_1m": 0.05,
1276
- "output_price_per_1m": 0.05,
1277
- "currency": "USD",
1278
- "context_window": 8192,
1279
- "size_b": 8,
1280
- "hf_private": false
1281
- },
1282
- {
1283
- "name": "novita/sao10k/l3-8b-lunaris",
1284
  "type": "chat",
1285
  "input_price_per_1m": 0.05,
1286
- "output_price_per_1m": 0.05,
1287
  "currency": "USD",
1288
- "context_window": 8192,
1289
- "size_b": 8,
1290
- "hf_private": false
 
 
1291
  },
1292
  {
1293
  "name": "azure/gpt-5-nano",
@@ -1311,6 +1311,16 @@
1311
  "size_b": 3,
1312
  "hf_private": false
1313
  },
 
 
 
 
 
 
 
 
 
 
1314
  {
1315
  "name": "deepinfra/microsoft/phi-4",
1316
  "type": "chat",
@@ -1325,16 +1335,6 @@
1325
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1326
  "hf_status": 200
1327
  },
1328
- {
1329
- "name": "deepinfra/Qwen/Qwen2.5-Coder-32B-Instruct",
1330
- "type": "chat",
1331
- "input_price_per_1m": 0.07,
1332
- "output_price_per_1m": 0.16,
1333
- "currency": "USD",
1334
- "context_window": 16384,
1335
- "size_b": 32,
1336
- "hf_private": false
1337
- },
1338
  {
1339
  "name": "novita/gryphe/mythomax-l2-13b",
1340
  "type": "chat",
@@ -1348,16 +1348,6 @@
1348
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1349
  "hf_status": 200
1350
  },
1351
- {
1352
- "name": "together/meta-llama/Meta-Llama-3-8B-Instruct-Lite",
1353
- "type": "chat",
1354
- "input_price_per_1m": 0.1,
1355
- "output_price_per_1m": 0.1,
1356
- "currency": "USD",
1357
- "context_window": 8192,
1358
- "size_b": 8,
1359
- "hf_private": false
1360
- },
1361
  {
1362
  "name": "groq/openai/gpt-oss-20b",
1363
  "type": "chat",
@@ -1376,21 +1366,47 @@
1376
  "hf_status": 200
1377
  },
1378
  {
1379
- "name": "mistral/devstral-small-2507",
1380
  "type": "chat",
1381
  "input_price_per_1m": 0.1,
1382
  "output_price_per_1m": 0.3,
1383
  "currency": "USD",
1384
- "context_window": 131072,
 
1385
  "capabilities": [
1386
- "tools"
 
1387
  ],
1388
- "hf_id": "mistralai/Devstral-Small-2507",
1389
- "size_b": 24,
1390
  "hf_private": false,
1391
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1392
  "hf_status": 200
1393
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1394
  {
1395
  "name": "mistral/devstral-small-latest",
1396
  "type": "chat",
@@ -1417,49 +1433,35 @@
1417
  "hf_private": true
1418
  },
1419
  {
1420
- "name": "openai-responses/gpt-4.1-nano",
1421
- "type": "vision",
1422
- "input_price_per_1m": 0.1,
1423
- "output_price_per_1m": 0.4,
1424
- "currency": "USD",
1425
- "capabilities": [
1426
- "vision"
1427
- ],
1428
- "context_window": 1047576,
1429
- "hf_private": true
1430
- },
1431
- {
1432
- "name": "deepinfra/Qwen/Qwen3-32B",
1433
  "type": "chat",
1434
  "input_price_per_1m": 0.1,
1435
  "output_price_per_1m": 0.3,
1436
  "currency": "USD",
1437
- "context_window": 40000,
1438
- "size_b": 32,
1439
  "capabilities": [
1440
- "tools",
1441
- "reasoning"
1442
  ],
1443
- "hf_id": "Qwen/Qwen3-32B",
 
1444
  "hf_private": false,
1445
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1446
  "hf_status": 200
1447
  },
1448
  {
1449
- "name": "vertex/gemini-2.5-flash-lite",
1450
  "type": "vision",
1451
  "input_price_per_1m": 0.1,
1452
  "output_price_per_1m": 0.4,
1453
  "currency": "USD",
1454
  "capabilities": [
1455
- "vision",
1456
- "reasoning"
1457
  ],
1458
- "context_window": 1048576,
1459
  "hf_private": true
1460
  },
1461
  {
1462
- "name": "google/gemini-2.0-flash-001",
1463
  "type": "vision",
1464
  "input_price_per_1m": 0.1,
1465
  "output_price_per_1m": 0.4,
@@ -1467,11 +1469,21 @@
1467
  "capabilities": [
1468
  "vision"
1469
  ],
1470
- "context_window": 1048576,
1471
  "hf_private": true
1472
  },
1473
  {
1474
- "name": "google/gemini-2.5-flash-lite",
 
 
 
 
 
 
 
 
 
 
1475
  "type": "vision",
1476
  "input_price_per_1m": 0.1,
1477
  "output_price_per_1m": 0.4,
@@ -1507,18 +1519,6 @@
1507
  "context_window": 1047576,
1508
  "hf_private": true
1509
  },
1510
- {
1511
- "name": "openai/gpt-4.1-nano",
1512
- "type": "vision",
1513
- "input_price_per_1m": 0.1,
1514
- "output_price_per_1m": 0.4,
1515
- "currency": "USD",
1516
- "capabilities": [
1517
- "vision"
1518
- ],
1519
- "context_window": 1047576,
1520
- "hf_private": true
1521
- },
1522
  {
1523
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo",
1524
  "type": "chat",
@@ -1591,6 +1591,32 @@
1591
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1592
  "hf_status": 200
1593
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1594
  {
1595
  "name": "mistral/mistral-small-latest",
1596
  "type": "vision",
@@ -1622,30 +1648,16 @@
1622
  "hf_status": 200
1623
  },
1624
  {
1625
- "name": "nebius/openai/gpt-oss-120b",
1626
- "type": "chat",
1627
  "input_price_per_1m": 0.15,
1628
  "output_price_per_1m": 0.6,
1629
  "currency": "USD",
1630
  "capabilities": [
1631
- "reasoning"
1632
  ],
1633
- "context_window": 131000,
1634
- "size_b": 120,
1635
- "hf_id": "openai/gpt-oss-120b",
1636
- "hf_private": false,
1637
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
1638
- "hf_status": 200
1639
- },
1640
- {
1641
- "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1642
- "type": "chat",
1643
- "input_price_per_1m": 0.15,
1644
- "output_price_per_1m": 0.85,
1645
- "currency": "USD",
1646
- "context_window": 262144,
1647
- "size_b": 235,
1648
- "hf_private": false
1649
  },
1650
  {
1651
  "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
@@ -1665,18 +1677,6 @@
1665
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1666
  "hf_status": 200
1667
  },
1668
- {
1669
- "name": "openai/gpt-4o-mini",
1670
- "type": "vision",
1671
- "input_price_per_1m": 0.15,
1672
- "output_price_per_1m": 0.6,
1673
- "currency": "USD",
1674
- "capabilities": [
1675
- "vision"
1676
- ],
1677
- "context_window": 128000,
1678
- "hf_private": true
1679
- },
1680
  {
1681
  "name": "novita/mistralai/mistral-nemo",
1682
  "type": "chat",
@@ -1703,29 +1703,6 @@
1703
  "size_b": 8,
1704
  "hf_private": false
1705
  },
1706
- {
1707
- "name": "together/meta-llama/LlamaGuard-2-8b",
1708
- "type": "chat",
1709
- "input_price_per_1m": 0.2,
1710
- "output_price_per_1m": 0.2,
1711
- "currency": "USD",
1712
- "context_window": 8192,
1713
- "size_b": 8,
1714
- "hf_private": false
1715
- },
1716
- {
1717
- "name": "openai-responses/gpt-5.4-nano",
1718
- "type": "vision",
1719
- "input_price_per_1m": 0.2,
1720
- "output_price_per_1m": 1.25,
1721
- "currency": "USD",
1722
- "capabilities": [
1723
- "vision",
1724
- "reasoning"
1725
- ],
1726
- "context_window": 400000,
1727
- "hf_private": true
1728
- },
1729
  {
1730
  "name": "deepinfra/zai-org/GLM-4.5-Air",
1731
  "type": "chat",
@@ -1761,54 +1738,7 @@
1761
  "hf_status": 200
1762
  },
1763
  {
1764
- "name": "alibaba/qwen3-30b-a3b-instruct-2507",
1765
- "type": "vision",
1766
- "input_price_per_1m": 0.2,
1767
- "output_price_per_1m": 0.8,
1768
- "currency": "USD",
1769
- "capabilities": [
1770
- "vision"
1771
- ],
1772
- "context_window": 131072,
1773
- "size_b": 30,
1774
- "hf_id": "Qwen/Qwen3-30B-A3B-Instruct-2507",
1775
- "hf_private": false,
1776
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
1777
- "hf_status": 200
1778
- },
1779
- {
1780
- "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1781
- "type": "chat",
1782
- "input_price_per_1m": 0.2,
1783
- "output_price_per_1m": 0.85,
1784
- "currency": "USD",
1785
- "context_window": 1048576,
1786
- "size_b": 17,
1787
- "capabilities": [
1788
- "vision",
1789
- "tools"
1790
- ],
1791
- "hf_private": false
1792
- },
1793
- {
1794
- "name": "novita/qwen/qwen3-235b-a22b-fp8",
1795
- "type": "chat",
1796
- "input_price_per_1m": 0.2,
1797
- "output_price_per_1m": 0.8,
1798
- "currency": "USD",
1799
- "context_window": 128000,
1800
- "size_b": 235,
1801
- "capabilities": [
1802
- "tools",
1803
- "reasoning"
1804
- ],
1805
- "hf_id": "Qwen/Qwen3-235B-A22B",
1806
- "hf_private": false,
1807
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
1808
- "hf_status": 200
1809
- },
1810
- {
1811
- "name": "xai/grok-4-fast-non-reasoning",
1812
  "type": "chat",
1813
  "input_price_per_1m": 0.2,
1814
  "output_price_per_1m": 0.5,
@@ -1846,7 +1776,19 @@
1846
  "hf_private": true
1847
  },
1848
  {
1849
- "name": "xai/grok-4-fast",
 
 
 
 
 
 
 
 
 
 
 
 
1850
  "type": "chat",
1851
  "input_price_per_1m": 0.2,
1852
  "output_price_per_1m": 0.5,
@@ -1860,15 +1802,16 @@
1860
  "hf_private": true
1861
  },
1862
  {
1863
- "name": "xai/grok-4-1-fast-reasoning",
1864
  "type": "vision",
1865
  "input_price_per_1m": 0.2,
1866
- "output_price_per_1m": 0.5,
1867
  "currency": "USD",
1868
  "capabilities": [
1869
- "vision"
 
1870
  ],
1871
- "context_window": 2000000,
1872
  "hf_private": true
1873
  },
1874
  {
@@ -1884,6 +1827,79 @@
1884
  "context_window": 400000,
1885
  "hf_private": true
1886
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1887
  {
1888
  "name": "deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1889
  "type": "chat",
@@ -1927,20 +1943,16 @@
1927
  "hf_status": 200
1928
  },
1929
  {
1930
- "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct",
1931
- "type": "chat",
1932
- "input_price_per_1m": 0.23,
1933
- "output_price_per_1m": 0.4,
1934
  "currency": "USD",
1935
- "context_window": 131072,
1936
- "size_b": 70,
1937
  "capabilities": [
1938
- "tools"
1939
  ],
1940
- "hf_private": false,
1941
- "hf_id": "meta-llama/Llama-3.3-70B-Instruct",
1942
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
1943
- "hf_status": 200
1944
  },
1945
  {
1946
  "name": "mistral/open-mistral-7b",
@@ -1977,18 +1989,6 @@
1977
  "context_window": 1048576,
1978
  "hf_private": true
1979
  },
1980
- {
1981
- "name": "google/gemini-3.1-flash-lite-preview",
1982
- "type": "vision",
1983
- "input_price_per_1m": 0.25,
1984
- "output_price_per_1m": 1.5,
1985
- "currency": "USD",
1986
- "capabilities": [
1987
- "vision"
1988
- ],
1989
- "context_window": 1048576,
1990
- "hf_private": true
1991
- },
1992
  {
1993
  "name": "azure/gpt-5-mini",
1994
  "type": "chat",
@@ -2044,52 +2044,33 @@
2044
  "hf_private": true
2045
  },
2046
  {
2047
- "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
2048
- "type": "chat",
2049
- "input_price_per_1m": 0.3,
2050
- "output_price_per_1m": 0.3,
2051
- "currency": "USD",
2052
- "context_window": 32768,
2053
- "size_b": 7,
2054
- "hf_private": false
2055
- },
2056
- {
2057
- "name": "mistral/codestral-latest",
2058
- "type": "chat",
2059
- "input_price_per_1m": 0.3,
2060
- "output_price_per_1m": 0.9,
2061
- "currency": "USD",
2062
- "context_window": 131072,
2063
- "hf_private": true
2064
- },
2065
- {
2066
- "name": "nebius/minimax/minimax-m2.1",
2067
  "type": "chat",
2068
  "input_price_per_1m": 0.3,
2069
- "output_price_per_1m": 1.2,
2070
  "currency": "USD",
2071
  "capabilities": [
2072
  "reasoning"
2073
  ],
2074
- "context_window": 200000,
2075
- "hf_id": "MiniMaxAI/MiniMax-M2.1",
2076
- "size_b": 228.7,
2077
  "hf_private": false,
2078
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2079
  "hf_status": 200
2080
  },
2081
  {
2082
- "name": "nebius/deepseek-ai/DeepSeek-V3.2",
2083
  "type": "chat",
2084
  "input_price_per_1m": 0.3,
2085
- "output_price_per_1m": 0.45,
2086
  "currency": "USD",
2087
  "capabilities": [
2088
  "reasoning"
2089
  ],
2090
- "context_window": 164000,
2091
- "hf_id": "deepseek-ai/DeepSeek-V3.2",
2092
- "size_b": 685.4,
2093
  "hf_private": false,
2094
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2095
  "hf_status": 200
@@ -2122,32 +2103,19 @@
2122
  "hf_private": false
2123
  },
2124
  {
2125
- "name": "alibaba/qwen3-coder-flash",
2126
- "type": "vision",
2127
- "input_price_per_1m": 0.3,
2128
- "output_price_per_1m": 1.5,
2129
- "currency": "USD",
2130
- "capabilities": [
2131
- "vision"
2132
- ],
2133
- "context_window": 1048576,
2134
- "hf_private": true
2135
- },
2136
- {
2137
- "name": "vertex/gemini-2.5-flash",
2138
- "type": "vision",
2139
  "input_price_per_1m": 0.3,
2140
- "output_price_per_1m": 2.5,
2141
  "currency": "USD",
2142
  "capabilities": [
2143
- "vision",
2144
  "reasoning"
2145
  ],
2146
- "context_window": 1048576,
2147
  "hf_private": true
2148
  },
2149
  {
2150
- "name": "vertex/gemini-2.5-flash-image",
2151
  "type": "vision",
2152
  "input_price_per_1m": 0.3,
2153
  "output_price_per_1m": 2.5,
@@ -2160,33 +2128,34 @@
2160
  "hf_private": true
2161
  },
2162
  {
2163
- "name": "coding/gemini-2.5-flash",
2164
- "type": "vision",
2165
  "input_price_per_1m": 0.3,
2166
- "output_price_per_1m": 2.5,
2167
  "currency": "USD",
2168
- "capabilities": [
2169
- "vision",
2170
- "reasoning"
2171
- ],
2172
- "context_window": 1048576,
2173
  "hf_private": true
2174
  },
2175
  {
2176
- "name": "google/gemini-2.5-flash",
2177
  "type": "vision",
2178
  "input_price_per_1m": 0.3,
2179
- "output_price_per_1m": 2.5,
2180
  "currency": "USD",
2181
  "capabilities": [
2182
  "vision",
2183
  "reasoning"
2184
  ],
2185
- "context_window": 1048576,
2186
- "hf_private": true
 
 
 
 
 
2187
  },
2188
  {
2189
- "name": "novita/minimax-m2.7",
2190
  "type": "vision",
2191
  "input_price_per_1m": 0.3,
2192
  "output_price_per_1m": 1.2,
@@ -2220,7 +2189,42 @@
2220
  "hf_status": 200
2221
  },
2222
  {
2223
- "name": "novita/MiniMax-M2.7",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2224
  "type": "vision",
2225
  "input_price_per_1m": 0.3,
2226
  "output_price_per_1m": 1.2,
@@ -2272,33 +2276,29 @@
2272
  "hf_status": 200
2273
  },
2274
  {
2275
- "name": "minimaxi/MiniMax-M2.7",
2276
  "type": "vision",
2277
  "input_price_per_1m": 0.3,
2278
- "output_price_per_1m": 1.2,
2279
  "currency": "USD",
2280
  "capabilities": [
2281
  "vision",
2282
  "reasoning"
2283
  ],
2284
- "context_window": 200000,
2285
- "hf_private": false,
2286
- "size_b": 230,
2287
- "size_source": "manual",
2288
- "hf_id": "MiniMaxAI/MiniMax-M2.7",
2289
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2290
- "hf_status": 200
2291
  },
2292
  {
2293
- "name": "xai/grok-3-mini",
2294
- "type": "chat",
2295
  "input_price_per_1m": 0.3,
2296
- "output_price_per_1m": 0.5,
2297
  "currency": "USD",
2298
  "capabilities": [
 
2299
  "reasoning"
2300
  ],
2301
- "context_window": 131072,
2302
  "hf_private": true
2303
  },
2304
  {
@@ -2343,48 +2343,6 @@
2343
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2344
  "hf_status": 200
2345
  },
2346
- {
2347
- "name": "mistral/devstral-latest",
2348
- "type": "chat",
2349
- "input_price_per_1m": 0.4,
2350
- "output_price_per_1m": 2,
2351
- "currency": "USD",
2352
- "context_window": 256000,
2353
- "hf_private": true
2354
- },
2355
- {
2356
- "name": "mistral/mistral-medium-latest",
2357
- "type": "chat",
2358
- "input_price_per_1m": 0.4,
2359
- "output_price_per_1m": 2,
2360
- "currency": "USD",
2361
- "context_window": 131072,
2362
- "hf_private": true
2363
- },
2364
- {
2365
- "name": "mistral/devstral-medium-2507",
2366
- "type": "chat",
2367
- "input_price_per_1m": 0.4,
2368
- "output_price_per_1m": 2,
2369
- "currency": "USD",
2370
- "context_window": 131072,
2371
- "capabilities": [
2372
- "tools"
2373
- ],
2374
- "hf_private": true
2375
- },
2376
- {
2377
- "name": "openai-responses/gpt-4.1-mini",
2378
- "type": "vision",
2379
- "input_price_per_1m": 0.4,
2380
- "output_price_per_1m": 1.6,
2381
- "currency": "USD",
2382
- "capabilities": [
2383
- "vision"
2384
- ],
2385
- "context_window": 1047576,
2386
- "hf_private": true
2387
- },
2388
  {
2389
  "name": "nebius/zai-org/GLM-4.7",
2390
  "type": "chat",
@@ -2434,10 +2392,19 @@
2434
  "hf_status": 200
2435
  },
2436
  {
2437
- "name": "alibaba/qwen-plus",
2438
  "type": "chat",
2439
  "input_price_per_1m": 0.4,
2440
- "output_price_per_1m": 1.2,
 
 
 
 
 
 
 
 
 
2441
  "currency": "USD",
2442
  "context_window": 131072,
2443
  "capabilities": [
@@ -2445,6 +2412,48 @@
2445
  ],
2446
  "hf_private": true
2447
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2448
  {
2449
  "name": "novita/deepseek/deepseek-v3-0324",
2450
  "type": "chat",
@@ -2463,28 +2472,19 @@
2463
  "hf_status": 200
2464
  },
2465
  {
2466
- "name": "novita/deepseek/deepseek-v3-turbo",
2467
- "type": "chat",
2468
- "input_price_per_1m": 0.4,
2469
- "output_price_per_1m": 1.3,
2470
- "currency": "USD",
2471
- "context_window": 128000,
2472
- "hf_private": true
2473
- },
2474
- {
2475
- "name": "azure/gpt-4.1-mini",
2476
- "type": "vision",
2477
  "input_price_per_1m": 0.4,
2478
- "output_price_per_1m": 1.6,
2479
  "currency": "USD",
 
2480
  "capabilities": [
2481
- "vision"
2482
  ],
2483
- "context_window": 1047576,
2484
  "hf_private": true
2485
  },
2486
  {
2487
- "name": "azure/openai-responses/gpt-4.1-mini",
2488
  "type": "vision",
2489
  "input_price_per_1m": 0.4,
2490
  "output_price_per_1m": 1.6,
@@ -2496,7 +2496,7 @@
2496
  "hf_private": true
2497
  },
2498
  {
2499
- "name": "openai/gpt-4.1-mini",
2500
  "type": "vision",
2501
  "input_price_per_1m": 0.4,
2502
  "output_price_per_1m": 1.6,
@@ -2508,30 +2508,35 @@
2508
  "hf_private": true
2509
  },
2510
  {
2511
- "name": "mistral/mistral-large-latest",
2512
  "type": "chat",
2513
  "input_price_per_1m": 0.5,
2514
  "output_price_per_1m": 1.5,
2515
  "currency": "USD",
2516
- "context_window": 131072,
2517
  "capabilities": [
2518
- "tools"
 
2519
  ],
2520
- "hf_private": true
 
 
 
 
2521
  },
2522
  {
2523
- "name": "nebius/deepseek-ai/DeepSeek-V3-0324",
2524
- "type": "chat",
2525
  "input_price_per_1m": 0.5,
2526
- "output_price_per_1m": 1.5,
2527
  "currency": "USD",
2528
- "context_window": 128000,
2529
  "capabilities": [
2530
- "tools",
2531
  "reasoning"
2532
  ],
2533
- "size_b": 685,
2534
- "hf_id": "deepseek-ai/DeepSeek-V3-0324",
 
2535
  "hf_private": false,
2536
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2537
  "hf_status": 200
@@ -2553,72 +2558,67 @@
2553
  "hf_status": 200
2554
  },
2555
  {
2556
- "name": "nebius/moonshotai/kimi-k2.5",
2557
  "type": "vision",
2558
  "input_price_per_1m": 0.5,
2559
- "output_price_per_1m": 2.5,
2560
  "currency": "USD",
2561
  "capabilities": [
2562
  "vision",
2563
  "reasoning"
2564
  ],
2565
- "context_window": 256000,
2566
- "hf_id": "moonshotai/Kimi-K2.5",
2567
- "size_b": 1058.6,
2568
- "hf_private": false,
2569
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2570
- "hf_status": 200
2571
  },
2572
  {
2573
- "name": "vertex/gemini-3-flash-preview",
2574
  "type": "vision",
2575
  "input_price_per_1m": 0.5,
2576
- "output_price_per_1m": 3,
2577
  "currency": "USD",
2578
  "capabilities": [
2579
  "vision",
2580
  "reasoning"
2581
  ],
2582
- "context_window": 1048576,
2583
  "hf_private": true
2584
  },
2585
  {
2586
- "name": "vertex/gemini-3.1-flash-image-preview",
2587
- "type": "vision",
2588
  "input_price_per_1m": 0.5,
2589
- "output_price_per_1m": 2,
2590
  "currency": "USD",
 
2591
  "capabilities": [
2592
- "vision",
2593
- "reasoning"
2594
  ],
2595
- "context_window": 131072,
2596
  "hf_private": true
2597
  },
2598
  {
2599
- "name": "google/gemini-3.1-flash-image-preview",
2600
  "type": "vision",
2601
  "input_price_per_1m": 0.5,
2602
- "output_price_per_1m": 2,
2603
  "currency": "USD",
2604
  "capabilities": [
2605
  "vision",
2606
  "reasoning"
2607
  ],
2608
- "context_window": 131072,
2609
  "hf_private": true
2610
  },
2611
  {
2612
- "name": "google/gemini-3-flash-preview",
2613
  "type": "vision",
2614
  "input_price_per_1m": 0.5,
2615
- "output_price_per_1m": 3,
2616
  "currency": "USD",
2617
  "capabilities": [
2618
  "vision",
2619
  "reasoning"
2620
  ],
2621
- "context_window": 1048576,
2622
  "hf_private": true
2623
  },
2624
  {
@@ -2683,16 +2683,34 @@
2683
  "hf_status": 200
2684
  },
2685
  {
2686
- "name": "zai/GLM-4.7",
2687
  "type": "chat",
2688
  "input_price_per_1m": 0.6,
2689
  "output_price_per_1m": 2.2,
2690
  "currency": "USD",
 
2691
  "capabilities": [
 
2692
  "reasoning"
2693
  ],
2694
- "context_window": 200000,
2695
- "hf_id": "zai-org/GLM-4.7",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2696
  "size_b": 358.3,
2697
  "hf_private": false,
2698
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
@@ -2731,24 +2749,23 @@
2731
  "hf_status": 200
2732
  },
2733
  {
2734
- "name": "nebius/zai-org/GLM-4.5",
2735
  "type": "chat",
2736
  "input_price_per_1m": 0.6,
2737
  "output_price_per_1m": 2.2,
2738
  "currency": "USD",
2739
- "context_window": 128000,
2740
  "capabilities": [
2741
- "tools",
2742
  "reasoning"
2743
  ],
2744
- "hf_id": "zai-org/GLM-4.5",
 
2745
  "size_b": 358.3,
2746
  "hf_private": false,
2747
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2748
  "hf_status": 200
2749
  },
2750
  {
2751
- "name": "deepinfra/zai-org/GLM-4.5",
2752
  "type": "chat",
2753
  "input_price_per_1m": 0.6,
2754
  "output_price_per_1m": 2.2,
@@ -2764,6 +2781,23 @@
2764
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2765
  "hf_status": 200
2766
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2767
  {
2768
  "name": "alibaba/qwen3.5",
2769
  "type": "vision",
@@ -2782,17 +2816,33 @@
2782
  "hf_status": 200
2783
  },
2784
  {
2785
- "name": "moonshot/kimi-k2-0711-preview",
2786
- "type": "chat",
2787
  "input_price_per_1m": 0.6,
2788
- "output_price_per_1m": 2.5,
2789
  "currency": "USD",
2790
- "context_window": 131072,
2791
  "capabilities": [
2792
- "tools"
 
2793
  ],
2794
- "hf_id": "moonshotai/Kimi-K2-Instruct",
2795
- "size_b": 1026.5,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2796
  "hf_private": false,
2797
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2798
  "hf_status": 200
@@ -2864,67 +2914,17 @@
2864
  "hf_status": 200
2865
  },
2866
  {
2867
- "name": "novita/zai-org/glm-4.6",
2868
- "type": "chat",
2869
- "input_price_per_1m": 0.6,
2870
- "output_price_per_1m": 2.2,
2871
- "currency": "USD",
2872
- "context_window": 204800,
2873
- "capabilities": [
2874
- "tools",
2875
- "reasoning"
2876
- ],
2877
- "hf_id": "zai-org/GLM-4.6",
2878
- "size_b": 356.8,
2879
- "hf_private": false,
2880
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2881
- "hf_status": 200
2882
- },
2883
- {
2884
- "name": "novita/zai-org/glm-4.5",
2885
  "type": "chat",
2886
  "input_price_per_1m": 0.6,
2887
- "output_price_per_1m": 2.2,
2888
  "currency": "USD",
2889
  "context_window": 131072,
2890
  "capabilities": [
2891
- "tools",
2892
- "reasoning"
2893
- ],
2894
- "hf_id": "zai-org/GLM-4.5",
2895
- "size_b": 358.3,
2896
- "hf_private": false,
2897
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2898
- "hf_status": 200
2899
- },
2900
- {
2901
- "name": "minimaxi/MiniMax-M2.7-highspeed",
2902
- "type": "vision",
2903
- "input_price_per_1m": 0.6,
2904
- "output_price_per_1m": 2.4,
2905
- "currency": "USD",
2906
- "capabilities": [
2907
- "vision",
2908
- "reasoning"
2909
- ],
2910
- "context_window": 200000,
2911
- "hf_private": false,
2912
- "size_b": 230,
2913
- "size_source": "manual"
2914
- },
2915
- {
2916
- "name": "minimaxi/MiniMax-M2.5-highspeed",
2917
- "type": "vision",
2918
- "input_price_per_1m": 0.6,
2919
- "output_price_per_1m": 2.4,
2920
- "currency": "USD",
2921
- "capabilities": [
2922
- "vision",
2923
- "reasoning"
2924
  ],
2925
- "context_window": 200000,
2926
- "hf_id": "MiniMaxAI/MiniMax-M2.5",
2927
- "size_b": 228.7,
2928
  "hf_private": false,
2929
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2930
  "hf_status": 200
@@ -3053,68 +3053,68 @@
3053
  "hf_status": 200
3054
  },
3055
  {
3056
- "name": "novita/qwen/qwen2.5-vl-72b-instruct",
3057
  "type": "chat",
3058
  "input_price_per_1m": 0.8,
3059
  "output_price_per_1m": 0.8,
3060
  "currency": "USD",
3061
- "context_window": 96000,
3062
- "size_b": 72,
3063
  "capabilities": [
3064
- "vision"
3065
  ],
3066
- "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
3067
  "hf_private": false,
3068
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3069
  "hf_status": 200
3070
  },
3071
  {
3072
- "name": "novita/deepseek/deepseek-r1-distill-llama-70b",
3073
  "type": "chat",
3074
  "input_price_per_1m": 0.8,
3075
  "output_price_per_1m": 0.8,
3076
  "currency": "USD",
3077
- "context_window": 32000,
3078
- "size_b": 70,
3079
  "capabilities": [
3080
- "reasoning"
3081
  ],
3082
- "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
3083
  "hf_private": false,
3084
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3085
  "hf_status": 200
3086
  },
3087
  {
3088
- "name": "deepinfra/deepseek-ai/DeepSeek-V3",
3089
  "type": "chat",
3090
  "input_price_per_1m": 0.85,
3091
- "output_price_per_1m": 0.9,
3092
  "currency": "USD",
3093
- "context_window": 128000,
3094
  "capabilities": [
3095
  "tools",
3096
  "reasoning"
3097
  ],
3098
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3099
  "size_b": 671,
 
3100
  "hf_private": false,
3101
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3102
  "hf_status": 200
3103
  },
3104
  {
3105
- "name": "deepinfra/deepseek-ai/DeepSeek-R1",
3106
  "type": "chat",
3107
  "input_price_per_1m": 0.85,
3108
- "output_price_per_1m": 2.5,
3109
  "currency": "USD",
3110
- "context_window": 64000,
3111
  "capabilities": [
3112
  "tools",
3113
  "reasoning"
3114
  ],
3115
- "hf_id": "deepseek-ai/DeepSeek-R1",
3116
  "size_b": 671,
3117
- "size_source": "manual",
3118
  "hf_private": false,
3119
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3120
  "hf_status": 200
@@ -3189,18 +3189,17 @@
3189
  "hf_status": 200
3190
  },
3191
  {
3192
- "name": "zai/GLM-5",
3193
- "type": "vision",
3194
  "input_price_per_1m": 1,
3195
- "output_price_per_1m": 3.2,
3196
  "currency": "USD",
 
3197
  "capabilities": [
3198
- "vision",
3199
- "reasoning"
3200
  ],
3201
- "context_window": 200000,
3202
- "hf_id": "zai-org/GLM-5",
3203
- "size_b": 753.9,
3204
  "hf_private": false,
3205
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3206
  "hf_status": 200
@@ -3222,35 +3221,36 @@
3222
  "hf_status": 200
3223
  },
3224
  {
3225
- "name": "groq/moonshotai/kimi-k2-instruct",
3226
- "type": "chat",
3227
  "input_price_per_1m": 1,
3228
- "output_price_per_1m": 3,
3229
  "currency": "USD",
3230
- "context_window": 131072,
3231
  "capabilities": [
3232
- "tools"
 
3233
  ],
3234
- "hf_id": "moonshotai/Kimi-K2-Instruct",
3235
- "size_b": 1026.5,
 
3236
  "hf_private": false,
3237
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3238
  "hf_status": 200
3239
  },
3240
  {
3241
- "name": "alibaba/qwen3-coder-plus",
3242
- "type": "vision",
3243
  "input_price_per_1m": 1,
3244
- "output_price_per_1m": 5,
3245
  "currency": "USD",
 
3246
  "capabilities": [
3247
  "vision"
3248
  ],
3249
- "context_window": 1048576,
3250
  "hf_private": true
3251
  },
3252
  {
3253
- "name": "vertex/claude-haiku-4-5",
3254
  "type": "vision",
3255
  "input_price_per_1m": 1,
3256
  "output_price_per_1m": 5,
@@ -3262,25 +3262,14 @@
3262
  "hf_private": true
3263
  },
3264
  {
3265
- "name": "perplexity/sonar",
3266
- "type": "chat",
3267
- "input_price_per_1m": 1,
3268
- "output_price_per_1m": 1,
3269
- "currency": "USD",
3270
- "context_window": 131072,
3271
- "capabilities": [
3272
- "vision"
3273
- ],
3274
- "hf_private": true
3275
- },
3276
- {
3277
- "name": "bedrock/claude-haiku-4-5",
3278
  "type": "vision",
3279
  "input_price_per_1m": 1,
3280
- "output_price_per_1m": 5,
3281
  "currency": "USD",
3282
  "capabilities": [
3283
- "vision"
 
3284
  ],
3285
  "context_window": 200000,
3286
  "hf_private": true
@@ -3302,7 +3291,7 @@
3302
  "hf_status": 200
3303
  },
3304
  {
3305
- "name": "anthropic/claude-haiku-4-5",
3306
  "type": "vision",
3307
  "input_price_per_1m": 1,
3308
  "output_price_per_1m": 5,
@@ -3314,14 +3303,25 @@
3314
  "hf_private": true
3315
  },
3316
  {
3317
- "name": "openai/o3",
3318
  "type": "vision",
3319
  "input_price_per_1m": 1,
3320
- "output_price_per_1m": 4,
3321
  "currency": "USD",
3322
  "capabilities": [
3323
- "vision",
3324
- "reasoning"
 
 
 
 
 
 
 
 
 
 
 
3325
  ],
3326
  "context_window": 200000,
3327
  "hf_private": true
@@ -3351,7 +3351,7 @@
3351
  "hf_private": true
3352
  },
3353
  {
3354
- "name": "azure/o4-mini",
3355
  "type": "chat",
3356
  "input_price_per_1m": 1.1,
3357
  "output_price_per_1m": 4.4,
@@ -3363,7 +3363,7 @@
3363
  "hf_private": true
3364
  },
3365
  {
3366
- "name": "openai/o3-mini",
3367
  "type": "chat",
3368
  "input_price_per_1m": 1.1,
3369
  "output_price_per_1m": 4.4,
@@ -3401,24 +3401,20 @@
3401
  "hf_status": 200
3402
  },
3403
  {
3404
- "name": "together/deepseek-ai/DeepSeek-V3",
3405
- "type": "chat",
3406
  "input_price_per_1m": 1.25,
3407
- "output_price_per_1m": 1.25,
3408
  "currency": "USD",
3409
- "context_window": 131072,
3410
  "capabilities": [
3411
- "tools",
3412
  "reasoning"
3413
  ],
3414
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3415
- "size_b": 671,
3416
- "hf_private": false,
3417
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
3418
- "hf_status": 200
3419
  },
3420
  {
3421
- "name": "openai-responses/gpt-5.1",
3422
  "type": "vision",
3423
  "input_price_per_1m": 1.25,
3424
  "output_price_per_1m": 10,
@@ -3431,7 +3427,7 @@
3431
  "hf_private": true
3432
  },
3433
  {
3434
- "name": "openai-responses/gpt-5.1-codex",
3435
  "type": "vision",
3436
  "input_price_per_1m": 1.25,
3437
  "output_price_per_1m": 10,
@@ -3444,7 +3440,7 @@
3444
  "hf_private": true
3445
  },
3446
  {
3447
- "name": "openai-responses/gpt-5",
3448
  "type": "vision",
3449
  "input_price_per_1m": 1.25,
3450
  "output_price_per_1m": 10,
@@ -3457,7 +3453,7 @@
3457
  "hf_private": true
3458
  },
3459
  {
3460
- "name": "openai-responses/gpt-5-codex",
3461
  "type": "vision",
3462
  "input_price_per_1m": 1.25,
3463
  "output_price_per_1m": 10,
@@ -3470,7 +3466,7 @@
3470
  "hf_private": true
3471
  },
3472
  {
3473
- "name": "vertex/gemini-2.5-pro",
3474
  "type": "vision",
3475
  "input_price_per_1m": 1.25,
3476
  "output_price_per_1m": 10,
@@ -3479,11 +3475,11 @@
3479
  "vision",
3480
  "reasoning"
3481
  ],
3482
- "context_window": 1048576,
3483
  "hf_private": true
3484
  },
3485
  {
3486
- "name": "coding/gemini-2.5-pro",
3487
  "type": "vision",
3488
  "input_price_per_1m": 1.25,
3489
  "output_price_per_1m": 10,
@@ -3492,11 +3488,11 @@
3492
  "vision",
3493
  "reasoning"
3494
  ],
3495
- "context_window": 1048576,
3496
  "hf_private": true
3497
  },
3498
  {
3499
- "name": "google/gemini-2.5-pro",
3500
  "type": "vision",
3501
  "input_price_per_1m": 1.25,
3502
  "output_price_per_1m": 10,
@@ -3505,35 +3501,41 @@
3505
  "vision",
3506
  "reasoning"
3507
  ],
3508
- "context_window": 1048576,
3509
  "hf_private": true
3510
  },
3511
  {
3512
- "name": "azure/gpt-5.1",
3513
- "type": "chat",
3514
  "input_price_per_1m": 1.25,
3515
  "output_price_per_1m": 10,
3516
  "currency": "USD",
3517
  "capabilities": [
 
3518
  "reasoning"
3519
  ],
3520
- "context_window": 200000,
3521
  "hf_private": true
3522
  },
3523
  {
3524
- "name": "azure/gpt-5",
3525
  "type": "chat",
3526
  "input_price_per_1m": 1.25,
3527
- "output_price_per_1m": 10,
3528
  "currency": "USD",
 
3529
  "capabilities": [
 
3530
  "reasoning"
3531
  ],
3532
- "context_window": 200000,
3533
- "hf_private": true
 
 
 
3534
  },
3535
  {
3536
- "name": "openai/gpt-5-chat",
3537
  "type": "vision",
3538
  "input_price_per_1m": 1.25,
3539
  "output_price_per_1m": 10,
@@ -3542,33 +3544,31 @@
3542
  "vision",
3543
  "reasoning"
3544
  ],
3545
- "context_window": 128000,
3546
  "hf_private": true
3547
  },
3548
  {
3549
- "name": "openai/gpt-5.1-chat",
3550
- "type": "vision",
3551
  "input_price_per_1m": 1.25,
3552
  "output_price_per_1m": 10,
3553
  "currency": "USD",
3554
  "capabilities": [
3555
- "vision",
3556
  "reasoning"
3557
  ],
3558
- "context_window": 128000,
3559
  "hf_private": true
3560
  },
3561
  {
3562
- "name": "openai/gpt-5.1",
3563
- "type": "vision",
3564
  "input_price_per_1m": 1.25,
3565
  "output_price_per_1m": 10,
3566
  "currency": "USD",
3567
  "capabilities": [
3568
- "vision",
3569
  "reasoning"
3570
  ],
3571
- "context_window": 400000,
3572
  "hf_private": true
3573
  },
3574
  {
@@ -3604,7 +3604,7 @@
3604
  "hf_private": true
3605
  },
3606
  {
3607
- "name": "openai-responses/gpt-5.3-codex",
3608
  "type": "vision",
3609
  "input_price_per_1m": 1.75,
3610
  "output_price_per_1m": 14,
@@ -3617,7 +3617,7 @@
3617
  "hf_private": true
3618
  },
3619
  {
3620
- "name": "openai-responses/gpt-5.3-chat",
3621
  "type": "vision",
3622
  "input_price_per_1m": 1.75,
3623
  "output_price_per_1m": 14,
@@ -3626,11 +3626,11 @@
3626
  "vision",
3627
  "reasoning"
3628
  ],
3629
- "context_window": 128000,
3630
  "hf_private": true
3631
  },
3632
  {
3633
- "name": "openai-responses/gpt-5.2-codex",
3634
  "type": "vision",
3635
  "input_price_per_1m": 1.75,
3636
  "output_price_per_1m": 14,
@@ -3639,11 +3639,11 @@
3639
  "vision",
3640
  "reasoning"
3641
  ],
3642
- "context_window": 400000,
3643
  "hf_private": true
3644
  },
3645
  {
3646
- "name": "openai-responses/gpt-5.2",
3647
  "type": "vision",
3648
  "input_price_per_1m": 1.75,
3649
  "output_price_per_1m": 14,
@@ -3656,7 +3656,7 @@
3656
  "hf_private": true
3657
  },
3658
  {
3659
- "name": "azure/openai-responses/gpt-5.2-codex",
3660
  "type": "vision",
3661
  "input_price_per_1m": 1.75,
3662
  "output_price_per_1m": 14,
@@ -3665,11 +3665,11 @@
3665
  "vision",
3666
  "reasoning"
3667
  ],
3668
- "context_window": 400000,
3669
  "hf_private": true
3670
  },
3671
  {
3672
- "name": "azure/gpt-5.3-codex",
3673
  "type": "vision",
3674
  "input_price_per_1m": 1.75,
3675
  "output_price_per_1m": 14,
@@ -3682,19 +3682,20 @@
3682
  "hf_private": true
3683
  },
3684
  {
3685
- "name": "azure/gpt-5.2",
3686
- "type": "chat",
3687
  "input_price_per_1m": 1.75,
3688
  "output_price_per_1m": 14,
3689
  "currency": "USD",
3690
  "capabilities": [
 
3691
  "reasoning"
3692
  ],
3693
- "context_window": 200000,
3694
  "hf_private": true
3695
  },
3696
  {
3697
- "name": "openai/gpt-5.2",
3698
  "type": "vision",
3699
  "input_price_per_1m": 1.75,
3700
  "output_price_per_1m": 14,
@@ -3707,20 +3708,19 @@
3707
  "hf_private": true
3708
  },
3709
  {
3710
- "name": "openai/gpt-5.3-chat",
3711
- "type": "vision",
3712
  "input_price_per_1m": 1.75,
3713
  "output_price_per_1m": 14,
3714
  "currency": "USD",
3715
  "capabilities": [
3716
- "vision",
3717
  "reasoning"
3718
  ],
3719
- "context_window": 128000,
3720
  "hf_private": true
3721
  },
3722
  {
3723
- "name": "openai/gpt-5.2-chat",
3724
  "type": "vision",
3725
  "input_price_per_1m": 1.75,
3726
  "output_price_per_1m": 14,
@@ -3729,41 +3729,55 @@
3729
  "vision",
3730
  "reasoning"
3731
  ],
 
 
 
 
 
 
 
 
 
3732
  "context_window": 128000,
3733
  "hf_private": true
3734
  },
3735
  {
3736
- "name": "mistral/pixtral-large-latest",
3737
  "type": "chat",
3738
  "input_price_per_1m": 2,
3739
- "output_price_per_1m": 5,
3740
  "currency": "USD",
3741
  "context_window": 131072,
 
 
 
 
3742
  "hf_private": true
3743
  },
3744
  {
3745
- "name": "openai-responses/gpt-4.1",
3746
  "type": "vision",
3747
  "input_price_per_1m": 2,
3748
- "output_price_per_1m": 8,
3749
  "currency": "USD",
3750
  "capabilities": [
3751
- "vision"
 
3752
  ],
3753
- "context_window": 1047576,
3754
  "hf_private": true
3755
  },
3756
  {
3757
- "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3758
  "type": "chat",
3759
  "input_price_per_1m": 2,
3760
- "output_price_per_1m": 6,
3761
  "currency": "USD",
3762
- "context_window": 128000,
3763
  "hf_private": true
3764
  },
3765
  {
3766
- "name": "vertex/gemini-3.1-pro-preview",
3767
  "type": "vision",
3768
  "input_price_per_1m": 2,
3769
  "output_price_per_1m": 12,
@@ -3776,7 +3790,7 @@
3776
  "hf_private": true
3777
  },
3778
  {
3779
- "name": "vertex/gemini-3-pro-preview",
3780
  "type": "vision",
3781
  "input_price_per_1m": 2,
3782
  "output_price_per_1m": 12,
@@ -3789,33 +3803,53 @@
3789
  "hf_private": true
3790
  },
3791
  {
3792
- "name": "vertex/gemini-3-pro-image-preview",
 
 
 
 
 
 
 
 
 
3793
  "type": "vision",
3794
  "input_price_per_1m": 2,
3795
- "output_price_per_1m": 12,
 
 
 
 
 
 
 
 
 
 
 
 
3796
  "currency": "USD",
3797
  "capabilities": [
3798
  "vision",
3799
  "reasoning"
3800
  ],
3801
- "context_window": 1048576,
3802
  "hf_private": true
3803
  },
3804
  {
3805
- "name": "perplexity/sonar-reasoning-pro",
3806
- "type": "chat",
3807
  "input_price_per_1m": 2,
3808
  "output_price_per_1m": 8,
3809
  "currency": "USD",
3810
- "context_window": 131072,
3811
  "capabilities": [
3812
- "vision",
3813
- "reasoning"
3814
  ],
 
3815
  "hf_private": true
3816
  },
3817
  {
3818
- "name": "google/gemini-3-pro-preview",
3819
  "type": "vision",
3820
  "input_price_per_1m": 2,
3821
  "output_price_per_1m": 12,
@@ -3828,7 +3862,7 @@
3828
  "hf_private": true
3829
  },
3830
  {
3831
- "name": "google/gemini-3.1-pro-preview",
3832
  "type": "vision",
3833
  "input_price_per_1m": 2,
3834
  "output_price_per_1m": 12,
@@ -3841,25 +3875,16 @@
3841
  "hf_private": true
3842
  },
3843
  {
3844
- "name": "xai/grok-4.2-beta",
3845
  "type": "vision",
3846
  "input_price_per_1m": 2,
3847
- "output_price_per_1m": 6,
3848
  "currency": "USD",
3849
  "capabilities": [
3850
  "vision",
3851
  "reasoning"
3852
  ],
3853
- "context_window": 2000000,
3854
- "hf_private": true
3855
- },
3856
- {
3857
- "name": "xai/grok-2-1212",
3858
- "type": "chat",
3859
- "input_price_per_1m": 2,
3860
- "output_price_per_1m": 10,
3861
- "currency": "USD",
3862
- "context_window": 131072,
3863
  "hf_private": true
3864
  },
3865
  {
@@ -3887,32 +3912,20 @@
3887
  "hf_private": true
3888
  },
3889
  {
3890
- "name": "openai/o4-mini-deep-research",
3891
  "type": "vision",
3892
- "input_price_per_1m": 2,
3893
- "output_price_per_1m": 8,
3894
  "currency": "USD",
3895
  "capabilities": [
3896
  "vision",
3897
  "reasoning"
3898
  ],
3899
- "context_window": 100000,
3900
- "hf_private": true
3901
- },
3902
- {
3903
- "name": "openai/gpt-4.1",
3904
- "type": "vision",
3905
- "input_price_per_1m": 2,
3906
- "output_price_per_1m": 8,
3907
- "currency": "USD",
3908
- "capabilities": [
3909
- "vision"
3910
- ],
3911
- "context_window": 1047576,
3912
  "hf_private": true
3913
  },
3914
  {
3915
- "name": "openai-responses/gpt-5.4",
3916
  "type": "vision",
3917
  "input_price_per_1m": 2.5,
3918
  "output_price_per_1m": 15,
@@ -3925,20 +3938,19 @@
3925
  "hf_private": true
3926
  },
3927
  {
3928
- "name": "azure/openai-responses/gpt-5.4",
3929
  "type": "vision",
3930
  "input_price_per_1m": 2.5,
3931
- "output_price_per_1m": 15,
3932
  "currency": "USD",
3933
  "capabilities": [
3934
- "vision",
3935
- "reasoning"
3936
  ],
3937
- "context_window": 1050000,
3938
  "hf_private": true
3939
  },
3940
  {
3941
- "name": "openai/gpt-4o",
3942
  "type": "vision",
3943
  "input_price_per_1m": 2.5,
3944
  "output_price_per_1m": 10,
@@ -3950,7 +3962,7 @@
3950
  "hf_private": true
3951
  },
3952
  {
3953
- "name": "openai/gpt-4o-2024-11-20",
3954
  "type": "vision",
3955
  "input_price_per_1m": 2.5,
3956
  "output_price_per_1m": 10,
@@ -3962,7 +3974,7 @@
3962
  "hf_private": true
3963
  },
3964
  {
3965
- "name": "openai/gpt-4o-2024-08-06",
3966
  "type": "vision",
3967
  "input_price_per_1m": 2.5,
3968
  "output_price_per_1m": 10,
@@ -3974,7 +3986,7 @@
3974
  "hf_private": true
3975
  },
3976
  {
3977
- "name": "openai/gpt-5.4",
3978
  "type": "vision",
3979
  "input_price_per_1m": 2.5,
3980
  "output_price_per_1m": 15,
@@ -3987,37 +3999,31 @@
3987
  "hf_private": true
3988
  },
3989
  {
3990
- "name": "openai/gpt-4o-2024-05-13",
3991
- "type": "vision",
3992
- "input_price_per_1m": 2.5,
3993
- "output_price_per_1m": 10,
3994
  "currency": "USD",
 
3995
  "capabilities": [
3996
  "vision"
3997
  ],
3998
- "context_window": 128000,
3999
  "hf_private": true
4000
  },
4001
  {
4002
- "name": "together/deepseek-ai/DeepSeek-R1",
4003
- "type": "chat",
4004
  "input_price_per_1m": 3,
4005
- "output_price_per_1m": 7,
4006
  "currency": "USD",
4007
- "context_window": 64000,
4008
  "capabilities": [
4009
- "tools",
4010
- "reasoning"
4011
  ],
4012
- "hf_id": "deepseek-ai/DeepSeek-R1",
4013
- "size_b": 671,
4014
- "size_source": "manual",
4015
- "hf_private": false,
4016
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
4017
- "hf_status": 200
4018
  },
4019
  {
4020
- "name": "vertex/claude-sonnet-4-5",
4021
  "type": "vision",
4022
  "input_price_per_1m": 3,
4023
  "output_price_per_1m": 15,
@@ -4026,11 +4032,11 @@
4026
  "vision",
4027
  "reasoning"
4028
  ],
4029
- "context_window": 200000,
4030
  "hf_private": true
4031
  },
4032
  {
4033
- "name": "vertex/claude-3-7-sonnet",
4034
  "type": "vision",
4035
  "input_price_per_1m": 3,
4036
  "output_price_per_1m": 15,
@@ -4039,11 +4045,11 @@
4039
  "vision",
4040
  "reasoning"
4041
  ],
4042
- "context_window": 200000,
4043
  "hf_private": true
4044
  },
4045
  {
4046
- "name": "vertex/claude-sonnet-4",
4047
  "type": "vision",
4048
  "input_price_per_1m": 3,
4049
  "output_price_per_1m": 15,
@@ -4052,35 +4058,24 @@
4052
  "vision",
4053
  "reasoning"
4054
  ],
4055
- "context_window": 200000,
4056
  "hf_private": true
4057
  },
4058
  {
4059
- "name": "vertex/claude-3-5-sonnet",
4060
  "type": "vision",
4061
  "input_price_per_1m": 3,
4062
  "output_price_per_1m": 15,
4063
  "currency": "USD",
4064
  "capabilities": [
4065
- "vision"
 
4066
  ],
4067
  "context_window": 200000,
4068
  "hf_private": true
4069
  },
4070
  {
4071
- "name": "perplexity/sonar-pro",
4072
- "type": "chat",
4073
- "input_price_per_1m": 3,
4074
- "output_price_per_1m": 15,
4075
- "currency": "USD",
4076
- "context_window": 204800,
4077
- "capabilities": [
4078
- "vision"
4079
- ],
4080
- "hf_private": true
4081
- },
4082
- {
4083
- "name": "coding/claude-sonnet-4-20250514",
4084
  "type": "vision",
4085
  "input_price_per_1m": 3,
4086
  "output_price_per_1m": 15,
@@ -4093,7 +4088,7 @@
4093
  "hf_private": true
4094
  },
4095
  {
4096
- "name": "bedrock/claude-sonnet-4-5",
4097
  "type": "vision",
4098
  "input_price_per_1m": 3,
4099
  "output_price_per_1m": 15,
@@ -4102,11 +4097,11 @@
4102
  "vision",
4103
  "reasoning"
4104
  ],
4105
- "context_window": 200000,
4106
  "hf_private": true
4107
  },
4108
  {
4109
- "name": "bedrock/claude-sonnet-4-6",
4110
  "type": "vision",
4111
  "input_price_per_1m": 3,
4112
  "output_price_per_1m": 15,
@@ -4115,11 +4110,11 @@
4115
  "vision",
4116
  "reasoning"
4117
  ],
4118
- "context_window": 1000000,
4119
  "hf_private": true
4120
  },
4121
  {
4122
- "name": "bedrock/claude-sonnet-4",
4123
  "type": "vision",
4124
  "input_price_per_1m": 3,
4125
  "output_price_per_1m": 15,
@@ -4132,20 +4127,25 @@
4132
  "hf_private": true
4133
  },
4134
  {
4135
- "name": "bedrock/claude-3-7-sonnet",
4136
- "type": "vision",
4137
  "input_price_per_1m": 3,
4138
- "output_price_per_1m": 15,
4139
  "currency": "USD",
 
4140
  "capabilities": [
4141
- "vision",
4142
  "reasoning"
4143
  ],
4144
- "context_window": 200000,
4145
- "hf_private": true
 
 
 
 
4146
  },
4147
  {
4148
- "name": "xai/grok-4",
4149
  "type": "vision",
4150
  "input_price_per_1m": 3,
4151
  "output_price_per_1m": 15,
@@ -4153,11 +4153,11 @@
4153
  "capabilities": [
4154
  "vision"
4155
  ],
4156
- "context_window": 256000,
4157
  "hf_private": true
4158
  },
4159
  {
4160
- "name": "anthropic/claude-sonnet-4-5",
4161
  "type": "vision",
4162
  "input_price_per_1m": 3,
4163
  "output_price_per_1m": 15,
@@ -4166,11 +4166,11 @@
4166
  "vision",
4167
  "reasoning"
4168
  ],
4169
- "context_window": 1000000,
4170
  "hf_private": true
4171
  },
4172
  {
4173
- "name": "anthropic/claude-sonnet-4-6",
4174
  "type": "vision",
4175
  "input_price_per_1m": 3,
4176
  "output_price_per_1m": 15,
@@ -4179,11 +4179,11 @@
4179
  "vision",
4180
  "reasoning"
4181
  ],
4182
- "context_window": 1000000,
4183
  "hf_private": true
4184
  },
4185
  {
4186
- "name": "anthropic/claude-sonnet-4",
4187
  "type": "vision",
4188
  "input_price_per_1m": 3,
4189
  "output_price_per_1m": 15,
@@ -4192,7 +4192,7 @@
4192
  "vision",
4193
  "reasoning"
4194
  ],
4195
- "context_window": 1000000,
4196
  "hf_private": true
4197
  },
4198
  {
@@ -4214,20 +4214,19 @@
4214
  "hf_status": 200
4215
  },
4216
  {
4217
- "name": "vertex/claude-opus-4-6",
4218
- "type": "vision",
4219
  "input_price_per_1m": 5,
4220
  "output_price_per_1m": 25,
4221
  "currency": "USD",
 
4222
  "capabilities": [
4223
- "vision",
4224
- "reasoning"
4225
  ],
4226
- "context_window": 1000000,
4227
  "hf_private": true
4228
  },
4229
  {
4230
- "name": "vertex/claude-opus-4-5",
4231
  "type": "vision",
4232
  "input_price_per_1m": 5,
4233
  "output_price_per_1m": 25,
@@ -4240,7 +4239,7 @@
4240
  "hf_private": true
4241
  },
4242
  {
4243
- "name": "bedrock/claude-opus-4-5",
4244
  "type": "vision",
4245
  "input_price_per_1m": 5,
4246
  "output_price_per_1m": 25,
@@ -4249,36 +4248,36 @@
4249
  "vision",
4250
  "reasoning"
4251
  ],
4252
- "context_window": 200000,
4253
  "hf_private": true
4254
  },
4255
  {
4256
- "name": "bedrock/claude-opus-4-6",
4257
  "type": "vision",
4258
  "input_price_per_1m": 5,
4259
- "output_price_per_1m": 25,
4260
  "currency": "USD",
4261
  "capabilities": [
4262
- "vision",
4263
- "reasoning"
4264
  ],
4265
- "context_window": 1000000,
4266
  "hf_private": true
4267
  },
4268
  {
4269
- "name": "xai/grok-3",
4270
- "type": "chat",
4271
  "input_price_per_1m": 5,
4272
  "output_price_per_1m": 25,
4273
  "currency": "USD",
4274
- "context_window": 131072,
4275
  "capabilities": [
4276
- "tools"
 
4277
  ],
 
4278
  "hf_private": true
4279
  },
4280
  {
4281
- "name": "anthropic/claude-opus-4-5",
4282
  "type": "vision",
4283
  "input_price_per_1m": 5,
4284
  "output_price_per_1m": 25,
@@ -4287,11 +4286,11 @@
4287
  "vision",
4288
  "reasoning"
4289
  ],
4290
- "context_window": 200000,
4291
  "hf_private": true
4292
  },
4293
  {
4294
- "name": "anthropic/claude-opus-4-6",
4295
  "type": "vision",
4296
  "input_price_per_1m": 5,
4297
  "output_price_per_1m": 25,
@@ -4304,15 +4303,16 @@
4304
  "hf_private": true
4305
  },
4306
  {
4307
- "name": "openai/chatgpt-4o",
4308
  "type": "vision",
4309
  "input_price_per_1m": 5,
4310
- "output_price_per_1m": 15,
4311
  "currency": "USD",
4312
  "capabilities": [
4313
- "vision"
 
4314
  ],
4315
- "context_window": 128000,
4316
  "hf_private": true
4317
  },
4318
  {
@@ -4329,20 +4329,20 @@
4329
  "hf_private": true
4330
  },
4331
  {
4332
- "name": "openai-responses/gpt-5-pro",
4333
  "type": "vision",
4334
  "input_price_per_1m": 15,
4335
- "output_price_per_1m": 120,
4336
  "currency": "USD",
4337
  "capabilities": [
4338
  "vision",
4339
  "reasoning"
4340
  ],
4341
- "context_window": 400000,
4342
  "hf_private": true
4343
  },
4344
  {
4345
- "name": "vertex/claude-opus-4-1",
4346
  "type": "vision",
4347
  "input_price_per_1m": 15,
4348
  "output_price_per_1m": 75,
@@ -4355,23 +4355,23 @@
4355
  "hf_private": true
4356
  },
4357
  {
4358
- "name": "vertex/claude-opus-4",
4359
  "type": "vision",
4360
  "input_price_per_1m": 15,
4361
- "output_price_per_1m": 75,
4362
  "currency": "USD",
4363
  "capabilities": [
4364
  "vision",
4365
  "reasoning"
4366
  ],
4367
- "context_window": 200000,
4368
  "hf_private": true
4369
  },
4370
  {
4371
- "name": "coding/claude-opus-4-20250514",
4372
  "type": "vision",
4373
  "input_price_per_1m": 15,
4374
- "output_price_per_1m": 75,
4375
  "currency": "USD",
4376
  "capabilities": [
4377
  "vision",
@@ -4394,7 +4394,7 @@
4394
  "hf_private": true
4395
  },
4396
  {
4397
- "name": "anthropic/claude-opus-4-1",
4398
  "type": "vision",
4399
  "input_price_per_1m": 15,
4400
  "output_price_per_1m": 75,
@@ -4407,7 +4407,7 @@
4407
  "hf_private": true
4408
  },
4409
  {
4410
- "name": "anthropic/claude-opus-4",
4411
  "type": "vision",
4412
  "input_price_per_1m": 15,
4413
  "output_price_per_1m": 75,
@@ -4420,10 +4420,10 @@
4420
  "hf_private": true
4421
  },
4422
  {
4423
- "name": "openai/o1",
4424
  "type": "vision",
4425
  "input_price_per_1m": 15,
4426
- "output_price_per_1m": 60,
4427
  "currency": "USD",
4428
  "capabilities": [
4429
  "vision",
@@ -4459,7 +4459,7 @@
4459
  "hf_private": true
4460
  },
4461
  {
4462
- "name": "azure/openai-responses/gpt-5.4-pro",
4463
  "type": "vision",
4464
  "input_price_per_1m": 30,
4465
  "output_price_per_1m": 180,
@@ -4472,7 +4472,7 @@
4472
  "hf_private": true
4473
  },
4474
  {
4475
- "name": "openai/gpt-5.4-pro",
4476
  "type": "vision",
4477
  "input_price_per_1m": 30,
4478
  "output_price_per_1m": 180,
@@ -5636,7 +5636,12 @@
5636
  "output_price_per_1m": 1.5,
5637
  "currency": "USD",
5638
  "api_endpoint": "magistral-small-latest",
5639
- "hf_private": true
 
 
 
 
 
5640
  },
5641
  {
5642
  "name": "Ministral 3 - 3B",
@@ -5803,7 +5808,10 @@
5803
  "tools"
5804
  ],
5805
  "size_b": 124,
5806
- "hf_private": false
 
 
 
5807
  },
5808
  {
5809
  "name": "Pixtral 12B",
 
1242
  "hf_private": true
1243
  },
1244
  {
1245
+ "name": "novita/sao10k/l3-8b-lunaris",
1246
  "type": "chat",
1247
  "input_price_per_1m": 0.05,
1248
+ "output_price_per_1m": 0.05,
1249
  "currency": "USD",
1250
+ "context_window": 8192,
1251
+ "size_b": 8,
1252
+ "hf_private": false
1253
+ },
1254
+ {
1255
+ "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
1256
+ "type": "chat",
1257
+ "input_price_per_1m": 0.05,
1258
+ "output_price_per_1m": 0.05,
1259
+ "currency": "USD",
1260
+ "context_window": 8192,
1261
+ "size_b": 8,
1262
+ "hf_private": false
1263
  },
1264
  {
1265
  "name": "novita/meta-llama/llama-3.1-8b-instruct",
 
1278
  "hf_status": 200
1279
  },
1280
  {
1281
+ "name": "alibaba/qwen-turbo",
 
 
 
 
 
 
 
 
 
 
1282
  "type": "chat",
1283
  "input_price_per_1m": 0.05,
1284
+ "output_price_per_1m": 0.2,
1285
  "currency": "USD",
1286
+ "context_window": 1000000,
1287
+ "capabilities": [
1288
+ "tools"
1289
+ ],
1290
+ "hf_private": true
1291
  },
1292
  {
1293
  "name": "azure/gpt-5-nano",
 
1311
  "size_b": 3,
1312
  "hf_private": false
1313
  },
1314
+ {
1315
+ "name": "deepinfra/Qwen/Qwen2.5-Coder-32B-Instruct",
1316
+ "type": "chat",
1317
+ "input_price_per_1m": 0.07,
1318
+ "output_price_per_1m": 0.16,
1319
+ "currency": "USD",
1320
+ "context_window": 16384,
1321
+ "size_b": 32,
1322
+ "hf_private": false
1323
+ },
1324
  {
1325
  "name": "deepinfra/microsoft/phi-4",
1326
  "type": "chat",
 
1335
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1336
  "hf_status": 200
1337
  },
 
 
 
 
 
 
 
 
 
 
1338
  {
1339
  "name": "novita/gryphe/mythomax-l2-13b",
1340
  "type": "chat",
 
1348
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1349
  "hf_status": 200
1350
  },
 
 
 
 
 
 
 
 
 
 
1351
  {
1352
  "name": "groq/openai/gpt-oss-20b",
1353
  "type": "chat",
 
1366
  "hf_status": 200
1367
  },
1368
  {
1369
+ "name": "deepinfra/Qwen/Qwen3-32B",
1370
  "type": "chat",
1371
  "input_price_per_1m": 0.1,
1372
  "output_price_per_1m": 0.3,
1373
  "currency": "USD",
1374
+ "context_window": 40000,
1375
+ "size_b": 32,
1376
  "capabilities": [
1377
+ "tools",
1378
+ "reasoning"
1379
  ],
1380
+ "hf_id": "Qwen/Qwen3-32B",
 
1381
  "hf_private": false,
1382
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1383
  "hf_status": 200
1384
  },
1385
+ {
1386
+ "name": "google/gemini-2.5-flash-lite",
1387
+ "type": "vision",
1388
+ "input_price_per_1m": 0.1,
1389
+ "output_price_per_1m": 0.4,
1390
+ "currency": "USD",
1391
+ "capabilities": [
1392
+ "vision",
1393
+ "reasoning"
1394
+ ],
1395
+ "context_window": 1048576,
1396
+ "hf_private": true
1397
+ },
1398
+ {
1399
+ "name": "google/gemini-2.0-flash-001",
1400
+ "type": "vision",
1401
+ "input_price_per_1m": 0.1,
1402
+ "output_price_per_1m": 0.4,
1403
+ "currency": "USD",
1404
+ "capabilities": [
1405
+ "vision"
1406
+ ],
1407
+ "context_window": 1048576,
1408
+ "hf_private": true
1409
+ },
1410
  {
1411
  "name": "mistral/devstral-small-latest",
1412
  "type": "chat",
 
1433
  "hf_private": true
1434
  },
1435
  {
1436
+ "name": "mistral/devstral-small-2507",
 
 
 
 
 
 
 
 
 
 
 
 
1437
  "type": "chat",
1438
  "input_price_per_1m": 0.1,
1439
  "output_price_per_1m": 0.3,
1440
  "currency": "USD",
1441
+ "context_window": 131072,
 
1442
  "capabilities": [
1443
+ "tools"
 
1444
  ],
1445
+ "hf_id": "mistralai/Devstral-Small-2507",
1446
+ "size_b": 24,
1447
  "hf_private": false,
1448
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1449
  "hf_status": 200
1450
  },
1451
  {
1452
+ "name": "openai-responses/gpt-4.1-nano",
1453
  "type": "vision",
1454
  "input_price_per_1m": 0.1,
1455
  "output_price_per_1m": 0.4,
1456
  "currency": "USD",
1457
  "capabilities": [
1458
+ "vision"
 
1459
  ],
1460
+ "context_window": 1047576,
1461
  "hf_private": true
1462
  },
1463
  {
1464
+ "name": "openai/gpt-4.1-nano",
1465
  "type": "vision",
1466
  "input_price_per_1m": 0.1,
1467
  "output_price_per_1m": 0.4,
 
1469
  "capabilities": [
1470
  "vision"
1471
  ],
1472
+ "context_window": 1047576,
1473
  "hf_private": true
1474
  },
1475
  {
1476
+ "name": "together/meta-llama/Meta-Llama-3-8B-Instruct-Lite",
1477
+ "type": "chat",
1478
+ "input_price_per_1m": 0.1,
1479
+ "output_price_per_1m": 0.1,
1480
+ "currency": "USD",
1481
+ "context_window": 8192,
1482
+ "size_b": 8,
1483
+ "hf_private": false
1484
+ },
1485
+ {
1486
+ "name": "vertex/gemini-2.5-flash-lite",
1487
  "type": "vision",
1488
  "input_price_per_1m": 0.1,
1489
  "output_price_per_1m": 0.4,
 
1519
  "context_window": 1047576,
1520
  "hf_private": true
1521
  },
 
 
 
 
 
 
 
 
 
 
 
 
1522
  {
1523
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo",
1524
  "type": "chat",
 
1591
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1592
  "hf_status": 200
1593
  },
1594
+ {
1595
+ "name": "nebius/openai/gpt-oss-120b",
1596
+ "type": "chat",
1597
+ "input_price_per_1m": 0.15,
1598
+ "output_price_per_1m": 0.6,
1599
+ "currency": "USD",
1600
+ "capabilities": [
1601
+ "reasoning"
1602
+ ],
1603
+ "context_window": 131000,
1604
+ "size_b": 120,
1605
+ "hf_id": "openai/gpt-oss-120b",
1606
+ "hf_private": false,
1607
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
1608
+ "hf_status": 200
1609
+ },
1610
+ {
1611
+ "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1612
+ "type": "chat",
1613
+ "input_price_per_1m": 0.15,
1614
+ "output_price_per_1m": 0.85,
1615
+ "currency": "USD",
1616
+ "context_window": 262144,
1617
+ "size_b": 235,
1618
+ "hf_private": false
1619
+ },
1620
  {
1621
  "name": "mistral/mistral-small-latest",
1622
  "type": "vision",
 
1648
  "hf_status": 200
1649
  },
1650
  {
1651
+ "name": "openai/gpt-4o-mini",
1652
+ "type": "vision",
1653
  "input_price_per_1m": 0.15,
1654
  "output_price_per_1m": 0.6,
1655
  "currency": "USD",
1656
  "capabilities": [
1657
+ "vision"
1658
  ],
1659
+ "context_window": 128000,
1660
+ "hf_private": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1661
  },
1662
  {
1663
  "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
 
1677
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1678
  "hf_status": 200
1679
  },
 
 
 
 
 
 
 
 
 
 
 
 
1680
  {
1681
  "name": "novita/mistralai/mistral-nemo",
1682
  "type": "chat",
 
1703
  "size_b": 8,
1704
  "hf_private": false
1705
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1706
  {
1707
  "name": "deepinfra/zai-org/GLM-4.5-Air",
1708
  "type": "chat",
 
1738
  "hf_status": 200
1739
  },
1740
  {
1741
+ "name": "xai/grok-4-fast",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1742
  "type": "chat",
1743
  "input_price_per_1m": 0.2,
1744
  "output_price_per_1m": 0.5,
 
1776
  "hf_private": true
1777
  },
1778
  {
1779
+ "name": "xai/grok-4-1-fast-reasoning",
1780
+ "type": "vision",
1781
+ "input_price_per_1m": 0.2,
1782
+ "output_price_per_1m": 0.5,
1783
+ "currency": "USD",
1784
+ "capabilities": [
1785
+ "vision"
1786
+ ],
1787
+ "context_window": 2000000,
1788
+ "hf_private": true
1789
+ },
1790
+ {
1791
+ "name": "xai/grok-4-fast-non-reasoning",
1792
  "type": "chat",
1793
  "input_price_per_1m": 0.2,
1794
  "output_price_per_1m": 0.5,
 
1802
  "hf_private": true
1803
  },
1804
  {
1805
+ "name": "openai-responses/gpt-5.4-nano",
1806
  "type": "vision",
1807
  "input_price_per_1m": 0.2,
1808
+ "output_price_per_1m": 1.25,
1809
  "currency": "USD",
1810
  "capabilities": [
1811
+ "vision",
1812
+ "reasoning"
1813
  ],
1814
+ "context_window": 400000,
1815
  "hf_private": true
1816
  },
1817
  {
 
1827
  "context_window": 400000,
1828
  "hf_private": true
1829
  },
1830
+ {
1831
+ "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1832
+ "type": "chat",
1833
+ "input_price_per_1m": 0.2,
1834
+ "output_price_per_1m": 0.85,
1835
+ "currency": "USD",
1836
+ "context_window": 1048576,
1837
+ "size_b": 17,
1838
+ "capabilities": [
1839
+ "vision",
1840
+ "tools"
1841
+ ],
1842
+ "hf_private": false
1843
+ },
1844
+ {
1845
+ "name": "novita/qwen/qwen3-235b-a22b-fp8",
1846
+ "type": "chat",
1847
+ "input_price_per_1m": 0.2,
1848
+ "output_price_per_1m": 0.8,
1849
+ "currency": "USD",
1850
+ "context_window": 128000,
1851
+ "size_b": 235,
1852
+ "capabilities": [
1853
+ "tools",
1854
+ "reasoning"
1855
+ ],
1856
+ "hf_id": "Qwen/Qwen3-235B-A22B",
1857
+ "hf_private": false,
1858
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
1859
+ "hf_status": 200
1860
+ },
1861
+ {
1862
+ "name": "together/meta-llama/LlamaGuard-2-8b",
1863
+ "type": "chat",
1864
+ "input_price_per_1m": 0.2,
1865
+ "output_price_per_1m": 0.2,
1866
+ "currency": "USD",
1867
+ "context_window": 8192,
1868
+ "size_b": 8,
1869
+ "hf_private": false
1870
+ },
1871
+ {
1872
+ "name": "alibaba/qwen3-30b-a3b-instruct-2507",
1873
+ "type": "vision",
1874
+ "input_price_per_1m": 0.2,
1875
+ "output_price_per_1m": 0.8,
1876
+ "currency": "USD",
1877
+ "capabilities": [
1878
+ "vision"
1879
+ ],
1880
+ "context_window": 131072,
1881
+ "size_b": 30,
1882
+ "hf_id": "Qwen/Qwen3-30B-A3B-Instruct-2507",
1883
+ "hf_private": false,
1884
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
1885
+ "hf_status": 200
1886
+ },
1887
+ {
1888
+ "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct",
1889
+ "type": "chat",
1890
+ "input_price_per_1m": 0.23,
1891
+ "output_price_per_1m": 0.4,
1892
+ "currency": "USD",
1893
+ "context_window": 131072,
1894
+ "size_b": 70,
1895
+ "capabilities": [
1896
+ "tools"
1897
+ ],
1898
+ "hf_private": false,
1899
+ "hf_id": "meta-llama/Llama-3.3-70B-Instruct",
1900
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
1901
+ "hf_status": 200
1902
+ },
1903
  {
1904
  "name": "deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1905
  "type": "chat",
 
1943
  "hf_status": 200
1944
  },
1945
  {
1946
+ "name": "google/gemini-3.1-flash-lite-preview",
1947
+ "type": "vision",
1948
+ "input_price_per_1m": 0.25,
1949
+ "output_price_per_1m": 1.5,
1950
  "currency": "USD",
 
 
1951
  "capabilities": [
1952
+ "vision"
1953
  ],
1954
+ "context_window": 1048576,
1955
+ "hf_private": true
 
 
1956
  },
1957
  {
1958
  "name": "mistral/open-mistral-7b",
 
1989
  "context_window": 1048576,
1990
  "hf_private": true
1991
  },
 
 
 
 
 
 
 
 
 
 
 
 
1992
  {
1993
  "name": "azure/gpt-5-mini",
1994
  "type": "chat",
 
2044
  "hf_private": true
2045
  },
2046
  {
2047
+ "name": "nebius/deepseek-ai/DeepSeek-V3.2",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2048
  "type": "chat",
2049
  "input_price_per_1m": 0.3,
2050
+ "output_price_per_1m": 0.45,
2051
  "currency": "USD",
2052
  "capabilities": [
2053
  "reasoning"
2054
  ],
2055
+ "context_window": 164000,
2056
+ "hf_id": "deepseek-ai/DeepSeek-V3.2",
2057
+ "size_b": 685.4,
2058
  "hf_private": false,
2059
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2060
  "hf_status": 200
2061
  },
2062
  {
2063
+ "name": "nebius/minimax/minimax-m2.1",
2064
  "type": "chat",
2065
  "input_price_per_1m": 0.3,
2066
+ "output_price_per_1m": 1.2,
2067
  "currency": "USD",
2068
  "capabilities": [
2069
  "reasoning"
2070
  ],
2071
+ "context_window": 200000,
2072
+ "hf_id": "MiniMaxAI/MiniMax-M2.1",
2073
+ "size_b": 228.7,
2074
  "hf_private": false,
2075
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2076
  "hf_status": 200
 
2103
  "hf_private": false
2104
  },
2105
  {
2106
+ "name": "xai/grok-3-mini",
2107
+ "type": "chat",
 
 
 
 
 
 
 
 
 
 
 
 
2108
  "input_price_per_1m": 0.3,
2109
+ "output_price_per_1m": 0.5,
2110
  "currency": "USD",
2111
  "capabilities": [
 
2112
  "reasoning"
2113
  ],
2114
+ "context_window": 131072,
2115
  "hf_private": true
2116
  },
2117
  {
2118
+ "name": "google/gemini-2.5-flash",
2119
  "type": "vision",
2120
  "input_price_per_1m": 0.3,
2121
  "output_price_per_1m": 2.5,
 
2128
  "hf_private": true
2129
  },
2130
  {
2131
+ "name": "mistral/codestral-latest",
2132
+ "type": "chat",
2133
  "input_price_per_1m": 0.3,
2134
+ "output_price_per_1m": 0.9,
2135
  "currency": "USD",
2136
+ "context_window": 131072,
 
 
 
 
2137
  "hf_private": true
2138
  },
2139
  {
2140
+ "name": "novita/minimax-m2.7",
2141
  "type": "vision",
2142
  "input_price_per_1m": 0.3,
2143
+ "output_price_per_1m": 1.2,
2144
  "currency": "USD",
2145
  "capabilities": [
2146
  "vision",
2147
  "reasoning"
2148
  ],
2149
+ "context_window": 200000,
2150
+ "hf_private": false,
2151
+ "size_b": 230,
2152
+ "size_source": "manual",
2153
+ "hf_id": "MiniMaxAI/MiniMax-M2.7",
2154
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2155
+ "hf_status": 200
2156
  },
2157
  {
2158
+ "name": "novita/MiniMax-M2.7",
2159
  "type": "vision",
2160
  "input_price_per_1m": 0.3,
2161
  "output_price_per_1m": 1.2,
 
2189
  "hf_status": 200
2190
  },
2191
  {
2192
+ "name": "coding/gemini-2.5-flash",
2193
+ "type": "vision",
2194
+ "input_price_per_1m": 0.3,
2195
+ "output_price_per_1m": 2.5,
2196
+ "currency": "USD",
2197
+ "capabilities": [
2198
+ "vision",
2199
+ "reasoning"
2200
+ ],
2201
+ "context_window": 1048576,
2202
+ "hf_private": true
2203
+ },
2204
+ {
2205
+ "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
2206
+ "type": "chat",
2207
+ "input_price_per_1m": 0.3,
2208
+ "output_price_per_1m": 0.3,
2209
+ "currency": "USD",
2210
+ "context_window": 32768,
2211
+ "size_b": 7,
2212
+ "hf_private": false
2213
+ },
2214
+ {
2215
+ "name": "alibaba/qwen3-coder-flash",
2216
+ "type": "vision",
2217
+ "input_price_per_1m": 0.3,
2218
+ "output_price_per_1m": 1.5,
2219
+ "currency": "USD",
2220
+ "capabilities": [
2221
+ "vision"
2222
+ ],
2223
+ "context_window": 1048576,
2224
+ "hf_private": true
2225
+ },
2226
+ {
2227
+ "name": "minimaxi/MiniMax-M2.7",
2228
  "type": "vision",
2229
  "input_price_per_1m": 0.3,
2230
  "output_price_per_1m": 1.2,
 
2276
  "hf_status": 200
2277
  },
2278
  {
2279
+ "name": "vertex/gemini-2.5-flash",
2280
  "type": "vision",
2281
  "input_price_per_1m": 0.3,
2282
+ "output_price_per_1m": 2.5,
2283
  "currency": "USD",
2284
  "capabilities": [
2285
  "vision",
2286
  "reasoning"
2287
  ],
2288
+ "context_window": 1048576,
2289
+ "hf_private": true
 
 
 
 
 
2290
  },
2291
  {
2292
+ "name": "vertex/gemini-2.5-flash-image",
2293
+ "type": "vision",
2294
  "input_price_per_1m": 0.3,
2295
+ "output_price_per_1m": 2.5,
2296
  "currency": "USD",
2297
  "capabilities": [
2298
+ "vision",
2299
  "reasoning"
2300
  ],
2301
+ "context_window": 1048576,
2302
  "hf_private": true
2303
  },
2304
  {
 
2343
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2344
  "hf_status": 200
2345
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2346
  {
2347
  "name": "nebius/zai-org/GLM-4.7",
2348
  "type": "chat",
 
2392
  "hf_status": 200
2393
  },
2394
  {
2395
+ "name": "mistral/mistral-medium-latest",
2396
  "type": "chat",
2397
  "input_price_per_1m": 0.4,
2398
+ "output_price_per_1m": 2,
2399
+ "currency": "USD",
2400
+ "context_window": 131072,
2401
+ "hf_private": true
2402
+ },
2403
+ {
2404
+ "name": "mistral/devstral-medium-2507",
2405
+ "type": "chat",
2406
+ "input_price_per_1m": 0.4,
2407
+ "output_price_per_1m": 2,
2408
  "currency": "USD",
2409
  "context_window": 131072,
2410
  "capabilities": [
 
2412
  ],
2413
  "hf_private": true
2414
  },
2415
+ {
2416
+ "name": "mistral/devstral-latest",
2417
+ "type": "chat",
2418
+ "input_price_per_1m": 0.4,
2419
+ "output_price_per_1m": 2,
2420
+ "currency": "USD",
2421
+ "context_window": 256000,
2422
+ "hf_private": true
2423
+ },
2424
+ {
2425
+ "name": "openai-responses/gpt-4.1-mini",
2426
+ "type": "vision",
2427
+ "input_price_per_1m": 0.4,
2428
+ "output_price_per_1m": 1.6,
2429
+ "currency": "USD",
2430
+ "capabilities": [
2431
+ "vision"
2432
+ ],
2433
+ "context_window": 1047576,
2434
+ "hf_private": true
2435
+ },
2436
+ {
2437
+ "name": "openai/gpt-4.1-mini",
2438
+ "type": "vision",
2439
+ "input_price_per_1m": 0.4,
2440
+ "output_price_per_1m": 1.6,
2441
+ "currency": "USD",
2442
+ "capabilities": [
2443
+ "vision"
2444
+ ],
2445
+ "context_window": 1047576,
2446
+ "hf_private": true
2447
+ },
2448
+ {
2449
+ "name": "novita/deepseek/deepseek-v3-turbo",
2450
+ "type": "chat",
2451
+ "input_price_per_1m": 0.4,
2452
+ "output_price_per_1m": 1.3,
2453
+ "currency": "USD",
2454
+ "context_window": 128000,
2455
+ "hf_private": true
2456
+ },
2457
  {
2458
  "name": "novita/deepseek/deepseek-v3-0324",
2459
  "type": "chat",
 
2472
  "hf_status": 200
2473
  },
2474
  {
2475
+ "name": "alibaba/qwen-plus",
2476
+ "type": "chat",
 
 
 
 
 
 
 
 
 
2477
  "input_price_per_1m": 0.4,
2478
+ "output_price_per_1m": 1.2,
2479
  "currency": "USD",
2480
+ "context_window": 131072,
2481
  "capabilities": [
2482
+ "tools"
2483
  ],
 
2484
  "hf_private": true
2485
  },
2486
  {
2487
+ "name": "azure/gpt-4.1-mini",
2488
  "type": "vision",
2489
  "input_price_per_1m": 0.4,
2490
  "output_price_per_1m": 1.6,
 
2496
  "hf_private": true
2497
  },
2498
  {
2499
+ "name": "azure/openai-responses/gpt-4.1-mini",
2500
  "type": "vision",
2501
  "input_price_per_1m": 0.4,
2502
  "output_price_per_1m": 1.6,
 
2508
  "hf_private": true
2509
  },
2510
  {
2511
+ "name": "nebius/deepseek-ai/DeepSeek-V3-0324",
2512
  "type": "chat",
2513
  "input_price_per_1m": 0.5,
2514
  "output_price_per_1m": 1.5,
2515
  "currency": "USD",
2516
+ "context_window": 128000,
2517
  "capabilities": [
2518
+ "tools",
2519
+ "reasoning"
2520
  ],
2521
+ "size_b": 685,
2522
+ "hf_id": "deepseek-ai/DeepSeek-V3-0324",
2523
+ "hf_private": false,
2524
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2525
+ "hf_status": 200
2526
  },
2527
  {
2528
+ "name": "nebius/moonshotai/kimi-k2.5",
2529
+ "type": "vision",
2530
  "input_price_per_1m": 0.5,
2531
+ "output_price_per_1m": 2.5,
2532
  "currency": "USD",
 
2533
  "capabilities": [
2534
+ "vision",
2535
  "reasoning"
2536
  ],
2537
+ "context_window": 256000,
2538
+ "hf_id": "moonshotai/Kimi-K2.5",
2539
+ "size_b": 1058.6,
2540
  "hf_private": false,
2541
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2542
  "hf_status": 200
 
2558
  "hf_status": 200
2559
  },
2560
  {
2561
+ "name": "google/gemini-3-flash-preview",
2562
  "type": "vision",
2563
  "input_price_per_1m": 0.5,
2564
+ "output_price_per_1m": 3,
2565
  "currency": "USD",
2566
  "capabilities": [
2567
  "vision",
2568
  "reasoning"
2569
  ],
2570
+ "context_window": 1048576,
2571
+ "hf_private": true
 
 
 
 
2572
  },
2573
  {
2574
+ "name": "google/gemini-3.1-flash-image-preview",
2575
  "type": "vision",
2576
  "input_price_per_1m": 0.5,
2577
+ "output_price_per_1m": 2,
2578
  "currency": "USD",
2579
  "capabilities": [
2580
  "vision",
2581
  "reasoning"
2582
  ],
2583
+ "context_window": 131072,
2584
  "hf_private": true
2585
  },
2586
  {
2587
+ "name": "mistral/mistral-large-latest",
2588
+ "type": "chat",
2589
  "input_price_per_1m": 0.5,
2590
+ "output_price_per_1m": 1.5,
2591
  "currency": "USD",
2592
+ "context_window": 131072,
2593
  "capabilities": [
2594
+ "tools"
 
2595
  ],
 
2596
  "hf_private": true
2597
  },
2598
  {
2599
+ "name": "vertex/gemini-3-flash-preview",
2600
  "type": "vision",
2601
  "input_price_per_1m": 0.5,
2602
+ "output_price_per_1m": 3,
2603
  "currency": "USD",
2604
  "capabilities": [
2605
  "vision",
2606
  "reasoning"
2607
  ],
2608
+ "context_window": 1048576,
2609
  "hf_private": true
2610
  },
2611
  {
2612
+ "name": "vertex/gemini-3.1-flash-image-preview",
2613
  "type": "vision",
2614
  "input_price_per_1m": 0.5,
2615
+ "output_price_per_1m": 2,
2616
  "currency": "USD",
2617
  "capabilities": [
2618
  "vision",
2619
  "reasoning"
2620
  ],
2621
+ "context_window": 131072,
2622
  "hf_private": true
2623
  },
2624
  {
 
2683
  "hf_status": 200
2684
  },
2685
  {
2686
+ "name": "nebius/zai-org/GLM-4.5",
2687
  "type": "chat",
2688
  "input_price_per_1m": 0.6,
2689
  "output_price_per_1m": 2.2,
2690
  "currency": "USD",
2691
+ "context_window": 128000,
2692
  "capabilities": [
2693
+ "tools",
2694
  "reasoning"
2695
  ],
2696
+ "hf_id": "zai-org/GLM-4.5",
2697
+ "size_b": 358.3,
2698
+ "hf_private": false,
2699
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2700
+ "hf_status": 200
2701
+ },
2702
+ {
2703
+ "name": "deepinfra/zai-org/GLM-4.5",
2704
+ "type": "chat",
2705
+ "input_price_per_1m": 0.6,
2706
+ "output_price_per_1m": 2.2,
2707
+ "currency": "USD",
2708
+ "context_window": 131072,
2709
+ "capabilities": [
2710
+ "tools",
2711
+ "reasoning"
2712
+ ],
2713
+ "hf_id": "zai-org/GLM-4.5",
2714
  "size_b": 358.3,
2715
  "hf_private": false,
2716
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
 
2749
  "hf_status": 200
2750
  },
2751
  {
2752
+ "name": "zai/GLM-4.7",
2753
  "type": "chat",
2754
  "input_price_per_1m": 0.6,
2755
  "output_price_per_1m": 2.2,
2756
  "currency": "USD",
 
2757
  "capabilities": [
 
2758
  "reasoning"
2759
  ],
2760
+ "context_window": 200000,
2761
+ "hf_id": "zai-org/GLM-4.7",
2762
  "size_b": 358.3,
2763
  "hf_private": false,
2764
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2765
  "hf_status": 200
2766
  },
2767
  {
2768
+ "name": "novita/zai-org/glm-4.5",
2769
  "type": "chat",
2770
  "input_price_per_1m": 0.6,
2771
  "output_price_per_1m": 2.2,
 
2781
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2782
  "hf_status": 200
2783
  },
2784
+ {
2785
+ "name": "novita/zai-org/glm-4.6",
2786
+ "type": "chat",
2787
+ "input_price_per_1m": 0.6,
2788
+ "output_price_per_1m": 2.2,
2789
+ "currency": "USD",
2790
+ "context_window": 204800,
2791
+ "capabilities": [
2792
+ "tools",
2793
+ "reasoning"
2794
+ ],
2795
+ "hf_id": "zai-org/GLM-4.6",
2796
+ "size_b": 356.8,
2797
+ "hf_private": false,
2798
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2799
+ "hf_status": 200
2800
+ },
2801
  {
2802
  "name": "alibaba/qwen3.5",
2803
  "type": "vision",
 
2816
  "hf_status": 200
2817
  },
2818
  {
2819
+ "name": "minimaxi/MiniMax-M2.7-highspeed",
2820
+ "type": "vision",
2821
  "input_price_per_1m": 0.6,
2822
+ "output_price_per_1m": 2.4,
2823
  "currency": "USD",
 
2824
  "capabilities": [
2825
+ "vision",
2826
+ "reasoning"
2827
  ],
2828
+ "context_window": 200000,
2829
+ "hf_private": false,
2830
+ "size_b": 230,
2831
+ "size_source": "manual"
2832
+ },
2833
+ {
2834
+ "name": "minimaxi/MiniMax-M2.5-highspeed",
2835
+ "type": "vision",
2836
+ "input_price_per_1m": 0.6,
2837
+ "output_price_per_1m": 2.4,
2838
+ "currency": "USD",
2839
+ "capabilities": [
2840
+ "vision",
2841
+ "reasoning"
2842
+ ],
2843
+ "context_window": 200000,
2844
+ "hf_id": "MiniMaxAI/MiniMax-M2.5",
2845
+ "size_b": 228.7,
2846
  "hf_private": false,
2847
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2848
  "hf_status": 200
 
2914
  "hf_status": 200
2915
  },
2916
  {
2917
+ "name": "moonshot/kimi-k2-0711-preview",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2918
  "type": "chat",
2919
  "input_price_per_1m": 0.6,
2920
+ "output_price_per_1m": 2.5,
2921
  "currency": "USD",
2922
  "context_window": 131072,
2923
  "capabilities": [
2924
+ "tools"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2925
  ],
2926
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2927
+ "size_b": 1026.5,
 
2928
  "hf_private": false,
2929
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2930
  "hf_status": 200
 
3053
  "hf_status": 200
3054
  },
3055
  {
3056
+ "name": "novita/deepseek/deepseek-r1-distill-llama-70b",
3057
  "type": "chat",
3058
  "input_price_per_1m": 0.8,
3059
  "output_price_per_1m": 0.8,
3060
  "currency": "USD",
3061
+ "context_window": 32000,
3062
+ "size_b": 70,
3063
  "capabilities": [
3064
+ "reasoning"
3065
  ],
3066
+ "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
3067
  "hf_private": false,
3068
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3069
  "hf_status": 200
3070
  },
3071
  {
3072
+ "name": "novita/qwen/qwen2.5-vl-72b-instruct",
3073
  "type": "chat",
3074
  "input_price_per_1m": 0.8,
3075
  "output_price_per_1m": 0.8,
3076
  "currency": "USD",
3077
+ "context_window": 96000,
3078
+ "size_b": 72,
3079
  "capabilities": [
3080
+ "vision"
3081
  ],
3082
+ "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
3083
  "hf_private": false,
3084
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3085
  "hf_status": 200
3086
  },
3087
  {
3088
+ "name": "deepinfra/deepseek-ai/DeepSeek-R1",
3089
  "type": "chat",
3090
  "input_price_per_1m": 0.85,
3091
+ "output_price_per_1m": 2.5,
3092
  "currency": "USD",
3093
+ "context_window": 64000,
3094
  "capabilities": [
3095
  "tools",
3096
  "reasoning"
3097
  ],
3098
+ "hf_id": "deepseek-ai/DeepSeek-R1",
3099
  "size_b": 671,
3100
+ "size_source": "manual",
3101
  "hf_private": false,
3102
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3103
  "hf_status": 200
3104
  },
3105
  {
3106
+ "name": "deepinfra/deepseek-ai/DeepSeek-V3",
3107
  "type": "chat",
3108
  "input_price_per_1m": 0.85,
3109
+ "output_price_per_1m": 0.9,
3110
  "currency": "USD",
3111
+ "context_window": 128000,
3112
  "capabilities": [
3113
  "tools",
3114
  "reasoning"
3115
  ],
3116
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3117
  "size_b": 671,
 
3118
  "hf_private": false,
3119
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3120
  "hf_status": 200
 
3189
  "hf_status": 200
3190
  },
3191
  {
3192
+ "name": "groq/moonshotai/kimi-k2-instruct",
3193
+ "type": "chat",
3194
  "input_price_per_1m": 1,
3195
+ "output_price_per_1m": 3,
3196
  "currency": "USD",
3197
+ "context_window": 131072,
3198
  "capabilities": [
3199
+ "tools"
 
3200
  ],
3201
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
3202
+ "size_b": 1026.5,
 
3203
  "hf_private": false,
3204
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3205
  "hf_status": 200
 
3221
  "hf_status": 200
3222
  },
3223
  {
3224
+ "name": "zai/GLM-5",
3225
+ "type": "vision",
3226
  "input_price_per_1m": 1,
3227
+ "output_price_per_1m": 3.2,
3228
  "currency": "USD",
 
3229
  "capabilities": [
3230
+ "vision",
3231
+ "reasoning"
3232
  ],
3233
+ "context_window": 200000,
3234
+ "hf_id": "zai-org/GLM-5",
3235
+ "size_b": 753.9,
3236
  "hf_private": false,
3237
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3238
  "hf_status": 200
3239
  },
3240
  {
3241
+ "name": "perplexity/sonar",
3242
+ "type": "chat",
3243
  "input_price_per_1m": 1,
3244
+ "output_price_per_1m": 1,
3245
  "currency": "USD",
3246
+ "context_window": 131072,
3247
  "capabilities": [
3248
  "vision"
3249
  ],
 
3250
  "hf_private": true
3251
  },
3252
  {
3253
+ "name": "anthropic/claude-haiku-4-5",
3254
  "type": "vision",
3255
  "input_price_per_1m": 1,
3256
  "output_price_per_1m": 5,
 
3262
  "hf_private": true
3263
  },
3264
  {
3265
+ "name": "openai/o3",
 
 
 
 
 
 
 
 
 
 
 
 
3266
  "type": "vision",
3267
  "input_price_per_1m": 1,
3268
+ "output_price_per_1m": 4,
3269
  "currency": "USD",
3270
  "capabilities": [
3271
+ "vision",
3272
+ "reasoning"
3273
  ],
3274
  "context_window": 200000,
3275
  "hf_private": true
 
3291
  "hf_status": 200
3292
  },
3293
  {
3294
+ "name": "bedrock/claude-haiku-4-5",
3295
  "type": "vision",
3296
  "input_price_per_1m": 1,
3297
  "output_price_per_1m": 5,
 
3303
  "hf_private": true
3304
  },
3305
  {
3306
+ "name": "alibaba/qwen3-coder-plus",
3307
  "type": "vision",
3308
  "input_price_per_1m": 1,
3309
+ "output_price_per_1m": 5,
3310
  "currency": "USD",
3311
  "capabilities": [
3312
+ "vision"
3313
+ ],
3314
+ "context_window": 1048576,
3315
+ "hf_private": true
3316
+ },
3317
+ {
3318
+ "name": "vertex/claude-haiku-4-5",
3319
+ "type": "vision",
3320
+ "input_price_per_1m": 1,
3321
+ "output_price_per_1m": 5,
3322
+ "currency": "USD",
3323
+ "capabilities": [
3324
+ "vision"
3325
  ],
3326
  "context_window": 200000,
3327
  "hf_private": true
 
3351
  "hf_private": true
3352
  },
3353
  {
3354
+ "name": "openai/o3-mini",
3355
  "type": "chat",
3356
  "input_price_per_1m": 1.1,
3357
  "output_price_per_1m": 4.4,
 
3363
  "hf_private": true
3364
  },
3365
  {
3366
+ "name": "azure/o4-mini",
3367
  "type": "chat",
3368
  "input_price_per_1m": 1.1,
3369
  "output_price_per_1m": 4.4,
 
3401
  "hf_status": 200
3402
  },
3403
  {
3404
+ "name": "google/gemini-2.5-pro",
3405
+ "type": "vision",
3406
  "input_price_per_1m": 1.25,
3407
+ "output_price_per_1m": 10,
3408
  "currency": "USD",
 
3409
  "capabilities": [
3410
+ "vision",
3411
  "reasoning"
3412
  ],
3413
+ "context_window": 1048576,
3414
+ "hf_private": true
 
 
 
3415
  },
3416
  {
3417
+ "name": "openai-responses/gpt-5.1-codex",
3418
  "type": "vision",
3419
  "input_price_per_1m": 1.25,
3420
  "output_price_per_1m": 10,
 
3427
  "hf_private": true
3428
  },
3429
  {
3430
+ "name": "openai-responses/gpt-5.1",
3431
  "type": "vision",
3432
  "input_price_per_1m": 1.25,
3433
  "output_price_per_1m": 10,
 
3440
  "hf_private": true
3441
  },
3442
  {
3443
+ "name": "openai-responses/gpt-5-codex",
3444
  "type": "vision",
3445
  "input_price_per_1m": 1.25,
3446
  "output_price_per_1m": 10,
 
3453
  "hf_private": true
3454
  },
3455
  {
3456
+ "name": "openai-responses/gpt-5",
3457
  "type": "vision",
3458
  "input_price_per_1m": 1.25,
3459
  "output_price_per_1m": 10,
 
3466
  "hf_private": true
3467
  },
3468
  {
3469
+ "name": "openai/gpt-5-chat",
3470
  "type": "vision",
3471
  "input_price_per_1m": 1.25,
3472
  "output_price_per_1m": 10,
 
3475
  "vision",
3476
  "reasoning"
3477
  ],
3478
+ "context_window": 128000,
3479
  "hf_private": true
3480
  },
3481
  {
3482
+ "name": "openai/gpt-5.1",
3483
  "type": "vision",
3484
  "input_price_per_1m": 1.25,
3485
  "output_price_per_1m": 10,
 
3488
  "vision",
3489
  "reasoning"
3490
  ],
3491
+ "context_window": 400000,
3492
  "hf_private": true
3493
  },
3494
  {
3495
+ "name": "openai/gpt-5.1-chat",
3496
  "type": "vision",
3497
  "input_price_per_1m": 1.25,
3498
  "output_price_per_1m": 10,
 
3501
  "vision",
3502
  "reasoning"
3503
  ],
3504
+ "context_window": 128000,
3505
  "hf_private": true
3506
  },
3507
  {
3508
+ "name": "coding/gemini-2.5-pro",
3509
+ "type": "vision",
3510
  "input_price_per_1m": 1.25,
3511
  "output_price_per_1m": 10,
3512
  "currency": "USD",
3513
  "capabilities": [
3514
+ "vision",
3515
  "reasoning"
3516
  ],
3517
+ "context_window": 1048576,
3518
  "hf_private": true
3519
  },
3520
  {
3521
+ "name": "together/deepseek-ai/DeepSeek-V3",
3522
  "type": "chat",
3523
  "input_price_per_1m": 1.25,
3524
+ "output_price_per_1m": 1.25,
3525
  "currency": "USD",
3526
+ "context_window": 131072,
3527
  "capabilities": [
3528
+ "tools",
3529
  "reasoning"
3530
  ],
3531
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3532
+ "size_b": 671,
3533
+ "hf_private": false,
3534
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
3535
+ "hf_status": 200
3536
  },
3537
  {
3538
+ "name": "vertex/gemini-2.5-pro",
3539
  "type": "vision",
3540
  "input_price_per_1m": 1.25,
3541
  "output_price_per_1m": 10,
 
3544
  "vision",
3545
  "reasoning"
3546
  ],
3547
+ "context_window": 1048576,
3548
  "hf_private": true
3549
  },
3550
  {
3551
+ "name": "azure/gpt-5",
3552
+ "type": "chat",
3553
  "input_price_per_1m": 1.25,
3554
  "output_price_per_1m": 10,
3555
  "currency": "USD",
3556
  "capabilities": [
 
3557
  "reasoning"
3558
  ],
3559
+ "context_window": 200000,
3560
  "hf_private": true
3561
  },
3562
  {
3563
+ "name": "azure/gpt-5.1",
3564
+ "type": "chat",
3565
  "input_price_per_1m": 1.25,
3566
  "output_price_per_1m": 10,
3567
  "currency": "USD",
3568
  "capabilities": [
 
3569
  "reasoning"
3570
  ],
3571
+ "context_window": 200000,
3572
  "hf_private": true
3573
  },
3574
  {
 
3604
  "hf_private": true
3605
  },
3606
  {
3607
+ "name": "openai-responses/gpt-5.2",
3608
  "type": "vision",
3609
  "input_price_per_1m": 1.75,
3610
  "output_price_per_1m": 14,
 
3617
  "hf_private": true
3618
  },
3619
  {
3620
+ "name": "openai-responses/gpt-5.2-codex",
3621
  "type": "vision",
3622
  "input_price_per_1m": 1.75,
3623
  "output_price_per_1m": 14,
 
3626
  "vision",
3627
  "reasoning"
3628
  ],
3629
+ "context_window": 400000,
3630
  "hf_private": true
3631
  },
3632
  {
3633
+ "name": "openai-responses/gpt-5.3-chat",
3634
  "type": "vision",
3635
  "input_price_per_1m": 1.75,
3636
  "output_price_per_1m": 14,
 
3639
  "vision",
3640
  "reasoning"
3641
  ],
3642
+ "context_window": 128000,
3643
  "hf_private": true
3644
  },
3645
  {
3646
+ "name": "openai-responses/gpt-5.3-codex",
3647
  "type": "vision",
3648
  "input_price_per_1m": 1.75,
3649
  "output_price_per_1m": 14,
 
3656
  "hf_private": true
3657
  },
3658
  {
3659
+ "name": "openai/gpt-5.3-chat",
3660
  "type": "vision",
3661
  "input_price_per_1m": 1.75,
3662
  "output_price_per_1m": 14,
 
3665
  "vision",
3666
  "reasoning"
3667
  ],
3668
+ "context_window": 128000,
3669
  "hf_private": true
3670
  },
3671
  {
3672
+ "name": "openai/gpt-5.2",
3673
  "type": "vision",
3674
  "input_price_per_1m": 1.75,
3675
  "output_price_per_1m": 14,
 
3682
  "hf_private": true
3683
  },
3684
  {
3685
+ "name": "openai/gpt-5.2-chat",
3686
+ "type": "vision",
3687
  "input_price_per_1m": 1.75,
3688
  "output_price_per_1m": 14,
3689
  "currency": "USD",
3690
  "capabilities": [
3691
+ "vision",
3692
  "reasoning"
3693
  ],
3694
+ "context_window": 128000,
3695
  "hf_private": true
3696
  },
3697
  {
3698
+ "name": "azure/openai-responses/gpt-5.2-codex",
3699
  "type": "vision",
3700
  "input_price_per_1m": 1.75,
3701
  "output_price_per_1m": 14,
 
3708
  "hf_private": true
3709
  },
3710
  {
3711
+ "name": "azure/gpt-5.2",
3712
+ "type": "chat",
3713
  "input_price_per_1m": 1.75,
3714
  "output_price_per_1m": 14,
3715
  "currency": "USD",
3716
  "capabilities": [
 
3717
  "reasoning"
3718
  ],
3719
+ "context_window": 200000,
3720
  "hf_private": true
3721
  },
3722
  {
3723
+ "name": "azure/gpt-5.3-codex",
3724
  "type": "vision",
3725
  "input_price_per_1m": 1.75,
3726
  "output_price_per_1m": 14,
 
3729
  "vision",
3730
  "reasoning"
3731
  ],
3732
+ "context_window": 400000,
3733
+ "hf_private": true
3734
+ },
3735
+ {
3736
+ "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3737
+ "type": "chat",
3738
+ "input_price_per_1m": 2,
3739
+ "output_price_per_1m": 6,
3740
+ "currency": "USD",
3741
  "context_window": 128000,
3742
  "hf_private": true
3743
  },
3744
  {
3745
+ "name": "perplexity/sonar-reasoning-pro",
3746
  "type": "chat",
3747
  "input_price_per_1m": 2,
3748
+ "output_price_per_1m": 8,
3749
  "currency": "USD",
3750
  "context_window": 131072,
3751
+ "capabilities": [
3752
+ "vision",
3753
+ "reasoning"
3754
+ ],
3755
  "hf_private": true
3756
  },
3757
  {
3758
+ "name": "xai/grok-4.2-beta",
3759
  "type": "vision",
3760
  "input_price_per_1m": 2,
3761
+ "output_price_per_1m": 6,
3762
  "currency": "USD",
3763
  "capabilities": [
3764
+ "vision",
3765
+ "reasoning"
3766
  ],
3767
+ "context_window": 2000000,
3768
  "hf_private": true
3769
  },
3770
  {
3771
+ "name": "xai/grok-2-1212",
3772
  "type": "chat",
3773
  "input_price_per_1m": 2,
3774
+ "output_price_per_1m": 10,
3775
  "currency": "USD",
3776
+ "context_window": 131072,
3777
  "hf_private": true
3778
  },
3779
  {
3780
+ "name": "google/gemini-3-pro-preview",
3781
  "type": "vision",
3782
  "input_price_per_1m": 2,
3783
  "output_price_per_1m": 12,
 
3790
  "hf_private": true
3791
  },
3792
  {
3793
+ "name": "google/gemini-3.1-pro-preview",
3794
  "type": "vision",
3795
  "input_price_per_1m": 2,
3796
  "output_price_per_1m": 12,
 
3803
  "hf_private": true
3804
  },
3805
  {
3806
+ "name": "mistral/pixtral-large-latest",
3807
+ "type": "chat",
3808
+ "input_price_per_1m": 2,
3809
+ "output_price_per_1m": 5,
3810
+ "currency": "USD",
3811
+ "context_window": 131072,
3812
+ "hf_private": true
3813
+ },
3814
+ {
3815
+ "name": "openai-responses/gpt-4.1",
3816
  "type": "vision",
3817
  "input_price_per_1m": 2,
3818
+ "output_price_per_1m": 8,
3819
+ "currency": "USD",
3820
+ "capabilities": [
3821
+ "vision"
3822
+ ],
3823
+ "context_window": 1047576,
3824
+ "hf_private": true
3825
+ },
3826
+ {
3827
+ "name": "openai/o4-mini-deep-research",
3828
+ "type": "vision",
3829
+ "input_price_per_1m": 2,
3830
+ "output_price_per_1m": 8,
3831
  "currency": "USD",
3832
  "capabilities": [
3833
  "vision",
3834
  "reasoning"
3835
  ],
3836
+ "context_window": 100000,
3837
  "hf_private": true
3838
  },
3839
  {
3840
+ "name": "openai/gpt-4.1",
3841
+ "type": "vision",
3842
  "input_price_per_1m": 2,
3843
  "output_price_per_1m": 8,
3844
  "currency": "USD",
 
3845
  "capabilities": [
3846
+ "vision"
 
3847
  ],
3848
+ "context_window": 1047576,
3849
  "hf_private": true
3850
  },
3851
  {
3852
+ "name": "vertex/gemini-3-pro-image-preview",
3853
  "type": "vision",
3854
  "input_price_per_1m": 2,
3855
  "output_price_per_1m": 12,
 
3862
  "hf_private": true
3863
  },
3864
  {
3865
+ "name": "vertex/gemini-3-pro-preview",
3866
  "type": "vision",
3867
  "input_price_per_1m": 2,
3868
  "output_price_per_1m": 12,
 
3875
  "hf_private": true
3876
  },
3877
  {
3878
+ "name": "vertex/gemini-3.1-pro-preview",
3879
  "type": "vision",
3880
  "input_price_per_1m": 2,
3881
+ "output_price_per_1m": 12,
3882
  "currency": "USD",
3883
  "capabilities": [
3884
  "vision",
3885
  "reasoning"
3886
  ],
3887
+ "context_window": 1048576,
 
 
 
 
 
 
 
 
 
3888
  "hf_private": true
3889
  },
3890
  {
 
3912
  "hf_private": true
3913
  },
3914
  {
3915
+ "name": "openai-responses/gpt-5.4",
3916
  "type": "vision",
3917
+ "input_price_per_1m": 2.5,
3918
+ "output_price_per_1m": 15,
3919
  "currency": "USD",
3920
  "capabilities": [
3921
  "vision",
3922
  "reasoning"
3923
  ],
3924
+ "context_window": 1050000,
 
 
 
 
 
 
 
 
 
 
 
 
3925
  "hf_private": true
3926
  },
3927
  {
3928
+ "name": "openai/gpt-5.4",
3929
  "type": "vision",
3930
  "input_price_per_1m": 2.5,
3931
  "output_price_per_1m": 15,
 
3938
  "hf_private": true
3939
  },
3940
  {
3941
+ "name": "openai/gpt-4o-2024-08-06",
3942
  "type": "vision",
3943
  "input_price_per_1m": 2.5,
3944
+ "output_price_per_1m": 10,
3945
  "currency": "USD",
3946
  "capabilities": [
3947
+ "vision"
 
3948
  ],
3949
+ "context_window": 128000,
3950
  "hf_private": true
3951
  },
3952
  {
3953
+ "name": "openai/gpt-4o-2024-05-13",
3954
  "type": "vision",
3955
  "input_price_per_1m": 2.5,
3956
  "output_price_per_1m": 10,
 
3962
  "hf_private": true
3963
  },
3964
  {
3965
+ "name": "openai/gpt-4o",
3966
  "type": "vision",
3967
  "input_price_per_1m": 2.5,
3968
  "output_price_per_1m": 10,
 
3974
  "hf_private": true
3975
  },
3976
  {
3977
+ "name": "openai/gpt-4o-2024-11-20",
3978
  "type": "vision",
3979
  "input_price_per_1m": 2.5,
3980
  "output_price_per_1m": 10,
 
3986
  "hf_private": true
3987
  },
3988
  {
3989
+ "name": "azure/openai-responses/gpt-5.4",
3990
  "type": "vision",
3991
  "input_price_per_1m": 2.5,
3992
  "output_price_per_1m": 15,
 
3999
  "hf_private": true
4000
  },
4001
  {
4002
+ "name": "perplexity/sonar-pro",
4003
+ "type": "chat",
4004
+ "input_price_per_1m": 3,
4005
+ "output_price_per_1m": 15,
4006
  "currency": "USD",
4007
+ "context_window": 204800,
4008
  "capabilities": [
4009
  "vision"
4010
  ],
 
4011
  "hf_private": true
4012
  },
4013
  {
4014
+ "name": "xai/grok-4",
4015
+ "type": "vision",
4016
  "input_price_per_1m": 3,
4017
+ "output_price_per_1m": 15,
4018
  "currency": "USD",
 
4019
  "capabilities": [
4020
+ "vision"
 
4021
  ],
4022
+ "context_window": 256000,
4023
+ "hf_private": true
 
 
 
 
4024
  },
4025
  {
4026
+ "name": "anthropic/claude-sonnet-4",
4027
  "type": "vision",
4028
  "input_price_per_1m": 3,
4029
  "output_price_per_1m": 15,
 
4032
  "vision",
4033
  "reasoning"
4034
  ],
4035
+ "context_window": 1000000,
4036
  "hf_private": true
4037
  },
4038
  {
4039
+ "name": "anthropic/claude-sonnet-4-6",
4040
  "type": "vision",
4041
  "input_price_per_1m": 3,
4042
  "output_price_per_1m": 15,
 
4045
  "vision",
4046
  "reasoning"
4047
  ],
4048
+ "context_window": 1000000,
4049
  "hf_private": true
4050
  },
4051
  {
4052
+ "name": "anthropic/claude-sonnet-4-5",
4053
  "type": "vision",
4054
  "input_price_per_1m": 3,
4055
  "output_price_per_1m": 15,
 
4058
  "vision",
4059
  "reasoning"
4060
  ],
4061
+ "context_window": 1000000,
4062
  "hf_private": true
4063
  },
4064
  {
4065
+ "name": "bedrock/claude-sonnet-4",
4066
  "type": "vision",
4067
  "input_price_per_1m": 3,
4068
  "output_price_per_1m": 15,
4069
  "currency": "USD",
4070
  "capabilities": [
4071
+ "vision",
4072
+ "reasoning"
4073
  ],
4074
  "context_window": 200000,
4075
  "hf_private": true
4076
  },
4077
  {
4078
+ "name": "bedrock/claude-3-7-sonnet",
 
 
 
 
 
 
 
 
 
 
 
 
4079
  "type": "vision",
4080
  "input_price_per_1m": 3,
4081
  "output_price_per_1m": 15,
 
4088
  "hf_private": true
4089
  },
4090
  {
4091
+ "name": "bedrock/claude-sonnet-4-6",
4092
  "type": "vision",
4093
  "input_price_per_1m": 3,
4094
  "output_price_per_1m": 15,
 
4097
  "vision",
4098
  "reasoning"
4099
  ],
4100
+ "context_window": 1000000,
4101
  "hf_private": true
4102
  },
4103
  {
4104
+ "name": "bedrock/claude-sonnet-4-5",
4105
  "type": "vision",
4106
  "input_price_per_1m": 3,
4107
  "output_price_per_1m": 15,
 
4110
  "vision",
4111
  "reasoning"
4112
  ],
4113
+ "context_window": 200000,
4114
  "hf_private": true
4115
  },
4116
  {
4117
+ "name": "coding/claude-sonnet-4-20250514",
4118
  "type": "vision",
4119
  "input_price_per_1m": 3,
4120
  "output_price_per_1m": 15,
 
4127
  "hf_private": true
4128
  },
4129
  {
4130
+ "name": "together/deepseek-ai/DeepSeek-R1",
4131
+ "type": "chat",
4132
  "input_price_per_1m": 3,
4133
+ "output_price_per_1m": 7,
4134
  "currency": "USD",
4135
+ "context_window": 64000,
4136
  "capabilities": [
4137
+ "tools",
4138
  "reasoning"
4139
  ],
4140
+ "hf_id": "deepseek-ai/DeepSeek-R1",
4141
+ "size_b": 671,
4142
+ "size_source": "manual",
4143
+ "hf_private": false,
4144
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
4145
+ "hf_status": 200
4146
  },
4147
  {
4148
+ "name": "vertex/claude-3-5-sonnet",
4149
  "type": "vision",
4150
  "input_price_per_1m": 3,
4151
  "output_price_per_1m": 15,
 
4153
  "capabilities": [
4154
  "vision"
4155
  ],
4156
+ "context_window": 200000,
4157
  "hf_private": true
4158
  },
4159
  {
4160
+ "name": "vertex/claude-sonnet-4-5",
4161
  "type": "vision",
4162
  "input_price_per_1m": 3,
4163
  "output_price_per_1m": 15,
 
4166
  "vision",
4167
  "reasoning"
4168
  ],
4169
+ "context_window": 200000,
4170
  "hf_private": true
4171
  },
4172
  {
4173
+ "name": "vertex/claude-sonnet-4",
4174
  "type": "vision",
4175
  "input_price_per_1m": 3,
4176
  "output_price_per_1m": 15,
 
4179
  "vision",
4180
  "reasoning"
4181
  ],
4182
+ "context_window": 200000,
4183
  "hf_private": true
4184
  },
4185
  {
4186
+ "name": "vertex/claude-3-7-sonnet",
4187
  "type": "vision",
4188
  "input_price_per_1m": 3,
4189
  "output_price_per_1m": 15,
 
4192
  "vision",
4193
  "reasoning"
4194
  ],
4195
+ "context_window": 200000,
4196
  "hf_private": true
4197
  },
4198
  {
 
4214
  "hf_status": 200
4215
  },
4216
  {
4217
+ "name": "xai/grok-3",
4218
+ "type": "chat",
4219
  "input_price_per_1m": 5,
4220
  "output_price_per_1m": 25,
4221
  "currency": "USD",
4222
+ "context_window": 131072,
4223
  "capabilities": [
4224
+ "tools"
 
4225
  ],
 
4226
  "hf_private": true
4227
  },
4228
  {
4229
+ "name": "anthropic/claude-opus-4-5",
4230
  "type": "vision",
4231
  "input_price_per_1m": 5,
4232
  "output_price_per_1m": 25,
 
4239
  "hf_private": true
4240
  },
4241
  {
4242
+ "name": "anthropic/claude-opus-4-6",
4243
  "type": "vision",
4244
  "input_price_per_1m": 5,
4245
  "output_price_per_1m": 25,
 
4248
  "vision",
4249
  "reasoning"
4250
  ],
4251
+ "context_window": 1000000,
4252
  "hf_private": true
4253
  },
4254
  {
4255
+ "name": "openai/chatgpt-4o",
4256
  "type": "vision",
4257
  "input_price_per_1m": 5,
4258
+ "output_price_per_1m": 15,
4259
  "currency": "USD",
4260
  "capabilities": [
4261
+ "vision"
 
4262
  ],
4263
+ "context_window": 128000,
4264
  "hf_private": true
4265
  },
4266
  {
4267
+ "name": "bedrock/claude-opus-4-5",
4268
+ "type": "vision",
4269
  "input_price_per_1m": 5,
4270
  "output_price_per_1m": 25,
4271
  "currency": "USD",
 
4272
  "capabilities": [
4273
+ "vision",
4274
+ "reasoning"
4275
  ],
4276
+ "context_window": 200000,
4277
  "hf_private": true
4278
  },
4279
  {
4280
+ "name": "bedrock/claude-opus-4-6",
4281
  "type": "vision",
4282
  "input_price_per_1m": 5,
4283
  "output_price_per_1m": 25,
 
4286
  "vision",
4287
  "reasoning"
4288
  ],
4289
+ "context_window": 1000000,
4290
  "hf_private": true
4291
  },
4292
  {
4293
+ "name": "vertex/claude-opus-4-6",
4294
  "type": "vision",
4295
  "input_price_per_1m": 5,
4296
  "output_price_per_1m": 25,
 
4303
  "hf_private": true
4304
  },
4305
  {
4306
+ "name": "vertex/claude-opus-4-5",
4307
  "type": "vision",
4308
  "input_price_per_1m": 5,
4309
+ "output_price_per_1m": 25,
4310
  "currency": "USD",
4311
  "capabilities": [
4312
+ "vision",
4313
+ "reasoning"
4314
  ],
4315
+ "context_window": 200000,
4316
  "hf_private": true
4317
  },
4318
  {
 
4329
  "hf_private": true
4330
  },
4331
  {
4332
+ "name": "anthropic/claude-opus-4",
4333
  "type": "vision",
4334
  "input_price_per_1m": 15,
4335
+ "output_price_per_1m": 75,
4336
  "currency": "USD",
4337
  "capabilities": [
4338
  "vision",
4339
  "reasoning"
4340
  ],
4341
+ "context_window": 200000,
4342
  "hf_private": true
4343
  },
4344
  {
4345
+ "name": "anthropic/claude-opus-4-1",
4346
  "type": "vision",
4347
  "input_price_per_1m": 15,
4348
  "output_price_per_1m": 75,
 
4355
  "hf_private": true
4356
  },
4357
  {
4358
+ "name": "openai-responses/gpt-5-pro",
4359
  "type": "vision",
4360
  "input_price_per_1m": 15,
4361
+ "output_price_per_1m": 120,
4362
  "currency": "USD",
4363
  "capabilities": [
4364
  "vision",
4365
  "reasoning"
4366
  ],
4367
+ "context_window": 400000,
4368
  "hf_private": true
4369
  },
4370
  {
4371
+ "name": "openai/o1",
4372
  "type": "vision",
4373
  "input_price_per_1m": 15,
4374
+ "output_price_per_1m": 60,
4375
  "currency": "USD",
4376
  "capabilities": [
4377
  "vision",
 
4394
  "hf_private": true
4395
  },
4396
  {
4397
+ "name": "coding/claude-opus-4-20250514",
4398
  "type": "vision",
4399
  "input_price_per_1m": 15,
4400
  "output_price_per_1m": 75,
 
4407
  "hf_private": true
4408
  },
4409
  {
4410
+ "name": "vertex/claude-opus-4-1",
4411
  "type": "vision",
4412
  "input_price_per_1m": 15,
4413
  "output_price_per_1m": 75,
 
4420
  "hf_private": true
4421
  },
4422
  {
4423
+ "name": "vertex/claude-opus-4",
4424
  "type": "vision",
4425
  "input_price_per_1m": 15,
4426
+ "output_price_per_1m": 75,
4427
  "currency": "USD",
4428
  "capabilities": [
4429
  "vision",
 
4459
  "hf_private": true
4460
  },
4461
  {
4462
+ "name": "openai/gpt-5.4-pro",
4463
  "type": "vision",
4464
  "input_price_per_1m": 30,
4465
  "output_price_per_1m": 180,
 
4472
  "hf_private": true
4473
  },
4474
  {
4475
+ "name": "azure/openai-responses/gpt-5.4-pro",
4476
  "type": "vision",
4477
  "input_price_per_1m": 30,
4478
  "output_price_per_1m": 180,
 
5636
  "output_price_per_1m": 1.5,
5637
  "currency": "USD",
5638
  "api_endpoint": "magistral-small-latest",
5639
+ "hf_private": false,
5640
+ "size_b": 23.6,
5641
+ "size_source": "hf-total",
5642
+ "hf_id": "mistralai/Magistral-Small-2506",
5643
+ "hf_validated_at": "2026-03-22T20:03:46.317Z",
5644
+ "hf_status": 200
5645
  },
5646
  {
5647
  "name": "Ministral 3 - 3B",
 
5808
  "tools"
5809
  ],
5810
  "size_b": 124,
5811
+ "hf_private": false,
5812
+ "hf_id": "mistralai/Pixtral-Large-Instruct-2411",
5813
+ "hf_validated_at": "2026-03-22T20:03:46.317Z",
5814
+ "hf_status": 200
5815
  },
5816
  {
5817
  "name": "Pixtral 12B",
scripts/fetch-providers.js CHANGED
@@ -245,6 +245,9 @@ const MANUAL_HF_ID_MAP = {
245
  'kimi-k2-thinking': 'moonshotai/Kimi-K2-Thinking',
246
  'llama 4 scout': 'meta-llama/Llama-4-Scout-17B-16E-Instruct',
247
  'llama 4 maverick': 'meta-llama/Llama-4-Maverick-17B-128E-Instruct',
 
 
 
248
  };
249
 
250
  const MANUAL_OLLAMA_ID_MAP = {
 
245
  'kimi-k2-thinking': 'moonshotai/Kimi-K2-Thinking',
246
  'llama 4 scout': 'meta-llama/Llama-4-Scout-17B-16E-Instruct',
247
  'llama 4 maverick': 'meta-llama/Llama-4-Maverick-17B-128E-Instruct',
248
+ 'magistral small': 'mistralai/Magistral-Small-2506',
249
+ 'pixtral large': 'mistralai/Pixtral-Large-Instruct-2411',
250
+ 'hermes 3 llama 3.1 405b': 'NousResearch/Hermes-3-Llama-3.1-405B',
251
  };
252
 
253
  const MANUAL_OLLAMA_ID_MAP = {