CrispStrobe commited on
Commit
2d8f720
·
1 Parent(s): 83eb519

fix: correct Apertus/Teuken IDs and ensure robust mapping for Kimi models

Browse files
Files changed (2) hide show
  1. data/providers.json +859 -849
  2. scripts/fetch-providers.js +2 -0
data/providers.json CHANGED
@@ -1163,16 +1163,6 @@
1163
  "gdpr_compliant": true,
1164
  "eu_endpoints": true,
1165
  "models": [
1166
- {
1167
- "name": "deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
1168
- "type": "chat",
1169
- "input_price_per_1m": 0.02,
1170
- "output_price_per_1m": 0.05,
1171
- "currency": "USD",
1172
- "context_window": 131072,
1173
- "size_b": 8,
1174
- "hf_private": false
1175
- },
1176
  {
1177
  "name": "novita/meta-llama/llama-3.2-1b-instruct",
1178
  "type": "chat",
@@ -1186,6 +1176,16 @@
1186
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1187
  "hf_status": 200
1188
  },
 
 
 
 
 
 
 
 
 
 
1189
  {
1190
  "name": "openai/gpt-5-nano",
1191
  "type": "vision",
@@ -1229,27 +1229,32 @@
1229
  "hf_status": 200
1230
  },
1231
  {
1232
- "name": "openai-responses/gpt-5-nano",
1233
- "type": "vision",
1234
  "input_price_per_1m": 0.05,
1235
  "output_price_per_1m": 0.4,
1236
  "currency": "USD",
1237
  "capabilities": [
1238
- "vision",
1239
  "reasoning"
1240
  ],
1241
- "context_window": 400000,
1242
  "hf_private": true
1243
  },
1244
  {
1245
- "name": "novita/sao10k/l3-8b-lunaris",
1246
  "type": "chat",
1247
  "input_price_per_1m": 0.05,
1248
  "output_price_per_1m": 0.05,
1249
  "currency": "USD",
1250
- "context_window": 8192,
1251
  "size_b": 8,
1252
- "hf_private": false
 
 
 
 
 
 
1253
  },
1254
  {
1255
  "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
@@ -1262,43 +1267,38 @@
1262
  "hf_private": false
1263
  },
1264
  {
1265
- "name": "novita/meta-llama/llama-3.1-8b-instruct",
1266
  "type": "chat",
1267
  "input_price_per_1m": 0.05,
1268
  "output_price_per_1m": 0.05,
1269
  "currency": "USD",
1270
- "context_window": 16384,
1271
  "size_b": 8,
1272
- "capabilities": [
1273
- "tools"
1274
- ],
1275
- "hf_private": false,
1276
- "hf_id": "meta-llama/Meta-Llama-3.1-8B-Instruct",
1277
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
1278
- "hf_status": 200
1279
  },
1280
  {
1281
- "name": "alibaba/qwen-turbo",
1282
- "type": "chat",
1283
  "input_price_per_1m": 0.05,
1284
- "output_price_per_1m": 0.2,
1285
  "currency": "USD",
1286
- "context_window": 1000000,
1287
  "capabilities": [
1288
- "tools"
 
1289
  ],
 
1290
  "hf_private": true
1291
  },
1292
  {
1293
- "name": "azure/gpt-5-nano",
1294
  "type": "chat",
1295
  "input_price_per_1m": 0.05,
1296
- "output_price_per_1m": 0.4,
1297
  "currency": "USD",
 
1298
  "capabilities": [
1299
- "reasoning"
1300
  ],
1301
- "context_window": 200000,
1302
  "hf_private": true
1303
  },
1304
  {
@@ -1349,54 +1349,19 @@
1349
  "hf_status": 200
1350
  },
1351
  {
1352
- "name": "groq/openai/gpt-oss-20b",
1353
- "type": "chat",
1354
- "input_price_per_1m": 0.1,
1355
- "output_price_per_1m": 0.5,
1356
- "currency": "USD",
1357
- "context_window": 131072,
1358
- "size_b": 20,
1359
- "capabilities": [
1360
- "tools",
1361
- "reasoning"
1362
- ],
1363
- "hf_id": "openai/gpt-oss-20b",
1364
- "hf_private": false,
1365
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
1366
- "hf_status": 200
1367
- },
1368
- {
1369
- "name": "deepinfra/Qwen/Qwen3-32B",
1370
- "type": "chat",
1371
- "input_price_per_1m": 0.1,
1372
- "output_price_per_1m": 0.3,
1373
- "currency": "USD",
1374
- "context_window": 40000,
1375
- "size_b": 32,
1376
- "capabilities": [
1377
- "tools",
1378
- "reasoning"
1379
- ],
1380
- "hf_id": "Qwen/Qwen3-32B",
1381
- "hf_private": false,
1382
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
1383
- "hf_status": 200
1384
- },
1385
- {
1386
- "name": "google/gemini-2.5-flash-lite",
1387
  "type": "vision",
1388
  "input_price_per_1m": 0.1,
1389
  "output_price_per_1m": 0.4,
1390
  "currency": "USD",
1391
  "capabilities": [
1392
- "vision",
1393
- "reasoning"
1394
  ],
1395
- "context_window": 1048576,
1396
  "hf_private": true
1397
  },
1398
  {
1399
- "name": "google/gemini-2.0-flash-001",
1400
  "type": "vision",
1401
  "input_price_per_1m": 0.1,
1402
  "output_price_per_1m": 0.4,
@@ -1404,11 +1369,11 @@
1404
  "capabilities": [
1405
  "vision"
1406
  ],
1407
- "context_window": 1048576,
1408
  "hf_private": true
1409
  },
1410
  {
1411
- "name": "mistral/devstral-small-latest",
1412
  "type": "chat",
1413
  "input_price_per_1m": 0.1,
1414
  "output_price_per_1m": 0.3,
@@ -1424,16 +1389,7 @@
1424
  "hf_status": 200
1425
  },
1426
  {
1427
- "name": "mistral/mistral-small-2503",
1428
- "type": "chat",
1429
- "input_price_per_1m": 0.1,
1430
- "output_price_per_1m": 0.3,
1431
- "currency": "USD",
1432
- "context_window": 32768,
1433
- "hf_private": true
1434
- },
1435
- {
1436
- "name": "mistral/devstral-small-2507",
1437
  "type": "chat",
1438
  "input_price_per_1m": 0.1,
1439
  "output_price_per_1m": 0.3,
@@ -1448,6 +1404,15 @@
1448
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1449
  "hf_status": 200
1450
  },
 
 
 
 
 
 
 
 
 
1451
  {
1452
  "name": "openai-responses/gpt-4.1-nano",
1453
  "type": "vision",
@@ -1460,6 +1425,19 @@
1460
  "context_window": 1047576,
1461
  "hf_private": true
1462
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
1463
  {
1464
  "name": "openai/gpt-4.1-nano",
1465
  "type": "vision",
@@ -1473,51 +1451,73 @@
1473
  "hf_private": true
1474
  },
1475
  {
1476
- "name": "together/meta-llama/Meta-Llama-3-8B-Instruct-Lite",
1477
  "type": "chat",
1478
  "input_price_per_1m": 0.1,
1479
- "output_price_per_1m": 0.1,
1480
  "currency": "USD",
1481
- "context_window": 8192,
1482
- "size_b": 8,
1483
- "hf_private": false
 
 
 
 
 
 
 
1484
  },
1485
  {
1486
- "name": "vertex/gemini-2.5-flash-lite",
1487
  "type": "vision",
1488
  "input_price_per_1m": 0.1,
1489
  "output_price_per_1m": 0.4,
1490
  "currency": "USD",
1491
  "capabilities": [
1492
- "vision",
1493
- "reasoning"
1494
  ],
1495
  "context_window": 1048576,
1496
  "hf_private": true
1497
  },
1498
  {
1499
- "name": "azure/openai-responses/gpt-4.1-nano",
1500
  "type": "vision",
1501
  "input_price_per_1m": 0.1,
1502
  "output_price_per_1m": 0.4,
1503
  "currency": "USD",
1504
  "capabilities": [
1505
- "vision"
 
1506
  ],
1507
- "context_window": 1047576,
1508
  "hf_private": true
1509
  },
1510
  {
1511
- "name": "azure/gpt-4.1-nano",
1512
- "type": "vision",
1513
  "input_price_per_1m": 0.1,
1514
- "output_price_per_1m": 0.4,
1515
  "currency": "USD",
 
 
1516
  "capabilities": [
1517
- "vision"
 
1518
  ],
1519
- "context_window": 1047576,
1520
- "hf_private": true
 
 
 
 
 
 
 
 
 
 
 
 
1521
  },
1522
  {
1523
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo",
@@ -1575,48 +1575,40 @@
1575
  "hf_status": 200
1576
  },
1577
  {
1578
- "name": "groq/openai/gpt-oss-120b",
1579
  "type": "chat",
1580
  "input_price_per_1m": 0.15,
1581
- "output_price_per_1m": 0.75,
1582
  "currency": "USD",
1583
- "context_window": 131072,
1584
- "size_b": 120,
1585
  "capabilities": [
1586
  "tools",
1587
  "reasoning"
1588
  ],
1589
- "hf_id": "openai/gpt-oss-120b",
 
1590
  "hf_private": false,
1591
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1592
  "hf_status": 200
1593
  },
1594
  {
1595
- "name": "nebius/openai/gpt-oss-120b",
1596
- "type": "chat",
1597
  "input_price_per_1m": 0.15,
1598
  "output_price_per_1m": 0.6,
1599
  "currency": "USD",
1600
  "capabilities": [
 
1601
  "reasoning"
1602
  ],
1603
- "context_window": 131000,
1604
- "size_b": 120,
1605
- "hf_id": "openai/gpt-oss-120b",
1606
  "hf_private": false,
1607
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1608
  "hf_status": 200
1609
  },
1610
- {
1611
- "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1612
- "type": "chat",
1613
- "input_price_per_1m": 0.15,
1614
- "output_price_per_1m": 0.85,
1615
- "currency": "USD",
1616
- "context_window": 262144,
1617
- "size_b": 235,
1618
- "hf_private": false
1619
- },
1620
  {
1621
  "name": "mistral/mistral-small-latest",
1622
  "type": "vision",
@@ -1630,23 +1622,6 @@
1630
  "context_window": 256000,
1631
  "hf_private": true
1632
  },
1633
- {
1634
- "name": "mistral/mistral-small-2603",
1635
- "type": "vision",
1636
- "input_price_per_1m": 0.15,
1637
- "output_price_per_1m": 0.6,
1638
- "currency": "USD",
1639
- "capabilities": [
1640
- "vision",
1641
- "reasoning"
1642
- ],
1643
- "context_window": 256000,
1644
- "size_b": 119,
1645
- "hf_id": "mistralai/Mistral-Small-4-119B-2603",
1646
- "hf_private": false,
1647
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
1648
- "hf_status": 200
1649
- },
1650
  {
1651
  "name": "openai/gpt-4o-mini",
1652
  "type": "vision",
@@ -1660,19 +1635,44 @@
1660
  "hf_private": true
1661
  },
1662
  {
1663
- "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
1664
  "type": "chat",
1665
  "input_price_per_1m": 0.15,
1666
- "output_price_per_1m": 0.15,
1667
  "currency": "USD",
1668
- "context_window": 128000,
1669
- "size_b": 14,
 
 
 
 
 
 
 
 
 
 
1670
  "capabilities": [
1671
  "tools",
1672
  "reasoning"
1673
  ],
1674
- "hf_id": "deepseek-ai/DeepSeek-R1",
1675
- "size_source": "manual",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1676
  "hf_private": false,
1677
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1678
  "hf_status": 200
@@ -1704,87 +1704,84 @@
1704
  "hf_private": false
1705
  },
1706
  {
1707
- "name": "deepinfra/zai-org/GLM-4.5-Air",
1708
  "type": "chat",
1709
  "input_price_per_1m": 0.2,
1710
- "output_price_per_1m": 1.1,
1711
  "currency": "USD",
1712
- "context_window": 131072,
 
1713
  "capabilities": [
1714
  "tools",
1715
  "reasoning"
1716
  ],
1717
- "hf_id": "zai-org/GLM-4.5-Air",
1718
- "size_b": 110.5,
1719
  "hf_private": false,
1720
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1721
  "hf_status": 200
1722
  },
1723
  {
1724
- "name": "deepinfra/Qwen/Qwen3-235B-A22B",
1725
  "type": "chat",
1726
  "input_price_per_1m": 0.2,
1727
- "output_price_per_1m": 0.6,
1728
  "currency": "USD",
1729
- "context_window": 40000,
1730
- "size_b": 235,
1731
  "capabilities": [
1732
- "tools",
1733
- "reasoning"
1734
  ],
1735
- "hf_id": "Qwen/Qwen3-235B-A22B",
1736
- "hf_private": false,
1737
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
1738
- "hf_status": 200
1739
  },
1740
  {
1741
- "name": "xai/grok-4-fast",
1742
- "type": "chat",
1743
  "input_price_per_1m": 0.2,
1744
- "output_price_per_1m": 0.5,
1745
  "currency": "USD",
1746
- "context_window": 2000000,
1747
  "capabilities": [
1748
  "vision",
1749
- "tools",
1750
  "reasoning"
1751
  ],
 
1752
  "hf_private": true
1753
  },
1754
  {
1755
- "name": "xai/grok-4-1-fast-non-reasoning",
1756
  "type": "vision",
1757
  "input_price_per_1m": 0.2,
1758
- "output_price_per_1m": 0.5,
1759
  "currency": "USD",
1760
  "capabilities": [
1761
- "vision"
 
1762
  ],
1763
- "context_window": 2000000,
1764
  "hf_private": true
1765
  },
1766
  {
1767
- "name": "xai/grok-code-fast-1",
1768
  "type": "vision",
1769
  "input_price_per_1m": 0.2,
1770
- "output_price_per_1m": 1.5,
1771
  "currency": "USD",
1772
  "capabilities": [
1773
  "vision"
1774
  ],
1775
- "context_window": 256000,
1776
  "hf_private": true
1777
  },
1778
  {
1779
- "name": "xai/grok-4-1-fast-reasoning",
1780
  "type": "vision",
1781
  "input_price_per_1m": 0.2,
1782
- "output_price_per_1m": 0.5,
1783
  "currency": "USD",
1784
  "capabilities": [
1785
  "vision"
1786
  ],
1787
- "context_window": 2000000,
1788
  "hf_private": true
1789
  },
1790
  {
@@ -1802,58 +1799,61 @@
1802
  "hf_private": true
1803
  },
1804
  {
1805
- "name": "openai-responses/gpt-5.4-nano",
1806
  "type": "vision",
1807
  "input_price_per_1m": 0.2,
1808
- "output_price_per_1m": 1.25,
1809
  "currency": "USD",
1810
  "capabilities": [
1811
- "vision",
1812
- "reasoning"
1813
  ],
1814
- "context_window": 400000,
1815
  "hf_private": true
1816
  },
1817
  {
1818
- "name": "openai/gpt-5.4-nano",
1819
- "type": "vision",
1820
  "input_price_per_1m": 0.2,
1821
- "output_price_per_1m": 1.25,
1822
  "currency": "USD",
 
1823
  "capabilities": [
1824
  "vision",
 
1825
  "reasoning"
1826
  ],
1827
- "context_window": 400000,
1828
  "hf_private": true
1829
  },
1830
  {
1831
- "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1832
  "type": "chat",
1833
  "input_price_per_1m": 0.2,
1834
- "output_price_per_1m": 0.85,
1835
  "currency": "USD",
1836
- "context_window": 1048576,
1837
- "size_b": 17,
1838
  "capabilities": [
1839
- "vision",
1840
- "tools"
1841
  ],
1842
- "hf_private": false
 
 
 
1843
  },
1844
  {
1845
- "name": "novita/qwen/qwen3-235b-a22b-fp8",
1846
  "type": "chat",
1847
  "input_price_per_1m": 0.2,
1848
- "output_price_per_1m": 0.8,
1849
  "currency": "USD",
1850
- "context_window": 128000,
1851
- "size_b": 235,
1852
  "capabilities": [
1853
  "tools",
1854
  "reasoning"
1855
  ],
1856
- "hf_id": "Qwen/Qwen3-235B-A22B",
 
1857
  "hf_private": false,
1858
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1859
  "hf_status": 200
@@ -1884,6 +1884,16 @@
1884
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1885
  "hf_status": 200
1886
  },
 
 
 
 
 
 
 
 
 
 
1887
  {
1888
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct",
1889
  "type": "chat",
@@ -1916,16 +1926,6 @@
1916
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1917
  "hf_status": 200
1918
  },
1919
- {
1920
- "name": "deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct",
1921
- "type": "chat",
1922
- "input_price_per_1m": 0.23,
1923
- "output_price_per_1m": 0.4,
1924
- "currency": "USD",
1925
- "context_window": 130815,
1926
- "size_b": 70,
1927
- "hf_private": false
1928
- },
1929
  {
1930
  "name": "deepinfra/Qwen/Qwen2.5-72B-Instruct",
1931
  "type": "chat",
@@ -1943,15 +1943,15 @@
1943
  "hf_status": 200
1944
  },
1945
  {
1946
- "name": "google/gemini-3.1-flash-lite-preview",
1947
- "type": "vision",
1948
  "input_price_per_1m": 0.25,
1949
- "output_price_per_1m": 1.5,
1950
  "currency": "USD",
1951
  "capabilities": [
1952
- "vision"
1953
  ],
1954
- "context_window": 1048576,
1955
  "hf_private": true
1956
  },
1957
  {
@@ -1990,15 +1990,15 @@
1990
  "hf_private": true
1991
  },
1992
  {
1993
- "name": "azure/gpt-5-mini",
1994
- "type": "chat",
1995
  "input_price_per_1m": 0.25,
1996
- "output_price_per_1m": 2,
1997
  "currency": "USD",
1998
  "capabilities": [
1999
- "reasoning"
2000
  ],
2001
- "context_window": 200000,
2002
  "hf_private": true
2003
  },
2004
  {
@@ -2044,91 +2044,111 @@
2044
  "hf_private": true
2045
  },
2046
  {
2047
- "name": "nebius/deepseek-ai/DeepSeek-V3.2",
2048
- "type": "chat",
2049
  "input_price_per_1m": 0.3,
2050
- "output_price_per_1m": 0.45,
2051
  "currency": "USD",
2052
  "capabilities": [
 
2053
  "reasoning"
2054
  ],
2055
- "context_window": 164000,
2056
- "hf_id": "deepseek-ai/DeepSeek-V3.2",
2057
- "size_b": 685.4,
2058
  "hf_private": false,
 
 
 
2059
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2060
  "hf_status": 200
2061
  },
2062
  {
2063
- "name": "nebius/minimax/minimax-m2.1",
2064
  "type": "chat",
2065
  "input_price_per_1m": 0.3,
2066
- "output_price_per_1m": 1.2,
2067
  "currency": "USD",
 
 
2068
  "capabilities": [
2069
  "reasoning"
2070
  ],
2071
- "context_window": 200000,
2072
- "hf_id": "MiniMaxAI/MiniMax-M2.1",
2073
- "size_b": 228.7,
2074
  "hf_private": false,
2075
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2076
  "hf_status": 200
2077
  },
2078
  {
2079
- "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
2080
- "type": "chat",
2081
  "input_price_per_1m": 0.3,
2082
- "output_price_per_1m": 1,
2083
  "currency": "USD",
2084
- "context_window": 163840,
2085
  "capabilities": [
2086
- "tools",
2087
  "reasoning"
2088
  ],
2089
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2090
- "size_b": 671,
2091
  "hf_private": false,
 
 
 
2092
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2093
  "hf_status": 200
2094
  },
2095
  {
2096
- "name": "parasail/parasail-gemma3-27b-it",
2097
- "type": "chat",
2098
- "input_price_per_1m": 0.3,
2099
- "output_price_per_1m": 0.5,
2100
- "currency": "USD",
2101
- "context_window": 128000,
2102
- "size_b": 27,
2103
- "hf_private": false
2104
- },
2105
- {
2106
- "name": "xai/grok-3-mini",
2107
- "type": "chat",
2108
  "input_price_per_1m": 0.3,
2109
- "output_price_per_1m": 0.5,
2110
  "currency": "USD",
2111
  "capabilities": [
 
2112
  "reasoning"
2113
  ],
2114
- "context_window": 131072,
2115
- "hf_private": true
 
 
 
 
 
2116
  },
2117
  {
2118
- "name": "google/gemini-2.5-flash",
2119
  "type": "vision",
2120
  "input_price_per_1m": 0.3,
2121
- "output_price_per_1m": 2.5,
2122
  "currency": "USD",
2123
  "capabilities": [
2124
  "vision",
2125
  "reasoning"
2126
  ],
2127
- "context_window": 1048576,
2128
- "hf_private": true
 
 
 
 
2129
  },
2130
  {
2131
- "name": "mistral/codestral-latest",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2132
  "type": "chat",
2133
  "input_price_per_1m": 0.3,
2134
  "output_price_per_1m": 0.9,
@@ -2137,56 +2157,42 @@
2137
  "hf_private": true
2138
  },
2139
  {
2140
- "name": "novita/minimax-m2.7",
2141
  "type": "vision",
2142
  "input_price_per_1m": 0.3,
2143
- "output_price_per_1m": 1.2,
2144
  "currency": "USD",
2145
  "capabilities": [
2146
  "vision",
2147
  "reasoning"
2148
  ],
2149
- "context_window": 200000,
2150
- "hf_private": false,
2151
- "size_b": 230,
2152
- "size_source": "manual",
2153
- "hf_id": "MiniMaxAI/MiniMax-M2.7",
2154
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2155
- "hf_status": 200
2156
  },
2157
  {
2158
- "name": "novita/MiniMax-M2.7",
2159
  "type": "vision",
2160
  "input_price_per_1m": 0.3,
2161
- "output_price_per_1m": 1.2,
2162
  "currency": "USD",
2163
  "capabilities": [
2164
  "vision",
2165
  "reasoning"
2166
  ],
2167
- "context_window": 200000,
2168
- "hf_private": false,
2169
- "size_b": 230,
2170
- "size_source": "manual",
2171
- "hf_id": "MiniMaxAI/MiniMax-M2.7",
2172
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2173
- "hf_status": 200
2174
  },
2175
  {
2176
- "name": "novita/deepseek/deepseek-r1-distill-qwen-32b",
2177
  "type": "chat",
2178
  "input_price_per_1m": 0.3,
2179
- "output_price_per_1m": 0.3,
2180
  "currency": "USD",
2181
- "context_window": 12800,
2182
- "size_b": 32,
2183
  "capabilities": [
2184
  "reasoning"
2185
  ],
2186
- "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
2187
- "hf_private": false,
2188
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2189
- "hf_status": 200
2190
  },
2191
  {
2192
  "name": "coding/gemini-2.5-flash",
@@ -2202,101 +2208,95 @@
2202
  "hf_private": true
2203
  },
2204
  {
2205
- "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
2206
  "type": "chat",
2207
  "input_price_per_1m": 0.3,
2208
- "output_price_per_1m": 0.3,
2209
  "currency": "USD",
2210
- "context_window": 32768,
2211
- "size_b": 7,
2212
- "hf_private": false
 
 
 
 
 
 
 
2213
  },
2214
  {
2215
- "name": "alibaba/qwen3-coder-flash",
2216
  "type": "vision",
2217
  "input_price_per_1m": 0.3,
2218
- "output_price_per_1m": 1.5,
2219
  "currency": "USD",
2220
  "capabilities": [
2221
- "vision"
 
2222
  ],
2223
  "context_window": 1048576,
2224
  "hf_private": true
2225
  },
2226
  {
2227
- "name": "minimaxi/MiniMax-M2.7",
2228
- "type": "vision",
2229
  "input_price_per_1m": 0.3,
2230
- "output_price_per_1m": 1.2,
2231
  "currency": "USD",
2232
- "capabilities": [
2233
- "vision",
2234
- "reasoning"
2235
- ],
2236
- "context_window": 200000,
2237
- "hf_private": false,
2238
- "size_b": 230,
2239
- "size_source": "manual",
2240
- "hf_id": "MiniMaxAI/MiniMax-M2.7",
2241
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2242
- "hf_status": 200
2243
  },
2244
  {
2245
- "name": "minimaxi/MiniMax-M2",
2246
  "type": "chat",
2247
  "input_price_per_1m": 0.3,
2248
  "output_price_per_1m": 1.2,
2249
  "currency": "USD",
2250
- "context_window": 200000,
2251
  "capabilities": [
2252
- "tools",
2253
  "reasoning"
2254
  ],
2255
- "hf_id": "MiniMaxAI/MiniMax-M2",
 
2256
  "size_b": 228.7,
2257
  "hf_private": false,
2258
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2259
  "hf_status": 200
2260
  },
2261
  {
2262
- "name": "minimaxi/MiniMax-M2.5",
2263
- "type": "vision",
2264
  "input_price_per_1m": 0.3,
2265
- "output_price_per_1m": 1.2,
2266
  "currency": "USD",
2267
  "capabilities": [
2268
- "vision",
2269
  "reasoning"
2270
  ],
2271
- "context_window": 200000,
2272
- "hf_id": "MiniMaxAI/MiniMax-M2.5",
2273
- "size_b": 228.7,
2274
  "hf_private": false,
2275
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2276
  "hf_status": 200
2277
  },
2278
  {
2279
- "name": "vertex/gemini-2.5-flash",
2280
- "type": "vision",
2281
  "input_price_per_1m": 0.3,
2282
- "output_price_per_1m": 2.5,
2283
  "currency": "USD",
2284
- "capabilities": [
2285
- "vision",
2286
- "reasoning"
2287
- ],
2288
- "context_window": 1048576,
2289
- "hf_private": true
2290
  },
2291
  {
2292
- "name": "vertex/gemini-2.5-flash-image",
2293
  "type": "vision",
2294
  "input_price_per_1m": 0.3,
2295
- "output_price_per_1m": 2.5,
2296
  "currency": "USD",
2297
  "capabilities": [
2298
- "vision",
2299
- "reasoning"
2300
  ],
2301
  "context_window": 1048576,
2302
  "hf_private": true
@@ -2344,85 +2344,7 @@
2344
  "hf_status": 200
2345
  },
2346
  {
2347
- "name": "nebius/zai-org/GLM-4.7",
2348
- "type": "chat",
2349
- "input_price_per_1m": 0.4,
2350
- "output_price_per_1m": 2,
2351
- "currency": "USD",
2352
- "capabilities": [
2353
- "reasoning"
2354
- ],
2355
- "context_window": 200000,
2356
- "hf_id": "zai-org/GLM-4.7",
2357
- "size_b": 358.3,
2358
- "hf_private": false,
2359
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2360
- "hf_status": 200
2361
- },
2362
- {
2363
- "name": "nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2364
- "type": "chat",
2365
- "input_price_per_1m": 0.4,
2366
- "output_price_per_1m": 1.8,
2367
- "currency": "USD",
2368
- "context_window": 262000,
2369
- "size_b": 480,
2370
- "capabilities": [
2371
- "tools"
2372
- ],
2373
- "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
2374
- "hf_private": false,
2375
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2376
- "hf_status": 200
2377
- },
2378
- {
2379
- "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2380
- "type": "chat",
2381
- "input_price_per_1m": 0.4,
2382
- "output_price_per_1m": 1.6,
2383
- "currency": "USD",
2384
- "context_window": 262144,
2385
- "size_b": 480,
2386
- "capabilities": [
2387
- "tools"
2388
- ],
2389
- "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
2390
- "hf_private": false,
2391
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2392
- "hf_status": 200
2393
- },
2394
- {
2395
- "name": "mistral/mistral-medium-latest",
2396
- "type": "chat",
2397
- "input_price_per_1m": 0.4,
2398
- "output_price_per_1m": 2,
2399
- "currency": "USD",
2400
- "context_window": 131072,
2401
- "hf_private": true
2402
- },
2403
- {
2404
- "name": "mistral/devstral-medium-2507",
2405
- "type": "chat",
2406
- "input_price_per_1m": 0.4,
2407
- "output_price_per_1m": 2,
2408
- "currency": "USD",
2409
- "context_window": 131072,
2410
- "capabilities": [
2411
- "tools"
2412
- ],
2413
- "hf_private": true
2414
- },
2415
- {
2416
- "name": "mistral/devstral-latest",
2417
- "type": "chat",
2418
- "input_price_per_1m": 0.4,
2419
- "output_price_per_1m": 2,
2420
- "currency": "USD",
2421
- "context_window": 256000,
2422
- "hf_private": true
2423
- },
2424
- {
2425
- "name": "openai-responses/gpt-4.1-mini",
2426
  "type": "vision",
2427
  "input_price_per_1m": 0.4,
2428
  "output_price_per_1m": 1.6,
@@ -2434,7 +2356,7 @@
2434
  "hf_private": true
2435
  },
2436
  {
2437
- "name": "openai/gpt-4.1-mini",
2438
  "type": "vision",
2439
  "input_price_per_1m": 0.4,
2440
  "output_price_per_1m": 1.6,
@@ -2472,10 +2394,10 @@
2472
  "hf_status": 200
2473
  },
2474
  {
2475
- "name": "alibaba/qwen-plus",
2476
  "type": "chat",
2477
  "input_price_per_1m": 0.4,
2478
- "output_price_per_1m": 1.2,
2479
  "currency": "USD",
2480
  "context_window": 131072,
2481
  "capabilities": [
@@ -2484,7 +2406,25 @@
2484
  "hf_private": true
2485
  },
2486
  {
2487
- "name": "azure/gpt-4.1-mini",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2488
  "type": "vision",
2489
  "input_price_per_1m": 0.4,
2490
  "output_price_per_1m": 1.6,
@@ -2496,7 +2436,7 @@
2496
  "hf_private": true
2497
  },
2498
  {
2499
- "name": "azure/openai-responses/gpt-4.1-mini",
2500
  "type": "vision",
2501
  "input_price_per_1m": 0.4,
2502
  "output_price_per_1m": 1.6,
@@ -2508,79 +2448,63 @@
2508
  "hf_private": true
2509
  },
2510
  {
2511
- "name": "nebius/deepseek-ai/DeepSeek-V3-0324",
2512
  "type": "chat",
2513
- "input_price_per_1m": 0.5,
2514
- "output_price_per_1m": 1.5,
2515
  "currency": "USD",
2516
- "context_window": 128000,
 
2517
  "capabilities": [
2518
- "tools",
2519
- "reasoning"
2520
  ],
2521
- "size_b": 685,
2522
- "hf_id": "deepseek-ai/DeepSeek-V3-0324",
2523
  "hf_private": false,
2524
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2525
  "hf_status": 200
2526
  },
2527
  {
2528
- "name": "nebius/moonshotai/kimi-k2.5",
2529
- "type": "vision",
2530
- "input_price_per_1m": 0.5,
2531
- "output_price_per_1m": 2.5,
2532
  "currency": "USD",
2533
  "capabilities": [
2534
- "vision",
2535
  "reasoning"
2536
  ],
2537
- "context_window": 256000,
2538
- "hf_id": "moonshotai/Kimi-K2.5",
2539
- "size_b": 1058.6,
2540
  "hf_private": false,
2541
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2542
  "hf_status": 200
2543
  },
2544
  {
2545
- "name": "nebius/moonshotai/Kimi-K2-Instruct",
2546
  "type": "chat",
2547
- "input_price_per_1m": 0.5,
2548
- "output_price_per_1m": 2.4,
2549
  "currency": "USD",
2550
- "context_window": 131000,
 
2551
  "capabilities": [
2552
  "tools"
2553
  ],
2554
- "hf_id": "moonshotai/Kimi-K2-Instruct",
2555
- "size_b": 1026.5,
2556
  "hf_private": false,
2557
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2558
  "hf_status": 200
2559
  },
2560
  {
2561
- "name": "google/gemini-3-flash-preview",
2562
- "type": "vision",
2563
- "input_price_per_1m": 0.5,
2564
- "output_price_per_1m": 3,
2565
- "currency": "USD",
2566
- "capabilities": [
2567
- "vision",
2568
- "reasoning"
2569
- ],
2570
- "context_window": 1048576,
2571
- "hf_private": true
2572
- },
2573
- {
2574
- "name": "google/gemini-3.1-flash-image-preview",
2575
- "type": "vision",
2576
- "input_price_per_1m": 0.5,
2577
- "output_price_per_1m": 2,
2578
  "currency": "USD",
 
2579
  "capabilities": [
2580
- "vision",
2581
- "reasoning"
2582
  ],
2583
- "context_window": 131072,
2584
  "hf_private": true
2585
  },
2586
  {
@@ -2622,57 +2546,55 @@
2622
  "hf_private": true
2623
  },
2624
  {
2625
- "name": "novita/meta-llama/llama-3-70b-instruct",
2626
- "type": "chat",
2627
- "input_price_per_1m": 0.51,
2628
- "output_price_per_1m": 0.74,
2629
  "currency": "USD",
2630
- "context_window": 8192,
2631
- "size_b": 70,
2632
  "capabilities": [
2633
- "tools"
 
2634
  ],
2635
- "hf_private": false,
2636
- "hf_id": "meta-llama/Meta-Llama-3-70B-Instruct",
2637
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2638
- "hf_status": 200
2639
  },
2640
  {
2641
- "name": "openai/o4-mini",
2642
- "type": "chat",
2643
- "input_price_per_1m": 0.55,
2644
- "output_price_per_1m": 2.2,
2645
  "currency": "USD",
2646
  "capabilities": [
 
2647
  "reasoning"
2648
  ],
2649
- "context_window": 200000,
2650
  "hf_private": true
2651
  },
2652
  {
2653
- "name": "vertex/deepseek-v3.2",
2654
- "type": "vision",
2655
- "input_price_per_1m": 0.56,
2656
- "output_price_per_1m": 1.68,
2657
  "currency": "USD",
 
2658
  "capabilities": [
2659
- "vision",
2660
  "reasoning"
2661
  ],
2662
- "context_window": 163840,
2663
- "hf_id": "deepseek-ai/DeepSeek-V3.2",
2664
- "size_b": 685.4,
2665
  "hf_private": false,
2666
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2667
  "hf_status": 200
2668
  },
2669
  {
2670
- "name": "novita/moonshotai/kimi-k2-instruct",
2671
  "type": "chat",
2672
- "input_price_per_1m": 0.57,
2673
- "output_price_per_1m": 2.3,
2674
  "currency": "USD",
2675
- "context_window": 131072,
2676
  "capabilities": [
2677
  "tools"
2678
  ],
@@ -2683,83 +2605,79 @@
2683
  "hf_status": 200
2684
  },
2685
  {
2686
- "name": "nebius/zai-org/GLM-4.5",
2687
- "type": "chat",
2688
- "input_price_per_1m": 0.6,
2689
- "output_price_per_1m": 2.2,
2690
  "currency": "USD",
2691
- "context_window": 128000,
2692
  "capabilities": [
2693
- "tools",
2694
  "reasoning"
2695
  ],
2696
- "hf_id": "zai-org/GLM-4.5",
2697
- "size_b": 358.3,
 
2698
  "hf_private": false,
2699
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2700
  "hf_status": 200
2701
  },
2702
  {
2703
- "name": "deepinfra/zai-org/GLM-4.5",
2704
  "type": "chat",
2705
- "input_price_per_1m": 0.6,
2706
- "output_price_per_1m": 2.2,
2707
  "currency": "USD",
2708
- "context_window": 131072,
 
2709
  "capabilities": [
2710
- "tools",
2711
- "reasoning"
2712
  ],
2713
- "hf_id": "zai-org/GLM-4.5",
2714
- "size_b": 358.3,
2715
  "hf_private": false,
 
2716
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2717
  "hf_status": 200
2718
  },
2719
  {
2720
- "name": "zai/GLM-4.5",
2721
  "type": "chat",
2722
- "input_price_per_1m": 0.6,
2723
  "output_price_per_1m": 2.2,
2724
  "currency": "USD",
2725
  "capabilities": [
2726
  "reasoning"
2727
  ],
2728
- "context_window": 131072,
2729
- "hf_id": "zai-org/GLM-4.5",
2730
- "size_b": 358.3,
2731
- "hf_private": false,
2732
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2733
- "hf_status": 200
2734
  },
2735
  {
2736
- "name": "zai/GLM-4.6",
2737
- "type": "chat",
2738
- "input_price_per_1m": 0.6,
2739
- "output_price_per_1m": 2.2,
2740
  "currency": "USD",
2741
  "capabilities": [
 
2742
  "reasoning"
2743
  ],
2744
- "context_window": 200000,
2745
- "hf_id": "zai-org/GLM-4.6",
2746
- "size_b": 356.8,
2747
  "hf_private": false,
2748
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2749
  "hf_status": 200
2750
  },
2751
  {
2752
- "name": "zai/GLM-4.7",
2753
  "type": "chat",
2754
- "input_price_per_1m": 0.6,
2755
- "output_price_per_1m": 2.2,
2756
  "currency": "USD",
 
2757
  "capabilities": [
2758
- "reasoning"
2759
  ],
2760
- "context_window": 200000,
2761
- "hf_id": "zai-org/GLM-4.7",
2762
- "size_b": 358.3,
2763
  "hf_private": false,
2764
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2765
  "hf_status": 200
@@ -2798,23 +2716,6 @@
2798
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2799
  "hf_status": 200
2800
  },
2801
- {
2802
- "name": "alibaba/qwen3.5",
2803
- "type": "vision",
2804
- "input_price_per_1m": 0.6,
2805
- "output_price_per_1m": 3.6,
2806
- "currency": "USD",
2807
- "capabilities": [
2808
- "vision",
2809
- "reasoning"
2810
- ],
2811
- "context_window": 256000,
2812
- "size_b": 9,
2813
- "hf_id": "Qwen/Qwen3.5-9B",
2814
- "hf_private": false,
2815
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2816
- "hf_status": 200
2817
- },
2818
  {
2819
  "name": "minimaxi/MiniMax-M2.7-highspeed",
2820
  "type": "vision",
@@ -2847,6 +2748,22 @@
2847
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2848
  "hf_status": 200
2849
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2850
  {
2851
  "name": "moonshot/kimi-k2.5",
2852
  "type": "vision",
@@ -2914,17 +2831,100 @@
2914
  "hf_status": 200
2915
  },
2916
  {
2917
- "name": "moonshot/kimi-k2-0711-preview",
2918
  "type": "chat",
2919
  "input_price_per_1m": 0.6,
2920
- "output_price_per_1m": 2.5,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2921
  "currency": "USD",
 
 
 
2922
  "context_window": 131072,
 
 
 
 
 
 
 
 
 
 
 
 
2923
  "capabilities": [
2924
- "tools"
2925
  ],
2926
- "hf_id": "moonshotai/Kimi-K2-Instruct",
2927
- "size_b": 1026.5,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2928
  "hf_private": false,
2929
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2930
  "hf_status": 200
@@ -2956,17 +2956,22 @@
2956
  "hf_private": true
2957
  },
2958
  {
2959
- "name": "parasail/parasail-qwen25-vl-72b-instruct",
2960
- "type": "vision",
2961
  "input_price_per_1m": 0.7,
2962
- "output_price_per_1m": 0.7,
2963
  "currency": "USD",
 
2964
  "capabilities": [
2965
- "vision"
 
2966
  ],
2967
- "context_window": 32768,
2968
- "size_b": 72,
2969
- "hf_private": false
 
 
 
2970
  },
2971
  {
2972
  "name": "novita/deepseek/deepseek-prover-v2-671b",
@@ -2979,22 +2984,17 @@
2979
  "hf_private": false
2980
  },
2981
  {
2982
- "name": "novita/deepseek/deepseek-r1-turbo",
2983
- "type": "chat",
2984
  "input_price_per_1m": 0.7,
2985
- "output_price_per_1m": 2.5,
2986
  "currency": "USD",
2987
- "context_window": 64000,
2988
  "capabilities": [
2989
- "tools",
2990
- "reasoning"
2991
  ],
2992
- "hf_id": "deepseek-ai/DeepSeek-R1",
2993
- "size_b": 671,
2994
- "size_source": "manual",
2995
- "hf_private": false,
2996
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
2997
- "hf_status": 200
2998
  },
2999
  {
3000
  "name": "openai-responses/gpt-5.4-mini",
@@ -3023,63 +3023,63 @@
3023
  "hf_private": true
3024
  },
3025
  {
3026
- "name": "nebius/deepseek-ai/DeepSeek-R1-0528",
3027
  "type": "chat",
3028
  "input_price_per_1m": 0.8,
3029
- "output_price_per_1m": 2.4,
3030
  "currency": "USD",
3031
- "context_window": 164000,
 
3032
  "capabilities": [
3033
- "tools",
3034
  "reasoning"
3035
  ],
3036
- "hf_id": "deepseek-ai/DeepSeek-R1-0528",
3037
- "size_b": 684.5,
3038
  "hf_private": false,
3039
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3040
  "hf_status": 200
3041
  },
3042
  {
3043
- "name": "deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct",
3044
  "type": "chat",
3045
  "input_price_per_1m": 0.8,
3046
  "output_price_per_1m": 0.8,
3047
  "currency": "USD",
3048
- "context_window": 130815,
3049
- "size_b": 405,
 
 
 
 
3050
  "hf_private": false,
3051
- "hf_id": "meta-llama/Llama-3.1-405B-Instruct",
3052
- "hf_validated_at": "2026-03-22T19:58:46.149Z",
3053
  "hf_status": 200
3054
  },
3055
  {
3056
- "name": "novita/deepseek/deepseek-r1-distill-llama-70b",
3057
  "type": "chat",
3058
  "input_price_per_1m": 0.8,
3059
  "output_price_per_1m": 0.8,
3060
  "currency": "USD",
3061
- "context_window": 32000,
3062
- "size_b": 70,
3063
- "capabilities": [
3064
- "reasoning"
3065
- ],
3066
- "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
3067
  "hf_private": false,
3068
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
 
3069
  "hf_status": 200
3070
  },
3071
  {
3072
- "name": "novita/qwen/qwen2.5-vl-72b-instruct",
3073
  "type": "chat",
3074
  "input_price_per_1m": 0.8,
3075
- "output_price_per_1m": 0.8,
3076
  "currency": "USD",
3077
- "context_window": 96000,
3078
- "size_b": 72,
3079
  "capabilities": [
3080
- "vision"
 
3081
  ],
3082
- "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
 
3083
  "hf_private": false,
3084
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3085
  "hf_status": 200
@@ -3189,33 +3189,17 @@
3189
  "hf_status": 200
3190
  },
3191
  {
3192
- "name": "groq/moonshotai/kimi-k2-instruct",
3193
- "type": "chat",
3194
- "input_price_per_1m": 1,
3195
- "output_price_per_1m": 3,
3196
- "currency": "USD",
3197
- "context_window": 131072,
3198
- "capabilities": [
3199
- "tools"
3200
- ],
3201
- "hf_id": "moonshotai/Kimi-K2-Instruct",
3202
- "size_b": 1026.5,
3203
- "hf_private": false,
3204
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
3205
- "hf_status": 200
3206
- },
3207
- {
3208
- "name": "groq/moonshotai/Kimi-K2-Instruct-0905",
3209
  "type": "chat",
3210
  "input_price_per_1m": 1,
3211
- "output_price_per_1m": 3,
3212
  "currency": "USD",
3213
- "context_window": 256000,
3214
  "capabilities": [
3215
- "tools"
3216
  ],
3217
- "hf_id": "moonshotai/Kimi-K2-Instruct",
3218
- "size_b": 1026.5,
 
3219
  "hf_private": false,
3220
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3221
  "hf_status": 200
@@ -3238,19 +3222,32 @@
3238
  "hf_status": 200
3239
  },
3240
  {
3241
- "name": "perplexity/sonar",
3242
- "type": "chat",
3243
  "input_price_per_1m": 1,
3244
- "output_price_per_1m": 1,
3245
  "currency": "USD",
3246
- "context_window": 131072,
3247
  "capabilities": [
3248
  "vision"
3249
  ],
 
3250
  "hf_private": true
3251
  },
3252
  {
3253
- "name": "anthropic/claude-haiku-4-5",
 
 
 
 
 
 
 
 
 
 
 
 
 
3254
  "type": "vision",
3255
  "input_price_per_1m": 1,
3256
  "output_price_per_1m": 5,
@@ -3262,45 +3259,48 @@
3262
  "hf_private": true
3263
  },
3264
  {
3265
- "name": "openai/o3",
3266
  "type": "vision",
3267
  "input_price_per_1m": 1,
3268
- "output_price_per_1m": 4,
3269
  "currency": "USD",
3270
  "capabilities": [
3271
- "vision",
3272
- "reasoning"
3273
  ],
3274
  "context_window": 200000,
3275
  "hf_private": true
3276
  },
3277
  {
3278
- "name": "novita/GLM-5",
3279
  "type": "chat",
3280
  "input_price_per_1m": 1,
3281
- "output_price_per_1m": 3.2,
3282
  "currency": "USD",
 
3283
  "capabilities": [
3284
- "reasoning"
3285
  ],
3286
- "context_window": 202800,
3287
- "hf_id": "zai-org/GLM-5",
3288
- "size_b": 753.9,
3289
  "hf_private": false,
3290
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3291
  "hf_status": 200
3292
  },
3293
  {
3294
- "name": "bedrock/claude-haiku-4-5",
3295
- "type": "vision",
3296
  "input_price_per_1m": 1,
3297
- "output_price_per_1m": 5,
3298
  "currency": "USD",
 
3299
  "capabilities": [
3300
- "vision"
3301
  ],
3302
- "context_window": 200000,
3303
- "hf_private": true
 
 
 
3304
  },
3305
  {
3306
  "name": "alibaba/qwen3-coder-plus",
@@ -3315,19 +3315,19 @@
3315
  "hf_private": true
3316
  },
3317
  {
3318
- "name": "vertex/claude-haiku-4-5",
3319
- "type": "vision",
3320
  "input_price_per_1m": 1,
3321
- "output_price_per_1m": 5,
3322
  "currency": "USD",
 
3323
  "capabilities": [
3324
  "vision"
3325
  ],
3326
- "context_window": 200000,
3327
  "hf_private": true
3328
  },
3329
  {
3330
- "name": "openai-responses/o3-mini",
3331
  "type": "chat",
3332
  "input_price_per_1m": 1.1,
3333
  "output_price_per_1m": 4.4,
@@ -3339,7 +3339,7 @@
3339
  "hf_private": true
3340
  },
3341
  {
3342
- "name": "openai-responses/o4-mini",
3343
  "type": "chat",
3344
  "input_price_per_1m": 1.1,
3345
  "output_price_per_1m": 4.4,
@@ -3351,7 +3351,7 @@
3351
  "hf_private": true
3352
  },
3353
  {
3354
- "name": "openai/o3-mini",
3355
  "type": "chat",
3356
  "input_price_per_1m": 1.1,
3357
  "output_price_per_1m": 4.4,
@@ -3363,7 +3363,7 @@
3363
  "hf_private": true
3364
  },
3365
  {
3366
- "name": "azure/o4-mini",
3367
  "type": "chat",
3368
  "input_price_per_1m": 1.1,
3369
  "output_price_per_1m": 4.4,
@@ -3374,16 +3374,6 @@
3374
  "context_window": 200000,
3375
  "hf_private": true
3376
  },
3377
- {
3378
- "name": "together/Qwen/Qwen2.5-72B-Instruct-Turbo",
3379
- "type": "chat",
3380
- "input_price_per_1m": 1.2,
3381
- "output_price_per_1m": 1.2,
3382
- "currency": "USD",
3383
- "context_window": 32768,
3384
- "size_b": 72,
3385
- "hf_private": false
3386
- },
3387
  {
3388
  "name": "moonshot/kimi-k2-turbo-preview",
3389
  "type": "chat",
@@ -3401,33 +3391,41 @@
3401
  "hf_status": 200
3402
  },
3403
  {
3404
- "name": "google/gemini-2.5-pro",
3405
- "type": "vision",
 
 
 
 
 
 
 
 
 
 
3406
  "input_price_per_1m": 1.25,
3407
  "output_price_per_1m": 10,
3408
  "currency": "USD",
3409
  "capabilities": [
3410
- "vision",
3411
  "reasoning"
3412
  ],
3413
- "context_window": 1048576,
3414
  "hf_private": true
3415
  },
3416
  {
3417
- "name": "openai-responses/gpt-5.1-codex",
3418
- "type": "vision",
3419
  "input_price_per_1m": 1.25,
3420
  "output_price_per_1m": 10,
3421
  "currency": "USD",
3422
  "capabilities": [
3423
- "vision",
3424
  "reasoning"
3425
  ],
3426
- "context_window": 400000,
3427
  "hf_private": true
3428
  },
3429
  {
3430
- "name": "openai-responses/gpt-5.1",
3431
  "type": "vision",
3432
  "input_price_per_1m": 1.25,
3433
  "output_price_per_1m": 10,
@@ -3440,7 +3438,7 @@
3440
  "hf_private": true
3441
  },
3442
  {
3443
- "name": "openai-responses/gpt-5-codex",
3444
  "type": "vision",
3445
  "input_price_per_1m": 1.25,
3446
  "output_price_per_1m": 10,
@@ -3453,7 +3451,7 @@
3453
  "hf_private": true
3454
  },
3455
  {
3456
- "name": "openai-responses/gpt-5",
3457
  "type": "vision",
3458
  "input_price_per_1m": 1.25,
3459
  "output_price_per_1m": 10,
@@ -3466,7 +3464,7 @@
3466
  "hf_private": true
3467
  },
3468
  {
3469
- "name": "openai/gpt-5-chat",
3470
  "type": "vision",
3471
  "input_price_per_1m": 1.25,
3472
  "output_price_per_1m": 10,
@@ -3475,11 +3473,11 @@
3475
  "vision",
3476
  "reasoning"
3477
  ],
3478
- "context_window": 128000,
3479
  "hf_private": true
3480
  },
3481
  {
3482
- "name": "openai/gpt-5.1",
3483
  "type": "vision",
3484
  "input_price_per_1m": 1.25,
3485
  "output_price_per_1m": 10,
@@ -3488,7 +3486,7 @@
3488
  "vision",
3489
  "reasoning"
3490
  ],
3491
- "context_window": 400000,
3492
  "hf_private": true
3493
  },
3494
  {
@@ -3505,7 +3503,7 @@
3505
  "hf_private": true
3506
  },
3507
  {
3508
- "name": "coding/gemini-2.5-pro",
3509
  "type": "vision",
3510
  "input_price_per_1m": 1.25,
3511
  "output_price_per_1m": 10,
@@ -3514,28 +3512,24 @@
3514
  "vision",
3515
  "reasoning"
3516
  ],
3517
- "context_window": 1048576,
3518
  "hf_private": true
3519
  },
3520
  {
3521
- "name": "together/deepseek-ai/DeepSeek-V3",
3522
- "type": "chat",
3523
  "input_price_per_1m": 1.25,
3524
- "output_price_per_1m": 1.25,
3525
  "currency": "USD",
3526
- "context_window": 131072,
3527
  "capabilities": [
3528
- "tools",
3529
  "reasoning"
3530
  ],
3531
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3532
- "size_b": 671,
3533
- "hf_private": false,
3534
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
3535
- "hf_status": 200
3536
  },
3537
  {
3538
- "name": "vertex/gemini-2.5-pro",
3539
  "type": "vision",
3540
  "input_price_per_1m": 1.25,
3541
  "output_price_per_1m": 10,
@@ -3548,31 +3542,37 @@
3548
  "hf_private": true
3549
  },
3550
  {
3551
- "name": "azure/gpt-5",
3552
- "type": "chat",
3553
  "input_price_per_1m": 1.25,
3554
  "output_price_per_1m": 10,
3555
  "currency": "USD",
3556
  "capabilities": [
 
3557
  "reasoning"
3558
  ],
3559
- "context_window": 200000,
3560
  "hf_private": true
3561
  },
3562
  {
3563
- "name": "azure/gpt-5.1",
3564
  "type": "chat",
3565
  "input_price_per_1m": 1.25,
3566
- "output_price_per_1m": 10,
3567
  "currency": "USD",
 
3568
  "capabilities": [
 
3569
  "reasoning"
3570
  ],
3571
- "context_window": 200000,
3572
- "hf_private": true
 
 
 
3573
  },
3574
  {
3575
- "name": "novita/sao10k/l3-70b-euryale-v2.1",
3576
  "type": "chat",
3577
  "input_price_per_1m": 1.48,
3578
  "output_price_per_1m": 1.48,
@@ -3582,7 +3582,7 @@
3582
  "hf_private": false
3583
  },
3584
  {
3585
- "name": "novita/sao10k/l31-70b-euryale-v2.2",
3586
  "type": "chat",
3587
  "input_price_per_1m": 1.48,
3588
  "output_price_per_1m": 1.48,
@@ -3604,20 +3604,19 @@
3604
  "hf_private": true
3605
  },
3606
  {
3607
- "name": "openai-responses/gpt-5.2",
3608
- "type": "vision",
3609
  "input_price_per_1m": 1.75,
3610
  "output_price_per_1m": 14,
3611
  "currency": "USD",
3612
  "capabilities": [
3613
- "vision",
3614
  "reasoning"
3615
  ],
3616
- "context_window": 400000,
3617
  "hf_private": true
3618
  },
3619
  {
3620
- "name": "openai-responses/gpt-5.2-codex",
3621
  "type": "vision",
3622
  "input_price_per_1m": 1.75,
3623
  "output_price_per_1m": 14,
@@ -3630,7 +3629,7 @@
3630
  "hf_private": true
3631
  },
3632
  {
3633
- "name": "openai-responses/gpt-5.3-chat",
3634
  "type": "vision",
3635
  "input_price_per_1m": 1.75,
3636
  "output_price_per_1m": 14,
@@ -3639,11 +3638,11 @@
3639
  "vision",
3640
  "reasoning"
3641
  ],
3642
- "context_window": 128000,
3643
  "hf_private": true
3644
  },
3645
  {
3646
- "name": "openai-responses/gpt-5.3-codex",
3647
  "type": "vision",
3648
  "input_price_per_1m": 1.75,
3649
  "output_price_per_1m": 14,
@@ -3652,11 +3651,11 @@
3652
  "vision",
3653
  "reasoning"
3654
  ],
3655
- "context_window": 400000,
3656
  "hf_private": true
3657
  },
3658
  {
3659
- "name": "openai/gpt-5.3-chat",
3660
  "type": "vision",
3661
  "input_price_per_1m": 1.75,
3662
  "output_price_per_1m": 14,
@@ -3665,11 +3664,11 @@
3665
  "vision",
3666
  "reasoning"
3667
  ],
3668
- "context_window": 128000,
3669
  "hf_private": true
3670
  },
3671
  {
3672
- "name": "openai/gpt-5.2",
3673
  "type": "vision",
3674
  "input_price_per_1m": 1.75,
3675
  "output_price_per_1m": 14,
@@ -3682,7 +3681,7 @@
3682
  "hf_private": true
3683
  },
3684
  {
3685
- "name": "openai/gpt-5.2-chat",
3686
  "type": "vision",
3687
  "input_price_per_1m": 1.75,
3688
  "output_price_per_1m": 14,
@@ -3691,11 +3690,11 @@
3691
  "vision",
3692
  "reasoning"
3693
  ],
3694
- "context_window": 128000,
3695
  "hf_private": true
3696
  },
3697
  {
3698
- "name": "azure/openai-responses/gpt-5.2-codex",
3699
  "type": "vision",
3700
  "input_price_per_1m": 1.75,
3701
  "output_price_per_1m": 14,
@@ -3704,23 +3703,24 @@
3704
  "vision",
3705
  "reasoning"
3706
  ],
3707
- "context_window": 400000,
3708
  "hf_private": true
3709
  },
3710
  {
3711
- "name": "azure/gpt-5.2",
3712
- "type": "chat",
3713
  "input_price_per_1m": 1.75,
3714
  "output_price_per_1m": 14,
3715
  "currency": "USD",
3716
  "capabilities": [
 
3717
  "reasoning"
3718
  ],
3719
- "context_window": 200000,
3720
  "hf_private": true
3721
  },
3722
  {
3723
- "name": "azure/gpt-5.3-codex",
3724
  "type": "vision",
3725
  "input_price_per_1m": 1.75,
3726
  "output_price_per_1m": 14,
@@ -3729,68 +3729,56 @@
3729
  "vision",
3730
  "reasoning"
3731
  ],
3732
- "context_window": 400000,
3733
- "hf_private": true
3734
- },
3735
- {
3736
- "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3737
- "type": "chat",
3738
- "input_price_per_1m": 2,
3739
- "output_price_per_1m": 6,
3740
- "currency": "USD",
3741
  "context_window": 128000,
3742
  "hf_private": true
3743
  },
3744
  {
3745
- "name": "perplexity/sonar-reasoning-pro",
3746
- "type": "chat",
3747
  "input_price_per_1m": 2,
3748
  "output_price_per_1m": 8,
3749
  "currency": "USD",
3750
- "context_window": 131072,
3751
  "capabilities": [
3752
- "vision",
3753
- "reasoning"
3754
  ],
 
3755
  "hf_private": true
3756
  },
3757
  {
3758
- "name": "xai/grok-4.2-beta",
3759
  "type": "vision",
3760
  "input_price_per_1m": 2,
3761
- "output_price_per_1m": 6,
3762
  "currency": "USD",
3763
  "capabilities": [
3764
- "vision",
3765
- "reasoning"
3766
  ],
3767
- "context_window": 2000000,
3768
  "hf_private": true
3769
  },
3770
  {
3771
- "name": "xai/grok-2-1212",
3772
  "type": "chat",
3773
  "input_price_per_1m": 2,
3774
- "output_price_per_1m": 10,
3775
  "currency": "USD",
3776
  "context_window": 131072,
3777
  "hf_private": true
3778
  },
3779
  {
3780
- "name": "google/gemini-3-pro-preview",
3781
  "type": "vision",
3782
  "input_price_per_1m": 2,
3783
- "output_price_per_1m": 12,
3784
  "currency": "USD",
3785
  "capabilities": [
3786
- "vision",
3787
- "reasoning"
3788
  ],
3789
- "context_window": 1048576,
3790
  "hf_private": true
3791
  },
3792
  {
3793
- "name": "google/gemini-3.1-pro-preview",
3794
  "type": "vision",
3795
  "input_price_per_1m": 2,
3796
  "output_price_per_1m": 12,
@@ -3803,24 +3791,29 @@
3803
  "hf_private": true
3804
  },
3805
  {
3806
- "name": "mistral/pixtral-large-latest",
3807
- "type": "chat",
3808
  "input_price_per_1m": 2,
3809
- "output_price_per_1m": 5,
3810
  "currency": "USD",
3811
- "context_window": 131072,
 
 
 
 
3812
  "hf_private": true
3813
  },
3814
  {
3815
- "name": "openai-responses/gpt-4.1",
3816
  "type": "vision",
3817
  "input_price_per_1m": 2,
3818
- "output_price_per_1m": 8,
3819
  "currency": "USD",
3820
  "capabilities": [
3821
- "vision"
 
3822
  ],
3823
- "context_window": 1047576,
3824
  "hf_private": true
3825
  },
3826
  {
@@ -3849,20 +3842,29 @@
3849
  "hf_private": true
3850
  },
3851
  {
3852
- "name": "vertex/gemini-3-pro-image-preview",
3853
  "type": "vision",
3854
  "input_price_per_1m": 2,
3855
- "output_price_per_1m": 12,
3856
  "currency": "USD",
3857
  "capabilities": [
3858
  "vision",
3859
  "reasoning"
3860
  ],
3861
- "context_window": 1048576,
3862
  "hf_private": true
3863
  },
3864
  {
3865
- "name": "vertex/gemini-3-pro-preview",
 
 
 
 
 
 
 
 
 
3866
  "type": "vision",
3867
  "input_price_per_1m": 2,
3868
  "output_price_per_1m": 12,
@@ -3875,7 +3877,7 @@
3875
  "hf_private": true
3876
  },
3877
  {
3878
- "name": "vertex/gemini-3.1-pro-preview",
3879
  "type": "vision",
3880
  "input_price_per_1m": 2,
3881
  "output_price_per_1m": 12,
@@ -3888,31 +3890,29 @@
3888
  "hf_private": true
3889
  },
3890
  {
3891
- "name": "azure/openai-responses/gpt-4.1",
3892
- "type": "vision",
3893
  "input_price_per_1m": 2,
3894
- "output_price_per_1m": 8,
3895
  "currency": "USD",
3896
- "capabilities": [
3897
- "vision"
3898
- ],
3899
- "context_window": 1047576,
3900
  "hf_private": true
3901
  },
3902
  {
3903
- "name": "azure/gpt-4.1",
3904
- "type": "vision",
3905
  "input_price_per_1m": 2,
3906
  "output_price_per_1m": 8,
3907
  "currency": "USD",
 
3908
  "capabilities": [
3909
- "vision"
 
3910
  ],
3911
- "context_window": 1047576,
3912
  "hf_private": true
3913
  },
3914
  {
3915
- "name": "openai-responses/gpt-5.4",
3916
  "type": "vision",
3917
  "input_price_per_1m": 2.5,
3918
  "output_price_per_1m": 15,
@@ -3925,7 +3925,7 @@
3925
  "hf_private": true
3926
  },
3927
  {
3928
- "name": "openai/gpt-5.4",
3929
  "type": "vision",
3930
  "input_price_per_1m": 2.5,
3931
  "output_price_per_1m": 15,
@@ -3950,19 +3950,7 @@
3950
  "hf_private": true
3951
  },
3952
  {
3953
- "name": "openai/gpt-4o-2024-05-13",
3954
- "type": "vision",
3955
- "input_price_per_1m": 2.5,
3956
- "output_price_per_1m": 10,
3957
- "currency": "USD",
3958
- "capabilities": [
3959
- "vision"
3960
- ],
3961
- "context_window": 128000,
3962
- "hf_private": true
3963
- },
3964
- {
3965
- "name": "openai/gpt-4o",
3966
  "type": "vision",
3967
  "input_price_per_1m": 2.5,
3968
  "output_price_per_1m": 10,
@@ -3974,7 +3962,7 @@
3974
  "hf_private": true
3975
  },
3976
  {
3977
- "name": "openai/gpt-4o-2024-11-20",
3978
  "type": "vision",
3979
  "input_price_per_1m": 2.5,
3980
  "output_price_per_1m": 10,
@@ -3986,7 +3974,7 @@
3986
  "hf_private": true
3987
  },
3988
  {
3989
- "name": "azure/openai-responses/gpt-5.4",
3990
  "type": "vision",
3991
  "input_price_per_1m": 2.5,
3992
  "output_price_per_1m": 15,
@@ -3999,19 +3987,19 @@
3999
  "hf_private": true
4000
  },
4001
  {
4002
- "name": "perplexity/sonar-pro",
4003
- "type": "chat",
4004
- "input_price_per_1m": 3,
4005
- "output_price_per_1m": 15,
4006
  "currency": "USD",
4007
- "context_window": 204800,
4008
  "capabilities": [
4009
  "vision"
4010
  ],
 
4011
  "hf_private": true
4012
  },
4013
  {
4014
- "name": "xai/grok-4",
4015
  "type": "vision",
4016
  "input_price_per_1m": 3,
4017
  "output_price_per_1m": 15,
@@ -4019,11 +4007,11 @@
4019
  "capabilities": [
4020
  "vision"
4021
  ],
4022
- "context_window": 256000,
4023
  "hf_private": true
4024
  },
4025
  {
4026
- "name": "anthropic/claude-sonnet-4",
4027
  "type": "vision",
4028
  "input_price_per_1m": 3,
4029
  "output_price_per_1m": 15,
@@ -4032,11 +4020,11 @@
4032
  "vision",
4033
  "reasoning"
4034
  ],
4035
- "context_window": 1000000,
4036
  "hf_private": true
4037
  },
4038
  {
4039
- "name": "anthropic/claude-sonnet-4-6",
4040
  "type": "vision",
4041
  "input_price_per_1m": 3,
4042
  "output_price_per_1m": 15,
@@ -4045,11 +4033,11 @@
4045
  "vision",
4046
  "reasoning"
4047
  ],
4048
- "context_window": 1000000,
4049
  "hf_private": true
4050
  },
4051
  {
4052
- "name": "anthropic/claude-sonnet-4-5",
4053
  "type": "vision",
4054
  "input_price_per_1m": 3,
4055
  "output_price_per_1m": 15,
@@ -4058,24 +4046,23 @@
4058
  "vision",
4059
  "reasoning"
4060
  ],
4061
- "context_window": 1000000,
4062
  "hf_private": true
4063
  },
4064
  {
4065
- "name": "bedrock/claude-sonnet-4",
4066
  "type": "vision",
4067
  "input_price_per_1m": 3,
4068
  "output_price_per_1m": 15,
4069
  "currency": "USD",
4070
  "capabilities": [
4071
- "vision",
4072
- "reasoning"
4073
  ],
4074
- "context_window": 200000,
4075
  "hf_private": true
4076
  },
4077
  {
4078
- "name": "bedrock/claude-3-7-sonnet",
4079
  "type": "vision",
4080
  "input_price_per_1m": 3,
4081
  "output_price_per_1m": 15,
@@ -4088,7 +4075,7 @@
4088
  "hf_private": true
4089
  },
4090
  {
4091
- "name": "bedrock/claude-sonnet-4-6",
4092
  "type": "vision",
4093
  "input_price_per_1m": 3,
4094
  "output_price_per_1m": 15,
@@ -4097,7 +4084,7 @@
4097
  "vision",
4098
  "reasoning"
4099
  ],
4100
- "context_window": 1000000,
4101
  "hf_private": true
4102
  },
4103
  {
@@ -4114,7 +4101,7 @@
4114
  "hf_private": true
4115
  },
4116
  {
4117
- "name": "coding/claude-sonnet-4-20250514",
4118
  "type": "vision",
4119
  "input_price_per_1m": 3,
4120
  "output_price_per_1m": 15,
@@ -4123,41 +4110,24 @@
4123
  "vision",
4124
  "reasoning"
4125
  ],
4126
- "context_window": 200000,
4127
  "hf_private": true
4128
  },
4129
  {
4130
- "name": "together/deepseek-ai/DeepSeek-R1",
4131
- "type": "chat",
4132
- "input_price_per_1m": 3,
4133
- "output_price_per_1m": 7,
4134
- "currency": "USD",
4135
- "context_window": 64000,
4136
- "capabilities": [
4137
- "tools",
4138
- "reasoning"
4139
- ],
4140
- "hf_id": "deepseek-ai/DeepSeek-R1",
4141
- "size_b": 671,
4142
- "size_source": "manual",
4143
- "hf_private": false,
4144
- "hf_validated_at": "2026-03-22T19:23:09.981Z",
4145
- "hf_status": 200
4146
- },
4147
- {
4148
- "name": "vertex/claude-3-5-sonnet",
4149
  "type": "vision",
4150
  "input_price_per_1m": 3,
4151
  "output_price_per_1m": 15,
4152
  "currency": "USD",
4153
  "capabilities": [
4154
- "vision"
 
4155
  ],
4156
  "context_window": 200000,
4157
  "hf_private": true
4158
  },
4159
  {
4160
- "name": "vertex/claude-sonnet-4-5",
4161
  "type": "vision",
4162
  "input_price_per_1m": 3,
4163
  "output_price_per_1m": 15,
@@ -4166,11 +4136,11 @@
4166
  "vision",
4167
  "reasoning"
4168
  ],
4169
- "context_window": 200000,
4170
  "hf_private": true
4171
  },
4172
  {
4173
- "name": "vertex/claude-sonnet-4",
4174
  "type": "vision",
4175
  "input_price_per_1m": 3,
4176
  "output_price_per_1m": 15,
@@ -4179,11 +4149,11 @@
4179
  "vision",
4180
  "reasoning"
4181
  ],
4182
- "context_window": 200000,
4183
  "hf_private": true
4184
  },
4185
  {
4186
- "name": "vertex/claude-3-7-sonnet",
4187
  "type": "vision",
4188
  "input_price_per_1m": 3,
4189
  "output_price_per_1m": 15,
@@ -4192,14 +4162,14 @@
4192
  "vision",
4193
  "reasoning"
4194
  ],
4195
- "context_window": 200000,
4196
  "hf_private": true
4197
  },
4198
  {
4199
- "name": "novita/deepseek/deepseek-r1",
4200
  "type": "chat",
4201
- "input_price_per_1m": 4,
4202
- "output_price_per_1m": 4,
4203
  "currency": "USD",
4204
  "context_window": 64000,
4205
  "capabilities": [
@@ -4214,19 +4184,37 @@
4214
  "hf_status": 200
4215
  },
4216
  {
4217
- "name": "xai/grok-3",
4218
  "type": "chat",
4219
- "input_price_per_1m": 5,
4220
- "output_price_per_1m": 25,
4221
  "currency": "USD",
4222
- "context_window": 131072,
4223
  "capabilities": [
4224
- "tools"
4225
  ],
4226
  "hf_private": true
4227
  },
4228
  {
4229
- "name": "anthropic/claude-opus-4-5",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4230
  "type": "vision",
4231
  "input_price_per_1m": 5,
4232
  "output_price_per_1m": 25,
@@ -4239,7 +4227,7 @@
4239
  "hf_private": true
4240
  },
4241
  {
4242
- "name": "anthropic/claude-opus-4-6",
4243
  "type": "vision",
4244
  "input_price_per_1m": 5,
4245
  "output_price_per_1m": 25,
@@ -4263,6 +4251,18 @@
4263
  "context_window": 128000,
4264
  "hf_private": true
4265
  },
 
 
 
 
 
 
 
 
 
 
 
 
4266
  {
4267
  "name": "bedrock/claude-opus-4-5",
4268
  "type": "vision",
@@ -4290,7 +4290,7 @@
4290
  "hf_private": true
4291
  },
4292
  {
4293
- "name": "vertex/claude-opus-4-6",
4294
  "type": "vision",
4295
  "input_price_per_1m": 5,
4296
  "output_price_per_1m": 25,
@@ -4299,11 +4299,11 @@
4299
  "vision",
4300
  "reasoning"
4301
  ],
4302
- "context_window": 1000000,
4303
  "hf_private": true
4304
  },
4305
  {
4306
- "name": "vertex/claude-opus-4-5",
4307
  "type": "vision",
4308
  "input_price_per_1m": 5,
4309
  "output_price_per_1m": 25,
@@ -4312,7 +4312,7 @@
4312
  "vision",
4313
  "reasoning"
4314
  ],
4315
- "context_window": 200000,
4316
  "hf_private": true
4317
  },
4318
  {
@@ -4329,20 +4329,20 @@
4329
  "hf_private": true
4330
  },
4331
  {
4332
- "name": "anthropic/claude-opus-4",
4333
  "type": "vision",
4334
  "input_price_per_1m": 15,
4335
- "output_price_per_1m": 75,
4336
  "currency": "USD",
4337
  "capabilities": [
4338
  "vision",
4339
  "reasoning"
4340
  ],
4341
- "context_window": 200000,
4342
  "hf_private": true
4343
  },
4344
  {
4345
- "name": "anthropic/claude-opus-4-1",
4346
  "type": "vision",
4347
  "input_price_per_1m": 15,
4348
  "output_price_per_1m": 75,
@@ -4355,16 +4355,16 @@
4355
  "hf_private": true
4356
  },
4357
  {
4358
- "name": "openai-responses/gpt-5-pro",
4359
  "type": "vision",
4360
  "input_price_per_1m": 15,
4361
- "output_price_per_1m": 120,
4362
  "currency": "USD",
4363
  "capabilities": [
4364
  "vision",
4365
  "reasoning"
4366
  ],
4367
- "context_window": 400000,
4368
  "hf_private": true
4369
  },
4370
  {
@@ -4381,7 +4381,7 @@
4381
  "hf_private": true
4382
  },
4383
  {
4384
- "name": "bedrock/claude-opus-4",
4385
  "type": "vision",
4386
  "input_price_per_1m": 15,
4387
  "output_price_per_1m": 75,
@@ -4394,7 +4394,7 @@
4394
  "hf_private": true
4395
  },
4396
  {
4397
- "name": "coding/claude-opus-4-20250514",
4398
  "type": "vision",
4399
  "input_price_per_1m": 15,
4400
  "output_price_per_1m": 75,
@@ -4407,7 +4407,7 @@
4407
  "hf_private": true
4408
  },
4409
  {
4410
- "name": "vertex/claude-opus-4-1",
4411
  "type": "vision",
4412
  "input_price_per_1m": 15,
4413
  "output_price_per_1m": 75,
@@ -4420,7 +4420,7 @@
4420
  "hf_private": true
4421
  },
4422
  {
4423
- "name": "vertex/claude-opus-4",
4424
  "type": "vision",
4425
  "input_price_per_1m": 15,
4426
  "output_price_per_1m": 75,
@@ -4446,7 +4446,7 @@
4446
  "hf_private": true
4447
  },
4448
  {
4449
- "name": "openai-responses/gpt-5.4-pro",
4450
  "type": "vision",
4451
  "input_price_per_1m": 30,
4452
  "output_price_per_1m": 180,
@@ -4459,7 +4459,7 @@
4459
  "hf_private": true
4460
  },
4461
  {
4462
- "name": "openai/gpt-5.4-pro",
4463
  "type": "vision",
4464
  "input_price_per_1m": 30,
4465
  "output_price_per_1m": 180,
@@ -4472,7 +4472,7 @@
4472
  "hf_private": true
4473
  },
4474
  {
4475
- "name": "azure/openai-responses/gpt-5.4-pro",
4476
  "type": "vision",
4477
  "input_price_per_1m": 30,
4478
  "output_price_per_1m": 180,
@@ -5052,7 +5052,10 @@
5052
  "currency": "USD",
5053
  "size_b": 405,
5054
  "flavor": "base",
5055
- "hf_private": false
 
 
 
5056
  },
5057
  {
5058
  "name": "gemma-3-27b-it",
@@ -5296,7 +5299,14 @@
5296
  "output_price_per_1m": 2,
5297
  "currency": "EUR",
5298
  "size_b": 123,
5299
- "hf_private": false
 
 
 
 
 
 
 
5300
  },
5301
  {
5302
  "name": "whisper-large-v3",
 
1163
  "gdpr_compliant": true,
1164
  "eu_endpoints": true,
1165
  "models": [
 
 
 
 
 
 
 
 
 
 
1166
  {
1167
  "name": "novita/meta-llama/llama-3.2-1b-instruct",
1168
  "type": "chat",
 
1176
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1177
  "hf_status": 200
1178
  },
1179
+ {
1180
+ "name": "deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
1181
+ "type": "chat",
1182
+ "input_price_per_1m": 0.02,
1183
+ "output_price_per_1m": 0.05,
1184
+ "currency": "USD",
1185
+ "context_window": 131072,
1186
+ "size_b": 8,
1187
+ "hf_private": false
1188
+ },
1189
  {
1190
  "name": "openai/gpt-5-nano",
1191
  "type": "vision",
 
1229
  "hf_status": 200
1230
  },
1231
  {
1232
+ "name": "azure/gpt-5-nano",
1233
+ "type": "chat",
1234
  "input_price_per_1m": 0.05,
1235
  "output_price_per_1m": 0.4,
1236
  "currency": "USD",
1237
  "capabilities": [
 
1238
  "reasoning"
1239
  ],
1240
+ "context_window": 200000,
1241
  "hf_private": true
1242
  },
1243
  {
1244
+ "name": "novita/meta-llama/llama-3.1-8b-instruct",
1245
  "type": "chat",
1246
  "input_price_per_1m": 0.05,
1247
  "output_price_per_1m": 0.05,
1248
  "currency": "USD",
1249
+ "context_window": 16384,
1250
  "size_b": 8,
1251
+ "capabilities": [
1252
+ "tools"
1253
+ ],
1254
+ "hf_private": false,
1255
+ "hf_id": "meta-llama/Meta-Llama-3.1-8B-Instruct",
1256
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
1257
+ "hf_status": 200
1258
  },
1259
  {
1260
  "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
 
1267
  "hf_private": false
1268
  },
1269
  {
1270
+ "name": "novita/sao10k/l3-8b-lunaris",
1271
  "type": "chat",
1272
  "input_price_per_1m": 0.05,
1273
  "output_price_per_1m": 0.05,
1274
  "currency": "USD",
1275
+ "context_window": 8192,
1276
  "size_b": 8,
1277
+ "hf_private": false
 
 
 
 
 
 
1278
  },
1279
  {
1280
+ "name": "openai-responses/gpt-5-nano",
1281
+ "type": "vision",
1282
  "input_price_per_1m": 0.05,
1283
+ "output_price_per_1m": 0.4,
1284
  "currency": "USD",
 
1285
  "capabilities": [
1286
+ "vision",
1287
+ "reasoning"
1288
  ],
1289
+ "context_window": 400000,
1290
  "hf_private": true
1291
  },
1292
  {
1293
+ "name": "alibaba/qwen-turbo",
1294
  "type": "chat",
1295
  "input_price_per_1m": 0.05,
1296
+ "output_price_per_1m": 0.2,
1297
  "currency": "USD",
1298
+ "context_window": 1000000,
1299
  "capabilities": [
1300
+ "tools"
1301
  ],
 
1302
  "hf_private": true
1303
  },
1304
  {
 
1349
  "hf_status": 200
1350
  },
1351
  {
1352
+ "name": "azure/openai-responses/gpt-4.1-nano",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1353
  "type": "vision",
1354
  "input_price_per_1m": 0.1,
1355
  "output_price_per_1m": 0.4,
1356
  "currency": "USD",
1357
  "capabilities": [
1358
+ "vision"
 
1359
  ],
1360
+ "context_window": 1047576,
1361
  "hf_private": true
1362
  },
1363
  {
1364
+ "name": "azure/gpt-4.1-nano",
1365
  "type": "vision",
1366
  "input_price_per_1m": 0.1,
1367
  "output_price_per_1m": 0.4,
 
1369
  "capabilities": [
1370
  "vision"
1371
  ],
1372
+ "context_window": 1047576,
1373
  "hf_private": true
1374
  },
1375
  {
1376
+ "name": "mistral/devstral-small-2507",
1377
  "type": "chat",
1378
  "input_price_per_1m": 0.1,
1379
  "output_price_per_1m": 0.3,
 
1389
  "hf_status": 200
1390
  },
1391
  {
1392
+ "name": "mistral/devstral-small-latest",
 
 
 
 
 
 
 
 
 
1393
  "type": "chat",
1394
  "input_price_per_1m": 0.1,
1395
  "output_price_per_1m": 0.3,
 
1404
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1405
  "hf_status": 200
1406
  },
1407
+ {
1408
+ "name": "mistral/mistral-small-2503",
1409
+ "type": "chat",
1410
+ "input_price_per_1m": 0.1,
1411
+ "output_price_per_1m": 0.3,
1412
+ "currency": "USD",
1413
+ "context_window": 32768,
1414
+ "hf_private": true
1415
+ },
1416
  {
1417
  "name": "openai-responses/gpt-4.1-nano",
1418
  "type": "vision",
 
1425
  "context_window": 1047576,
1426
  "hf_private": true
1427
  },
1428
+ {
1429
+ "name": "vertex/gemini-2.5-flash-lite",
1430
+ "type": "vision",
1431
+ "input_price_per_1m": 0.1,
1432
+ "output_price_per_1m": 0.4,
1433
+ "currency": "USD",
1434
+ "capabilities": [
1435
+ "vision",
1436
+ "reasoning"
1437
+ ],
1438
+ "context_window": 1048576,
1439
+ "hf_private": true
1440
+ },
1441
  {
1442
  "name": "openai/gpt-4.1-nano",
1443
  "type": "vision",
 
1451
  "hf_private": true
1452
  },
1453
  {
1454
+ "name": "deepinfra/Qwen/Qwen3-32B",
1455
  "type": "chat",
1456
  "input_price_per_1m": 0.1,
1457
+ "output_price_per_1m": 0.3,
1458
  "currency": "USD",
1459
+ "context_window": 40000,
1460
+ "size_b": 32,
1461
+ "capabilities": [
1462
+ "tools",
1463
+ "reasoning"
1464
+ ],
1465
+ "hf_id": "Qwen/Qwen3-32B",
1466
+ "hf_private": false,
1467
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
1468
+ "hf_status": 200
1469
  },
1470
  {
1471
+ "name": "google/gemini-2.0-flash-001",
1472
  "type": "vision",
1473
  "input_price_per_1m": 0.1,
1474
  "output_price_per_1m": 0.4,
1475
  "currency": "USD",
1476
  "capabilities": [
1477
+ "vision"
 
1478
  ],
1479
  "context_window": 1048576,
1480
  "hf_private": true
1481
  },
1482
  {
1483
+ "name": "google/gemini-2.5-flash-lite",
1484
  "type": "vision",
1485
  "input_price_per_1m": 0.1,
1486
  "output_price_per_1m": 0.4,
1487
  "currency": "USD",
1488
  "capabilities": [
1489
+ "vision",
1490
+ "reasoning"
1491
  ],
1492
+ "context_window": 1048576,
1493
  "hf_private": true
1494
  },
1495
  {
1496
+ "name": "groq/openai/gpt-oss-20b",
1497
+ "type": "chat",
1498
  "input_price_per_1m": 0.1,
1499
+ "output_price_per_1m": 0.5,
1500
  "currency": "USD",
1501
+ "context_window": 131072,
1502
+ "size_b": 20,
1503
  "capabilities": [
1504
+ "tools",
1505
+ "reasoning"
1506
  ],
1507
+ "hf_id": "openai/gpt-oss-20b",
1508
+ "hf_private": false,
1509
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
1510
+ "hf_status": 200
1511
+ },
1512
+ {
1513
+ "name": "together/meta-llama/Meta-Llama-3-8B-Instruct-Lite",
1514
+ "type": "chat",
1515
+ "input_price_per_1m": 0.1,
1516
+ "output_price_per_1m": 0.1,
1517
+ "currency": "USD",
1518
+ "context_window": 8192,
1519
+ "size_b": 8,
1520
+ "hf_private": false
1521
  },
1522
  {
1523
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo",
 
1575
  "hf_status": 200
1576
  },
1577
  {
1578
+ "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
1579
  "type": "chat",
1580
  "input_price_per_1m": 0.15,
1581
+ "output_price_per_1m": 0.15,
1582
  "currency": "USD",
1583
+ "context_window": 128000,
1584
+ "size_b": 14,
1585
  "capabilities": [
1586
  "tools",
1587
  "reasoning"
1588
  ],
1589
+ "hf_id": "deepseek-ai/DeepSeek-R1",
1590
+ "size_source": "manual",
1591
  "hf_private": false,
1592
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1593
  "hf_status": 200
1594
  },
1595
  {
1596
+ "name": "mistral/mistral-small-2603",
1597
+ "type": "vision",
1598
  "input_price_per_1m": 0.15,
1599
  "output_price_per_1m": 0.6,
1600
  "currency": "USD",
1601
  "capabilities": [
1602
+ "vision",
1603
  "reasoning"
1604
  ],
1605
+ "context_window": 256000,
1606
+ "size_b": 119,
1607
+ "hf_id": "mistralai/Mistral-Small-4-119B-2603",
1608
  "hf_private": false,
1609
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1610
  "hf_status": 200
1611
  },
 
 
 
 
 
 
 
 
 
 
1612
  {
1613
  "name": "mistral/mistral-small-latest",
1614
  "type": "vision",
 
1622
  "context_window": 256000,
1623
  "hf_private": true
1624
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1625
  {
1626
  "name": "openai/gpt-4o-mini",
1627
  "type": "vision",
 
1635
  "hf_private": true
1636
  },
1637
  {
1638
+ "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1639
  "type": "chat",
1640
  "input_price_per_1m": 0.15,
1641
+ "output_price_per_1m": 0.85,
1642
  "currency": "USD",
1643
+ "context_window": 262144,
1644
+ "size_b": 235,
1645
+ "hf_private": false
1646
+ },
1647
+ {
1648
+ "name": "groq/openai/gpt-oss-120b",
1649
+ "type": "chat",
1650
+ "input_price_per_1m": 0.15,
1651
+ "output_price_per_1m": 0.75,
1652
+ "currency": "USD",
1653
+ "context_window": 131072,
1654
+ "size_b": 120,
1655
  "capabilities": [
1656
  "tools",
1657
  "reasoning"
1658
  ],
1659
+ "hf_id": "openai/gpt-oss-120b",
1660
+ "hf_private": false,
1661
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
1662
+ "hf_status": 200
1663
+ },
1664
+ {
1665
+ "name": "nebius/openai/gpt-oss-120b",
1666
+ "type": "chat",
1667
+ "input_price_per_1m": 0.15,
1668
+ "output_price_per_1m": 0.6,
1669
+ "currency": "USD",
1670
+ "capabilities": [
1671
+ "reasoning"
1672
+ ],
1673
+ "context_window": 131000,
1674
+ "size_b": 120,
1675
+ "hf_id": "openai/gpt-oss-120b",
1676
  "hf_private": false,
1677
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1678
  "hf_status": 200
 
1704
  "hf_private": false
1705
  },
1706
  {
1707
+ "name": "novita/qwen/qwen3-235b-a22b-fp8",
1708
  "type": "chat",
1709
  "input_price_per_1m": 0.2,
1710
+ "output_price_per_1m": 0.8,
1711
  "currency": "USD",
1712
+ "context_window": 128000,
1713
+ "size_b": 235,
1714
  "capabilities": [
1715
  "tools",
1716
  "reasoning"
1717
  ],
1718
+ "hf_id": "Qwen/Qwen3-235B-A22B",
 
1719
  "hf_private": false,
1720
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1721
  "hf_status": 200
1722
  },
1723
  {
1724
+ "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1725
  "type": "chat",
1726
  "input_price_per_1m": 0.2,
1727
+ "output_price_per_1m": 0.85,
1728
  "currency": "USD",
1729
+ "context_window": 1048576,
1730
+ "size_b": 17,
1731
  "capabilities": [
1732
+ "vision",
1733
+ "tools"
1734
  ],
1735
+ "hf_private": false
 
 
 
1736
  },
1737
  {
1738
+ "name": "openai-responses/gpt-5.4-nano",
1739
+ "type": "vision",
1740
  "input_price_per_1m": 0.2,
1741
+ "output_price_per_1m": 1.25,
1742
  "currency": "USD",
 
1743
  "capabilities": [
1744
  "vision",
 
1745
  "reasoning"
1746
  ],
1747
+ "context_window": 400000,
1748
  "hf_private": true
1749
  },
1750
  {
1751
+ "name": "openai/gpt-5.4-nano",
1752
  "type": "vision",
1753
  "input_price_per_1m": 0.2,
1754
+ "output_price_per_1m": 1.25,
1755
  "currency": "USD",
1756
  "capabilities": [
1757
+ "vision",
1758
+ "reasoning"
1759
  ],
1760
+ "context_window": 400000,
1761
  "hf_private": true
1762
  },
1763
  {
1764
+ "name": "xai/grok-4-1-fast-reasoning",
1765
  "type": "vision",
1766
  "input_price_per_1m": 0.2,
1767
+ "output_price_per_1m": 0.5,
1768
  "currency": "USD",
1769
  "capabilities": [
1770
  "vision"
1771
  ],
1772
+ "context_window": 2000000,
1773
  "hf_private": true
1774
  },
1775
  {
1776
+ "name": "xai/grok-code-fast-1",
1777
  "type": "vision",
1778
  "input_price_per_1m": 0.2,
1779
+ "output_price_per_1m": 1.5,
1780
  "currency": "USD",
1781
  "capabilities": [
1782
  "vision"
1783
  ],
1784
+ "context_window": 256000,
1785
  "hf_private": true
1786
  },
1787
  {
 
1799
  "hf_private": true
1800
  },
1801
  {
1802
+ "name": "xai/grok-4-1-fast-non-reasoning",
1803
  "type": "vision",
1804
  "input_price_per_1m": 0.2,
1805
+ "output_price_per_1m": 0.5,
1806
  "currency": "USD",
1807
  "capabilities": [
1808
+ "vision"
 
1809
  ],
1810
+ "context_window": 2000000,
1811
  "hf_private": true
1812
  },
1813
  {
1814
+ "name": "xai/grok-4-fast",
1815
+ "type": "chat",
1816
  "input_price_per_1m": 0.2,
1817
+ "output_price_per_1m": 0.5,
1818
  "currency": "USD",
1819
+ "context_window": 2000000,
1820
  "capabilities": [
1821
  "vision",
1822
+ "tools",
1823
  "reasoning"
1824
  ],
 
1825
  "hf_private": true
1826
  },
1827
  {
1828
+ "name": "deepinfra/Qwen/Qwen3-235B-A22B",
1829
  "type": "chat",
1830
  "input_price_per_1m": 0.2,
1831
+ "output_price_per_1m": 0.6,
1832
  "currency": "USD",
1833
+ "context_window": 40000,
1834
+ "size_b": 235,
1835
  "capabilities": [
1836
+ "tools",
1837
+ "reasoning"
1838
  ],
1839
+ "hf_id": "Qwen/Qwen3-235B-A22B",
1840
+ "hf_private": false,
1841
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
1842
+ "hf_status": 200
1843
  },
1844
  {
1845
+ "name": "deepinfra/zai-org/GLM-4.5-Air",
1846
  "type": "chat",
1847
  "input_price_per_1m": 0.2,
1848
+ "output_price_per_1m": 1.1,
1849
  "currency": "USD",
1850
+ "context_window": 131072,
 
1851
  "capabilities": [
1852
  "tools",
1853
  "reasoning"
1854
  ],
1855
+ "hf_id": "zai-org/GLM-4.5-Air",
1856
+ "size_b": 110.5,
1857
  "hf_private": false,
1858
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1859
  "hf_status": 200
 
1884
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1885
  "hf_status": 200
1886
  },
1887
+ {
1888
+ "name": "deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct",
1889
+ "type": "chat",
1890
+ "input_price_per_1m": 0.23,
1891
+ "output_price_per_1m": 0.4,
1892
+ "currency": "USD",
1893
+ "context_window": 130815,
1894
+ "size_b": 70,
1895
+ "hf_private": false
1896
+ },
1897
  {
1898
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct",
1899
  "type": "chat",
 
1926
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
1927
  "hf_status": 200
1928
  },
 
 
 
 
 
 
 
 
 
 
1929
  {
1930
  "name": "deepinfra/Qwen/Qwen2.5-72B-Instruct",
1931
  "type": "chat",
 
1943
  "hf_status": 200
1944
  },
1945
  {
1946
+ "name": "azure/gpt-5-mini",
1947
+ "type": "chat",
1948
  "input_price_per_1m": 0.25,
1949
+ "output_price_per_1m": 2,
1950
  "currency": "USD",
1951
  "capabilities": [
1952
+ "reasoning"
1953
  ],
1954
+ "context_window": 200000,
1955
  "hf_private": true
1956
  },
1957
  {
 
1990
  "hf_private": true
1991
  },
1992
  {
1993
+ "name": "google/gemini-3.1-flash-lite-preview",
1994
+ "type": "vision",
1995
  "input_price_per_1m": 0.25,
1996
+ "output_price_per_1m": 1.5,
1997
  "currency": "USD",
1998
  "capabilities": [
1999
+ "vision"
2000
  ],
2001
+ "context_window": 1048576,
2002
  "hf_private": true
2003
  },
2004
  {
 
2044
  "hf_private": true
2045
  },
2046
  {
2047
+ "name": "novita/minimax-m2.7",
2048
+ "type": "vision",
2049
  "input_price_per_1m": 0.3,
2050
+ "output_price_per_1m": 1.2,
2051
  "currency": "USD",
2052
  "capabilities": [
2053
+ "vision",
2054
  "reasoning"
2055
  ],
2056
+ "context_window": 200000,
 
 
2057
  "hf_private": false,
2058
+ "size_b": 230,
2059
+ "size_source": "manual",
2060
+ "hf_id": "MiniMaxAI/MiniMax-M2.7",
2061
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2062
  "hf_status": 200
2063
  },
2064
  {
2065
+ "name": "novita/deepseek/deepseek-r1-distill-qwen-32b",
2066
  "type": "chat",
2067
  "input_price_per_1m": 0.3,
2068
+ "output_price_per_1m": 0.3,
2069
  "currency": "USD",
2070
+ "context_window": 12800,
2071
+ "size_b": 32,
2072
  "capabilities": [
2073
  "reasoning"
2074
  ],
2075
+ "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
 
 
2076
  "hf_private": false,
2077
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2078
  "hf_status": 200
2079
  },
2080
  {
2081
+ "name": "novita/MiniMax-M2.7",
2082
+ "type": "vision",
2083
  "input_price_per_1m": 0.3,
2084
+ "output_price_per_1m": 1.2,
2085
  "currency": "USD",
 
2086
  "capabilities": [
2087
+ "vision",
2088
  "reasoning"
2089
  ],
2090
+ "context_window": 200000,
 
2091
  "hf_private": false,
2092
+ "size_b": 230,
2093
+ "size_source": "manual",
2094
+ "hf_id": "MiniMaxAI/MiniMax-M2.7",
2095
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2096
  "hf_status": 200
2097
  },
2098
  {
2099
+ "name": "minimaxi/MiniMax-M2.7",
2100
+ "type": "vision",
 
 
 
 
 
 
 
 
 
 
2101
  "input_price_per_1m": 0.3,
2102
+ "output_price_per_1m": 1.2,
2103
  "currency": "USD",
2104
  "capabilities": [
2105
+ "vision",
2106
  "reasoning"
2107
  ],
2108
+ "context_window": 200000,
2109
+ "hf_private": false,
2110
+ "size_b": 230,
2111
+ "size_source": "manual",
2112
+ "hf_id": "MiniMaxAI/MiniMax-M2.7",
2113
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2114
+ "hf_status": 200
2115
  },
2116
  {
2117
+ "name": "minimaxi/MiniMax-M2.5",
2118
  "type": "vision",
2119
  "input_price_per_1m": 0.3,
2120
+ "output_price_per_1m": 1.2,
2121
  "currency": "USD",
2122
  "capabilities": [
2123
  "vision",
2124
  "reasoning"
2125
  ],
2126
+ "context_window": 200000,
2127
+ "hf_id": "MiniMaxAI/MiniMax-M2.5",
2128
+ "size_b": 228.7,
2129
+ "hf_private": false,
2130
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2131
+ "hf_status": 200
2132
  },
2133
  {
2134
+ "name": "minimaxi/MiniMax-M2",
2135
+ "type": "chat",
2136
+ "input_price_per_1m": 0.3,
2137
+ "output_price_per_1m": 1.2,
2138
+ "currency": "USD",
2139
+ "context_window": 200000,
2140
+ "capabilities": [
2141
+ "tools",
2142
+ "reasoning"
2143
+ ],
2144
+ "hf_id": "MiniMaxAI/MiniMax-M2",
2145
+ "size_b": 228.7,
2146
+ "hf_private": false,
2147
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2148
+ "hf_status": 200
2149
+ },
2150
+ {
2151
+ "name": "mistral/codestral-latest",
2152
  "type": "chat",
2153
  "input_price_per_1m": 0.3,
2154
  "output_price_per_1m": 0.9,
 
2157
  "hf_private": true
2158
  },
2159
  {
2160
+ "name": "vertex/gemini-2.5-flash",
2161
  "type": "vision",
2162
  "input_price_per_1m": 0.3,
2163
+ "output_price_per_1m": 2.5,
2164
  "currency": "USD",
2165
  "capabilities": [
2166
  "vision",
2167
  "reasoning"
2168
  ],
2169
+ "context_window": 1048576,
2170
+ "hf_private": true
 
 
 
 
 
2171
  },
2172
  {
2173
+ "name": "vertex/gemini-2.5-flash-image",
2174
  "type": "vision",
2175
  "input_price_per_1m": 0.3,
2176
+ "output_price_per_1m": 2.5,
2177
  "currency": "USD",
2178
  "capabilities": [
2179
  "vision",
2180
  "reasoning"
2181
  ],
2182
+ "context_window": 1048576,
2183
+ "hf_private": true
 
 
 
 
 
2184
  },
2185
  {
2186
+ "name": "xai/grok-3-mini",
2187
  "type": "chat",
2188
  "input_price_per_1m": 0.3,
2189
+ "output_price_per_1m": 0.5,
2190
  "currency": "USD",
 
 
2191
  "capabilities": [
2192
  "reasoning"
2193
  ],
2194
+ "context_window": 131072,
2195
+ "hf_private": true
 
 
2196
  },
2197
  {
2198
  "name": "coding/gemini-2.5-flash",
 
2208
  "hf_private": true
2209
  },
2210
  {
2211
+ "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
2212
  "type": "chat",
2213
  "input_price_per_1m": 0.3,
2214
+ "output_price_per_1m": 1,
2215
  "currency": "USD",
2216
+ "context_window": 163840,
2217
+ "capabilities": [
2218
+ "tools",
2219
+ "reasoning"
2220
+ ],
2221
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2222
+ "size_b": 671,
2223
+ "hf_private": false,
2224
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2225
+ "hf_status": 200
2226
  },
2227
  {
2228
+ "name": "google/gemini-2.5-flash",
2229
  "type": "vision",
2230
  "input_price_per_1m": 0.3,
2231
+ "output_price_per_1m": 2.5,
2232
  "currency": "USD",
2233
  "capabilities": [
2234
+ "vision",
2235
+ "reasoning"
2236
  ],
2237
  "context_window": 1048576,
2238
  "hf_private": true
2239
  },
2240
  {
2241
+ "name": "parasail/parasail-gemma3-27b-it",
2242
+ "type": "chat",
2243
  "input_price_per_1m": 0.3,
2244
+ "output_price_per_1m": 0.5,
2245
  "currency": "USD",
2246
+ "context_window": 128000,
2247
+ "size_b": 27,
2248
+ "hf_private": false
 
 
 
 
 
 
 
 
2249
  },
2250
  {
2251
+ "name": "nebius/minimax/minimax-m2.1",
2252
  "type": "chat",
2253
  "input_price_per_1m": 0.3,
2254
  "output_price_per_1m": 1.2,
2255
  "currency": "USD",
 
2256
  "capabilities": [
 
2257
  "reasoning"
2258
  ],
2259
+ "context_window": 200000,
2260
+ "hf_id": "MiniMaxAI/MiniMax-M2.1",
2261
  "size_b": 228.7,
2262
  "hf_private": false,
2263
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2264
  "hf_status": 200
2265
  },
2266
  {
2267
+ "name": "nebius/deepseek-ai/DeepSeek-V3.2",
2268
+ "type": "chat",
2269
  "input_price_per_1m": 0.3,
2270
+ "output_price_per_1m": 0.45,
2271
  "currency": "USD",
2272
  "capabilities": [
 
2273
  "reasoning"
2274
  ],
2275
+ "context_window": 164000,
2276
+ "hf_id": "deepseek-ai/DeepSeek-V3.2",
2277
+ "size_b": 685.4,
2278
  "hf_private": false,
2279
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2280
  "hf_status": 200
2281
  },
2282
  {
2283
+ "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
2284
+ "type": "chat",
2285
  "input_price_per_1m": 0.3,
2286
+ "output_price_per_1m": 0.3,
2287
  "currency": "USD",
2288
+ "context_window": 32768,
2289
+ "size_b": 7,
2290
+ "hf_private": false
 
 
 
2291
  },
2292
  {
2293
+ "name": "alibaba/qwen3-coder-flash",
2294
  "type": "vision",
2295
  "input_price_per_1m": 0.3,
2296
+ "output_price_per_1m": 1.5,
2297
  "currency": "USD",
2298
  "capabilities": [
2299
+ "vision"
 
2300
  ],
2301
  "context_window": 1048576,
2302
  "hf_private": true
 
2344
  "hf_status": 200
2345
  },
2346
  {
2347
+ "name": "azure/gpt-4.1-mini",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2348
  "type": "vision",
2349
  "input_price_per_1m": 0.4,
2350
  "output_price_per_1m": 1.6,
 
2356
  "hf_private": true
2357
  },
2358
  {
2359
+ "name": "azure/openai-responses/gpt-4.1-mini",
2360
  "type": "vision",
2361
  "input_price_per_1m": 0.4,
2362
  "output_price_per_1m": 1.6,
 
2394
  "hf_status": 200
2395
  },
2396
  {
2397
+ "name": "mistral/devstral-medium-2507",
2398
  "type": "chat",
2399
  "input_price_per_1m": 0.4,
2400
+ "output_price_per_1m": 2,
2401
  "currency": "USD",
2402
  "context_window": 131072,
2403
  "capabilities": [
 
2406
  "hf_private": true
2407
  },
2408
  {
2409
+ "name": "mistral/mistral-medium-latest",
2410
+ "type": "chat",
2411
+ "input_price_per_1m": 0.4,
2412
+ "output_price_per_1m": 2,
2413
+ "currency": "USD",
2414
+ "context_window": 131072,
2415
+ "hf_private": true
2416
+ },
2417
+ {
2418
+ "name": "mistral/devstral-latest",
2419
+ "type": "chat",
2420
+ "input_price_per_1m": 0.4,
2421
+ "output_price_per_1m": 2,
2422
+ "currency": "USD",
2423
+ "context_window": 256000,
2424
+ "hf_private": true
2425
+ },
2426
+ {
2427
+ "name": "openai-responses/gpt-4.1-mini",
2428
  "type": "vision",
2429
  "input_price_per_1m": 0.4,
2430
  "output_price_per_1m": 1.6,
 
2436
  "hf_private": true
2437
  },
2438
  {
2439
+ "name": "openai/gpt-4.1-mini",
2440
  "type": "vision",
2441
  "input_price_per_1m": 0.4,
2442
  "output_price_per_1m": 1.6,
 
2448
  "hf_private": true
2449
  },
2450
  {
2451
+ "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2452
  "type": "chat",
2453
+ "input_price_per_1m": 0.4,
2454
+ "output_price_per_1m": 1.6,
2455
  "currency": "USD",
2456
+ "context_window": 262144,
2457
+ "size_b": 480,
2458
  "capabilities": [
2459
+ "tools"
 
2460
  ],
2461
+ "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
 
2462
  "hf_private": false,
2463
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2464
  "hf_status": 200
2465
  },
2466
  {
2467
+ "name": "nebius/zai-org/GLM-4.7",
2468
+ "type": "chat",
2469
+ "input_price_per_1m": 0.4,
2470
+ "output_price_per_1m": 2,
2471
  "currency": "USD",
2472
  "capabilities": [
 
2473
  "reasoning"
2474
  ],
2475
+ "context_window": 200000,
2476
+ "hf_id": "zai-org/GLM-4.7",
2477
+ "size_b": 358.3,
2478
  "hf_private": false,
2479
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2480
  "hf_status": 200
2481
  },
2482
  {
2483
+ "name": "nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2484
  "type": "chat",
2485
+ "input_price_per_1m": 0.4,
2486
+ "output_price_per_1m": 1.8,
2487
  "currency": "USD",
2488
+ "context_window": 262000,
2489
+ "size_b": 480,
2490
  "capabilities": [
2491
  "tools"
2492
  ],
2493
+ "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
 
2494
  "hf_private": false,
2495
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2496
  "hf_status": 200
2497
  },
2498
  {
2499
+ "name": "alibaba/qwen-plus",
2500
+ "type": "chat",
2501
+ "input_price_per_1m": 0.4,
2502
+ "output_price_per_1m": 1.2,
 
 
 
 
 
 
 
 
 
 
 
 
 
2503
  "currency": "USD",
2504
+ "context_window": 131072,
2505
  "capabilities": [
2506
+ "tools"
 
2507
  ],
 
2508
  "hf_private": true
2509
  },
2510
  {
 
2546
  "hf_private": true
2547
  },
2548
  {
2549
+ "name": "google/gemini-3.1-flash-image-preview",
2550
+ "type": "vision",
2551
+ "input_price_per_1m": 0.5,
2552
+ "output_price_per_1m": 2,
2553
  "currency": "USD",
 
 
2554
  "capabilities": [
2555
+ "vision",
2556
+ "reasoning"
2557
  ],
2558
+ "context_window": 131072,
2559
+ "hf_private": true
 
 
2560
  },
2561
  {
2562
+ "name": "google/gemini-3-flash-preview",
2563
+ "type": "vision",
2564
+ "input_price_per_1m": 0.5,
2565
+ "output_price_per_1m": 3,
2566
  "currency": "USD",
2567
  "capabilities": [
2568
+ "vision",
2569
  "reasoning"
2570
  ],
2571
+ "context_window": 1048576,
2572
  "hf_private": true
2573
  },
2574
  {
2575
+ "name": "nebius/deepseek-ai/DeepSeek-V3-0324",
2576
+ "type": "chat",
2577
+ "input_price_per_1m": 0.5,
2578
+ "output_price_per_1m": 1.5,
2579
  "currency": "USD",
2580
+ "context_window": 128000,
2581
  "capabilities": [
2582
+ "tools",
2583
  "reasoning"
2584
  ],
2585
+ "size_b": 685,
2586
+ "hf_id": "deepseek-ai/DeepSeek-V3-0324",
 
2587
  "hf_private": false,
2588
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2589
  "hf_status": 200
2590
  },
2591
  {
2592
+ "name": "nebius/moonshotai/Kimi-K2-Instruct",
2593
  "type": "chat",
2594
+ "input_price_per_1m": 0.5,
2595
+ "output_price_per_1m": 2.4,
2596
  "currency": "USD",
2597
+ "context_window": 131000,
2598
  "capabilities": [
2599
  "tools"
2600
  ],
 
2605
  "hf_status": 200
2606
  },
2607
  {
2608
+ "name": "nebius/moonshotai/kimi-k2.5",
2609
+ "type": "vision",
2610
+ "input_price_per_1m": 0.5,
2611
+ "output_price_per_1m": 2.5,
2612
  "currency": "USD",
 
2613
  "capabilities": [
2614
+ "vision",
2615
  "reasoning"
2616
  ],
2617
+ "context_window": 256000,
2618
+ "hf_id": "moonshotai/Kimi-K2.5",
2619
+ "size_b": 1058.6,
2620
  "hf_private": false,
2621
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2622
  "hf_status": 200
2623
  },
2624
  {
2625
+ "name": "novita/meta-llama/llama-3-70b-instruct",
2626
  "type": "chat",
2627
+ "input_price_per_1m": 0.51,
2628
+ "output_price_per_1m": 0.74,
2629
  "currency": "USD",
2630
+ "context_window": 8192,
2631
+ "size_b": 70,
2632
  "capabilities": [
2633
+ "tools"
 
2634
  ],
 
 
2635
  "hf_private": false,
2636
+ "hf_id": "meta-llama/Meta-Llama-3-70B-Instruct",
2637
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2638
  "hf_status": 200
2639
  },
2640
  {
2641
+ "name": "openai/o4-mini",
2642
  "type": "chat",
2643
+ "input_price_per_1m": 0.55,
2644
  "output_price_per_1m": 2.2,
2645
  "currency": "USD",
2646
  "capabilities": [
2647
  "reasoning"
2648
  ],
2649
+ "context_window": 200000,
2650
+ "hf_private": true
 
 
 
 
2651
  },
2652
  {
2653
+ "name": "vertex/deepseek-v3.2",
2654
+ "type": "vision",
2655
+ "input_price_per_1m": 0.56,
2656
+ "output_price_per_1m": 1.68,
2657
  "currency": "USD",
2658
  "capabilities": [
2659
+ "vision",
2660
  "reasoning"
2661
  ],
2662
+ "context_window": 163840,
2663
+ "hf_id": "deepseek-ai/DeepSeek-V3.2",
2664
+ "size_b": 685.4,
2665
  "hf_private": false,
2666
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2667
  "hf_status": 200
2668
  },
2669
  {
2670
+ "name": "novita/moonshotai/kimi-k2-instruct",
2671
  "type": "chat",
2672
+ "input_price_per_1m": 0.57,
2673
+ "output_price_per_1m": 2.3,
2674
  "currency": "USD",
2675
+ "context_window": 131072,
2676
  "capabilities": [
2677
+ "tools"
2678
  ],
2679
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2680
+ "size_b": 1026.5,
 
2681
  "hf_private": false,
2682
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2683
  "hf_status": 200
 
2716
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2717
  "hf_status": 200
2718
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2719
  {
2720
  "name": "minimaxi/MiniMax-M2.7-highspeed",
2721
  "type": "vision",
 
2748
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2749
  "hf_status": 200
2750
  },
2751
+ {
2752
+ "name": "moonshot/kimi-k2-0711-preview",
2753
+ "type": "chat",
2754
+ "input_price_per_1m": 0.6,
2755
+ "output_price_per_1m": 2.5,
2756
+ "currency": "USD",
2757
+ "context_window": 131072,
2758
+ "capabilities": [
2759
+ "tools"
2760
+ ],
2761
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2762
+ "size_b": 1026.5,
2763
+ "hf_private": false,
2764
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2765
+ "hf_status": 200
2766
+ },
2767
  {
2768
  "name": "moonshot/kimi-k2.5",
2769
  "type": "vision",
 
2831
  "hf_status": 200
2832
  },
2833
  {
2834
+ "name": "zai/GLM-4.7",
2835
  "type": "chat",
2836
  "input_price_per_1m": 0.6,
2837
+ "output_price_per_1m": 2.2,
2838
+ "currency": "USD",
2839
+ "capabilities": [
2840
+ "reasoning"
2841
+ ],
2842
+ "context_window": 200000,
2843
+ "hf_id": "zai-org/GLM-4.7",
2844
+ "size_b": 358.3,
2845
+ "hf_private": false,
2846
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2847
+ "hf_status": 200
2848
+ },
2849
+ {
2850
+ "name": "zai/GLM-4.5",
2851
+ "type": "chat",
2852
+ "input_price_per_1m": 0.6,
2853
+ "output_price_per_1m": 2.2,
2854
  "currency": "USD",
2855
+ "capabilities": [
2856
+ "reasoning"
2857
+ ],
2858
  "context_window": 131072,
2859
+ "hf_id": "zai-org/GLM-4.5",
2860
+ "size_b": 358.3,
2861
+ "hf_private": false,
2862
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2863
+ "hf_status": 200
2864
+ },
2865
+ {
2866
+ "name": "zai/GLM-4.6",
2867
+ "type": "chat",
2868
+ "input_price_per_1m": 0.6,
2869
+ "output_price_per_1m": 2.2,
2870
+ "currency": "USD",
2871
  "capabilities": [
2872
+ "reasoning"
2873
  ],
2874
+ "context_window": 200000,
2875
+ "hf_id": "zai-org/GLM-4.6",
2876
+ "size_b": 356.8,
2877
+ "hf_private": false,
2878
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2879
+ "hf_status": 200
2880
+ },
2881
+ {
2882
+ "name": "deepinfra/zai-org/GLM-4.5",
2883
+ "type": "chat",
2884
+ "input_price_per_1m": 0.6,
2885
+ "output_price_per_1m": 2.2,
2886
+ "currency": "USD",
2887
+ "context_window": 131072,
2888
+ "capabilities": [
2889
+ "tools",
2890
+ "reasoning"
2891
+ ],
2892
+ "hf_id": "zai-org/GLM-4.5",
2893
+ "size_b": 358.3,
2894
+ "hf_private": false,
2895
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2896
+ "hf_status": 200
2897
+ },
2898
+ {
2899
+ "name": "nebius/zai-org/GLM-4.5",
2900
+ "type": "chat",
2901
+ "input_price_per_1m": 0.6,
2902
+ "output_price_per_1m": 2.2,
2903
+ "currency": "USD",
2904
+ "context_window": 128000,
2905
+ "capabilities": [
2906
+ "tools",
2907
+ "reasoning"
2908
+ ],
2909
+ "hf_id": "zai-org/GLM-4.5",
2910
+ "size_b": 358.3,
2911
+ "hf_private": false,
2912
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2913
+ "hf_status": 200
2914
+ },
2915
+ {
2916
+ "name": "alibaba/qwen3.5",
2917
+ "type": "vision",
2918
+ "input_price_per_1m": 0.6,
2919
+ "output_price_per_1m": 3.6,
2920
+ "currency": "USD",
2921
+ "capabilities": [
2922
+ "vision",
2923
+ "reasoning"
2924
+ ],
2925
+ "context_window": 256000,
2926
+ "size_b": 9,
2927
+ "hf_id": "Qwen/Qwen3.5-9B",
2928
  "hf_private": false,
2929
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
2930
  "hf_status": 200
 
2956
  "hf_private": true
2957
  },
2958
  {
2959
+ "name": "novita/deepseek/deepseek-r1-turbo",
2960
+ "type": "chat",
2961
  "input_price_per_1m": 0.7,
2962
+ "output_price_per_1m": 2.5,
2963
  "currency": "USD",
2964
+ "context_window": 64000,
2965
  "capabilities": [
2966
+ "tools",
2967
+ "reasoning"
2968
  ],
2969
+ "hf_id": "deepseek-ai/DeepSeek-R1",
2970
+ "size_b": 671,
2971
+ "size_source": "manual",
2972
+ "hf_private": false,
2973
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
2974
+ "hf_status": 200
2975
  },
2976
  {
2977
  "name": "novita/deepseek/deepseek-prover-v2-671b",
 
2984
  "hf_private": false
2985
  },
2986
  {
2987
+ "name": "parasail/parasail-qwen25-vl-72b-instruct",
2988
+ "type": "vision",
2989
  "input_price_per_1m": 0.7,
2990
+ "output_price_per_1m": 0.7,
2991
  "currency": "USD",
 
2992
  "capabilities": [
2993
+ "vision"
 
2994
  ],
2995
+ "context_window": 32768,
2996
+ "size_b": 72,
2997
+ "hf_private": false
 
 
 
2998
  },
2999
  {
3000
  "name": "openai-responses/gpt-5.4-mini",
 
3023
  "hf_private": true
3024
  },
3025
  {
3026
+ "name": "novita/deepseek/deepseek-r1-distill-llama-70b",
3027
  "type": "chat",
3028
  "input_price_per_1m": 0.8,
3029
+ "output_price_per_1m": 0.8,
3030
  "currency": "USD",
3031
+ "context_window": 32000,
3032
+ "size_b": 70,
3033
  "capabilities": [
 
3034
  "reasoning"
3035
  ],
3036
+ "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
 
3037
  "hf_private": false,
3038
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3039
  "hf_status": 200
3040
  },
3041
  {
3042
+ "name": "novita/qwen/qwen2.5-vl-72b-instruct",
3043
  "type": "chat",
3044
  "input_price_per_1m": 0.8,
3045
  "output_price_per_1m": 0.8,
3046
  "currency": "USD",
3047
+ "context_window": 96000,
3048
+ "size_b": 72,
3049
+ "capabilities": [
3050
+ "vision"
3051
+ ],
3052
+ "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
3053
  "hf_private": false,
3054
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
 
3055
  "hf_status": 200
3056
  },
3057
  {
3058
+ "name": "deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct",
3059
  "type": "chat",
3060
  "input_price_per_1m": 0.8,
3061
  "output_price_per_1m": 0.8,
3062
  "currency": "USD",
3063
+ "context_window": 130815,
3064
+ "size_b": 405,
 
 
 
 
3065
  "hf_private": false,
3066
+ "hf_id": "meta-llama/Llama-3.1-405B-Instruct",
3067
+ "hf_validated_at": "2026-03-22T19:58:46.149Z",
3068
  "hf_status": 200
3069
  },
3070
  {
3071
+ "name": "nebius/deepseek-ai/DeepSeek-R1-0528",
3072
  "type": "chat",
3073
  "input_price_per_1m": 0.8,
3074
+ "output_price_per_1m": 2.4,
3075
  "currency": "USD",
3076
+ "context_window": 164000,
 
3077
  "capabilities": [
3078
+ "tools",
3079
+ "reasoning"
3080
  ],
3081
+ "hf_id": "deepseek-ai/DeepSeek-R1-0528",
3082
+ "size_b": 684.5,
3083
  "hf_private": false,
3084
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3085
  "hf_status": 200
 
3189
  "hf_status": 200
3190
  },
3191
  {
3192
+ "name": "novita/GLM-5",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3193
  "type": "chat",
3194
  "input_price_per_1m": 1,
3195
+ "output_price_per_1m": 3.2,
3196
  "currency": "USD",
 
3197
  "capabilities": [
3198
+ "reasoning"
3199
  ],
3200
+ "context_window": 202800,
3201
+ "hf_id": "zai-org/GLM-5",
3202
+ "size_b": 753.9,
3203
  "hf_private": false,
3204
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3205
  "hf_status": 200
 
3222
  "hf_status": 200
3223
  },
3224
  {
3225
+ "name": "vertex/claude-haiku-4-5",
3226
+ "type": "vision",
3227
  "input_price_per_1m": 1,
3228
+ "output_price_per_1m": 5,
3229
  "currency": "USD",
 
3230
  "capabilities": [
3231
  "vision"
3232
  ],
3233
+ "context_window": 200000,
3234
  "hf_private": true
3235
  },
3236
  {
3237
+ "name": "openai/o3",
3238
+ "type": "vision",
3239
+ "input_price_per_1m": 1,
3240
+ "output_price_per_1m": 4,
3241
+ "currency": "USD",
3242
+ "capabilities": [
3243
+ "vision",
3244
+ "reasoning"
3245
+ ],
3246
+ "context_window": 200000,
3247
+ "hf_private": true
3248
+ },
3249
+ {
3250
+ "name": "bedrock/claude-haiku-4-5",
3251
  "type": "vision",
3252
  "input_price_per_1m": 1,
3253
  "output_price_per_1m": 5,
 
3259
  "hf_private": true
3260
  },
3261
  {
3262
+ "name": "anthropic/claude-haiku-4-5",
3263
  "type": "vision",
3264
  "input_price_per_1m": 1,
3265
+ "output_price_per_1m": 5,
3266
  "currency": "USD",
3267
  "capabilities": [
3268
+ "vision"
 
3269
  ],
3270
  "context_window": 200000,
3271
  "hf_private": true
3272
  },
3273
  {
3274
+ "name": "groq/moonshotai/kimi-k2-instruct",
3275
  "type": "chat",
3276
  "input_price_per_1m": 1,
3277
+ "output_price_per_1m": 3,
3278
  "currency": "USD",
3279
+ "context_window": 131072,
3280
  "capabilities": [
3281
+ "tools"
3282
  ],
3283
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
3284
+ "size_b": 1026.5,
 
3285
  "hf_private": false,
3286
  "hf_validated_at": "2026-03-22T19:23:09.981Z",
3287
  "hf_status": 200
3288
  },
3289
  {
3290
+ "name": "groq/moonshotai/Kimi-K2-Instruct-0905",
3291
+ "type": "chat",
3292
  "input_price_per_1m": 1,
3293
+ "output_price_per_1m": 3,
3294
  "currency": "USD",
3295
+ "context_window": 256000,
3296
  "capabilities": [
3297
+ "tools"
3298
  ],
3299
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
3300
+ "size_b": 1026.5,
3301
+ "hf_private": false,
3302
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
3303
+ "hf_status": 200
3304
  },
3305
  {
3306
  "name": "alibaba/qwen3-coder-plus",
 
3315
  "hf_private": true
3316
  },
3317
  {
3318
+ "name": "perplexity/sonar",
3319
+ "type": "chat",
3320
  "input_price_per_1m": 1,
3321
+ "output_price_per_1m": 1,
3322
  "currency": "USD",
3323
+ "context_window": 131072,
3324
  "capabilities": [
3325
  "vision"
3326
  ],
 
3327
  "hf_private": true
3328
  },
3329
  {
3330
+ "name": "azure/o4-mini",
3331
  "type": "chat",
3332
  "input_price_per_1m": 1.1,
3333
  "output_price_per_1m": 4.4,
 
3339
  "hf_private": true
3340
  },
3341
  {
3342
+ "name": "openai-responses/o3-mini",
3343
  "type": "chat",
3344
  "input_price_per_1m": 1.1,
3345
  "output_price_per_1m": 4.4,
 
3351
  "hf_private": true
3352
  },
3353
  {
3354
+ "name": "openai-responses/o4-mini",
3355
  "type": "chat",
3356
  "input_price_per_1m": 1.1,
3357
  "output_price_per_1m": 4.4,
 
3363
  "hf_private": true
3364
  },
3365
  {
3366
+ "name": "openai/o3-mini",
3367
  "type": "chat",
3368
  "input_price_per_1m": 1.1,
3369
  "output_price_per_1m": 4.4,
 
3374
  "context_window": 200000,
3375
  "hf_private": true
3376
  },
 
 
 
 
 
 
 
 
 
 
3377
  {
3378
  "name": "moonshot/kimi-k2-turbo-preview",
3379
  "type": "chat",
 
3391
  "hf_status": 200
3392
  },
3393
  {
3394
+ "name": "together/Qwen/Qwen2.5-72B-Instruct-Turbo",
3395
+ "type": "chat",
3396
+ "input_price_per_1m": 1.2,
3397
+ "output_price_per_1m": 1.2,
3398
+ "currency": "USD",
3399
+ "context_window": 32768,
3400
+ "size_b": 72,
3401
+ "hf_private": false
3402
+ },
3403
+ {
3404
+ "name": "azure/gpt-5",
3405
+ "type": "chat",
3406
  "input_price_per_1m": 1.25,
3407
  "output_price_per_1m": 10,
3408
  "currency": "USD",
3409
  "capabilities": [
 
3410
  "reasoning"
3411
  ],
3412
+ "context_window": 200000,
3413
  "hf_private": true
3414
  },
3415
  {
3416
+ "name": "azure/gpt-5.1",
3417
+ "type": "chat",
3418
  "input_price_per_1m": 1.25,
3419
  "output_price_per_1m": 10,
3420
  "currency": "USD",
3421
  "capabilities": [
 
3422
  "reasoning"
3423
  ],
3424
+ "context_window": 200000,
3425
  "hf_private": true
3426
  },
3427
  {
3428
+ "name": "openai-responses/gpt-5-codex",
3429
  "type": "vision",
3430
  "input_price_per_1m": 1.25,
3431
  "output_price_per_1m": 10,
 
3438
  "hf_private": true
3439
  },
3440
  {
3441
+ "name": "openai-responses/gpt-5.1",
3442
  "type": "vision",
3443
  "input_price_per_1m": 1.25,
3444
  "output_price_per_1m": 10,
 
3451
  "hf_private": true
3452
  },
3453
  {
3454
+ "name": "openai-responses/gpt-5.1-codex",
3455
  "type": "vision",
3456
  "input_price_per_1m": 1.25,
3457
  "output_price_per_1m": 10,
 
3464
  "hf_private": true
3465
  },
3466
  {
3467
+ "name": "openai-responses/gpt-5",
3468
  "type": "vision",
3469
  "input_price_per_1m": 1.25,
3470
  "output_price_per_1m": 10,
 
3473
  "vision",
3474
  "reasoning"
3475
  ],
3476
+ "context_window": 400000,
3477
  "hf_private": true
3478
  },
3479
  {
3480
+ "name": "vertex/gemini-2.5-pro",
3481
  "type": "vision",
3482
  "input_price_per_1m": 1.25,
3483
  "output_price_per_1m": 10,
 
3486
  "vision",
3487
  "reasoning"
3488
  ],
3489
+ "context_window": 1048576,
3490
  "hf_private": true
3491
  },
3492
  {
 
3503
  "hf_private": true
3504
  },
3505
  {
3506
+ "name": "openai/gpt-5-chat",
3507
  "type": "vision",
3508
  "input_price_per_1m": 1.25,
3509
  "output_price_per_1m": 10,
 
3512
  "vision",
3513
  "reasoning"
3514
  ],
3515
+ "context_window": 128000,
3516
  "hf_private": true
3517
  },
3518
  {
3519
+ "name": "openai/gpt-5.1",
3520
+ "type": "vision",
3521
  "input_price_per_1m": 1.25,
3522
+ "output_price_per_1m": 10,
3523
  "currency": "USD",
 
3524
  "capabilities": [
3525
+ "vision",
3526
  "reasoning"
3527
  ],
3528
+ "context_window": 400000,
3529
+ "hf_private": true
 
 
 
3530
  },
3531
  {
3532
+ "name": "coding/gemini-2.5-pro",
3533
  "type": "vision",
3534
  "input_price_per_1m": 1.25,
3535
  "output_price_per_1m": 10,
 
3542
  "hf_private": true
3543
  },
3544
  {
3545
+ "name": "google/gemini-2.5-pro",
3546
+ "type": "vision",
3547
  "input_price_per_1m": 1.25,
3548
  "output_price_per_1m": 10,
3549
  "currency": "USD",
3550
  "capabilities": [
3551
+ "vision",
3552
  "reasoning"
3553
  ],
3554
+ "context_window": 1048576,
3555
  "hf_private": true
3556
  },
3557
  {
3558
+ "name": "together/deepseek-ai/DeepSeek-V3",
3559
  "type": "chat",
3560
  "input_price_per_1m": 1.25,
3561
+ "output_price_per_1m": 1.25,
3562
  "currency": "USD",
3563
+ "context_window": 131072,
3564
  "capabilities": [
3565
+ "tools",
3566
  "reasoning"
3567
  ],
3568
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3569
+ "size_b": 671,
3570
+ "hf_private": false,
3571
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
3572
+ "hf_status": 200
3573
  },
3574
  {
3575
+ "name": "novita/sao10k/l31-70b-euryale-v2.2",
3576
  "type": "chat",
3577
  "input_price_per_1m": 1.48,
3578
  "output_price_per_1m": 1.48,
 
3582
  "hf_private": false
3583
  },
3584
  {
3585
+ "name": "novita/sao10k/l3-70b-euryale-v2.1",
3586
  "type": "chat",
3587
  "input_price_per_1m": 1.48,
3588
  "output_price_per_1m": 1.48,
 
3604
  "hf_private": true
3605
  },
3606
  {
3607
+ "name": "azure/gpt-5.2",
3608
+ "type": "chat",
3609
  "input_price_per_1m": 1.75,
3610
  "output_price_per_1m": 14,
3611
  "currency": "USD",
3612
  "capabilities": [
 
3613
  "reasoning"
3614
  ],
3615
+ "context_window": 200000,
3616
  "hf_private": true
3617
  },
3618
  {
3619
+ "name": "azure/gpt-5.3-codex",
3620
  "type": "vision",
3621
  "input_price_per_1m": 1.75,
3622
  "output_price_per_1m": 14,
 
3629
  "hf_private": true
3630
  },
3631
  {
3632
+ "name": "azure/openai-responses/gpt-5.2-codex",
3633
  "type": "vision",
3634
  "input_price_per_1m": 1.75,
3635
  "output_price_per_1m": 14,
 
3638
  "vision",
3639
  "reasoning"
3640
  ],
3641
+ "context_window": 400000,
3642
  "hf_private": true
3643
  },
3644
  {
3645
+ "name": "openai-responses/gpt-5.3-chat",
3646
  "type": "vision",
3647
  "input_price_per_1m": 1.75,
3648
  "output_price_per_1m": 14,
 
3651
  "vision",
3652
  "reasoning"
3653
  ],
3654
+ "context_window": 128000,
3655
  "hf_private": true
3656
  },
3657
  {
3658
+ "name": "openai-responses/gpt-5.2",
3659
  "type": "vision",
3660
  "input_price_per_1m": 1.75,
3661
  "output_price_per_1m": 14,
 
3664
  "vision",
3665
  "reasoning"
3666
  ],
3667
+ "context_window": 400000,
3668
  "hf_private": true
3669
  },
3670
  {
3671
+ "name": "openai-responses/gpt-5.2-codex",
3672
  "type": "vision",
3673
  "input_price_per_1m": 1.75,
3674
  "output_price_per_1m": 14,
 
3681
  "hf_private": true
3682
  },
3683
  {
3684
+ "name": "openai-responses/gpt-5.3-codex",
3685
  "type": "vision",
3686
  "input_price_per_1m": 1.75,
3687
  "output_price_per_1m": 14,
 
3690
  "vision",
3691
  "reasoning"
3692
  ],
3693
+ "context_window": 400000,
3694
  "hf_private": true
3695
  },
3696
  {
3697
+ "name": "openai/gpt-5.3-chat",
3698
  "type": "vision",
3699
  "input_price_per_1m": 1.75,
3700
  "output_price_per_1m": 14,
 
3703
  "vision",
3704
  "reasoning"
3705
  ],
3706
+ "context_window": 128000,
3707
  "hf_private": true
3708
  },
3709
  {
3710
+ "name": "openai/gpt-5.2",
3711
+ "type": "vision",
3712
  "input_price_per_1m": 1.75,
3713
  "output_price_per_1m": 14,
3714
  "currency": "USD",
3715
  "capabilities": [
3716
+ "vision",
3717
  "reasoning"
3718
  ],
3719
+ "context_window": 400000,
3720
  "hf_private": true
3721
  },
3722
  {
3723
+ "name": "openai/gpt-5.2-chat",
3724
  "type": "vision",
3725
  "input_price_per_1m": 1.75,
3726
  "output_price_per_1m": 14,
 
3729
  "vision",
3730
  "reasoning"
3731
  ],
 
 
 
 
 
 
 
 
 
3732
  "context_window": 128000,
3733
  "hf_private": true
3734
  },
3735
  {
3736
+ "name": "azure/openai-responses/gpt-4.1",
3737
+ "type": "vision",
3738
  "input_price_per_1m": 2,
3739
  "output_price_per_1m": 8,
3740
  "currency": "USD",
 
3741
  "capabilities": [
3742
+ "vision"
 
3743
  ],
3744
+ "context_window": 1047576,
3745
  "hf_private": true
3746
  },
3747
  {
3748
+ "name": "azure/gpt-4.1",
3749
  "type": "vision",
3750
  "input_price_per_1m": 2,
3751
+ "output_price_per_1m": 8,
3752
  "currency": "USD",
3753
  "capabilities": [
3754
+ "vision"
 
3755
  ],
3756
+ "context_window": 1047576,
3757
  "hf_private": true
3758
  },
3759
  {
3760
+ "name": "mistral/pixtral-large-latest",
3761
  "type": "chat",
3762
  "input_price_per_1m": 2,
3763
+ "output_price_per_1m": 5,
3764
  "currency": "USD",
3765
  "context_window": 131072,
3766
  "hf_private": true
3767
  },
3768
  {
3769
+ "name": "openai-responses/gpt-4.1",
3770
  "type": "vision",
3771
  "input_price_per_1m": 2,
3772
+ "output_price_per_1m": 8,
3773
  "currency": "USD",
3774
  "capabilities": [
3775
+ "vision"
 
3776
  ],
3777
+ "context_window": 1047576,
3778
  "hf_private": true
3779
  },
3780
  {
3781
+ "name": "vertex/gemini-3-pro-preview",
3782
  "type": "vision",
3783
  "input_price_per_1m": 2,
3784
  "output_price_per_1m": 12,
 
3791
  "hf_private": true
3792
  },
3793
  {
3794
+ "name": "vertex/gemini-3.1-pro-preview",
3795
+ "type": "vision",
3796
  "input_price_per_1m": 2,
3797
+ "output_price_per_1m": 12,
3798
  "currency": "USD",
3799
+ "capabilities": [
3800
+ "vision",
3801
+ "reasoning"
3802
+ ],
3803
+ "context_window": 1048576,
3804
  "hf_private": true
3805
  },
3806
  {
3807
+ "name": "vertex/gemini-3-pro-image-preview",
3808
  "type": "vision",
3809
  "input_price_per_1m": 2,
3810
+ "output_price_per_1m": 12,
3811
  "currency": "USD",
3812
  "capabilities": [
3813
+ "vision",
3814
+ "reasoning"
3815
  ],
3816
+ "context_window": 1048576,
3817
  "hf_private": true
3818
  },
3819
  {
 
3842
  "hf_private": true
3843
  },
3844
  {
3845
+ "name": "xai/grok-4.2-beta",
3846
  "type": "vision",
3847
  "input_price_per_1m": 2,
3848
+ "output_price_per_1m": 6,
3849
  "currency": "USD",
3850
  "capabilities": [
3851
  "vision",
3852
  "reasoning"
3853
  ],
3854
+ "context_window": 2000000,
3855
  "hf_private": true
3856
  },
3857
  {
3858
+ "name": "xai/grok-2-1212",
3859
+ "type": "chat",
3860
+ "input_price_per_1m": 2,
3861
+ "output_price_per_1m": 10,
3862
+ "currency": "USD",
3863
+ "context_window": 131072,
3864
+ "hf_private": true
3865
+ },
3866
+ {
3867
+ "name": "google/gemini-3.1-pro-preview",
3868
  "type": "vision",
3869
  "input_price_per_1m": 2,
3870
  "output_price_per_1m": 12,
 
3877
  "hf_private": true
3878
  },
3879
  {
3880
+ "name": "google/gemini-3-pro-preview",
3881
  "type": "vision",
3882
  "input_price_per_1m": 2,
3883
  "output_price_per_1m": 12,
 
3890
  "hf_private": true
3891
  },
3892
  {
3893
+ "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3894
+ "type": "chat",
3895
  "input_price_per_1m": 2,
3896
+ "output_price_per_1m": 6,
3897
  "currency": "USD",
3898
+ "context_window": 128000,
 
 
 
3899
  "hf_private": true
3900
  },
3901
  {
3902
+ "name": "perplexity/sonar-reasoning-pro",
3903
+ "type": "chat",
3904
  "input_price_per_1m": 2,
3905
  "output_price_per_1m": 8,
3906
  "currency": "USD",
3907
+ "context_window": 131072,
3908
  "capabilities": [
3909
+ "vision",
3910
+ "reasoning"
3911
  ],
 
3912
  "hf_private": true
3913
  },
3914
  {
3915
+ "name": "azure/openai-responses/gpt-5.4",
3916
  "type": "vision",
3917
  "input_price_per_1m": 2.5,
3918
  "output_price_per_1m": 15,
 
3925
  "hf_private": true
3926
  },
3927
  {
3928
+ "name": "openai-responses/gpt-5.4",
3929
  "type": "vision",
3930
  "input_price_per_1m": 2.5,
3931
  "output_price_per_1m": 15,
 
3950
  "hf_private": true
3951
  },
3952
  {
3953
+ "name": "openai/gpt-4o-2024-11-20",
 
 
 
 
 
 
 
 
 
 
 
 
3954
  "type": "vision",
3955
  "input_price_per_1m": 2.5,
3956
  "output_price_per_1m": 10,
 
3962
  "hf_private": true
3963
  },
3964
  {
3965
+ "name": "openai/gpt-4o-2024-05-13",
3966
  "type": "vision",
3967
  "input_price_per_1m": 2.5,
3968
  "output_price_per_1m": 10,
 
3974
  "hf_private": true
3975
  },
3976
  {
3977
+ "name": "openai/gpt-5.4",
3978
  "type": "vision",
3979
  "input_price_per_1m": 2.5,
3980
  "output_price_per_1m": 15,
 
3987
  "hf_private": true
3988
  },
3989
  {
3990
+ "name": "openai/gpt-4o",
3991
+ "type": "vision",
3992
+ "input_price_per_1m": 2.5,
3993
+ "output_price_per_1m": 10,
3994
  "currency": "USD",
 
3995
  "capabilities": [
3996
  "vision"
3997
  ],
3998
+ "context_window": 128000,
3999
  "hf_private": true
4000
  },
4001
  {
4002
+ "name": "vertex/claude-3-5-sonnet",
4003
  "type": "vision",
4004
  "input_price_per_1m": 3,
4005
  "output_price_per_1m": 15,
 
4007
  "capabilities": [
4008
  "vision"
4009
  ],
4010
+ "context_window": 200000,
4011
  "hf_private": true
4012
  },
4013
  {
4014
+ "name": "vertex/claude-sonnet-4",
4015
  "type": "vision",
4016
  "input_price_per_1m": 3,
4017
  "output_price_per_1m": 15,
 
4020
  "vision",
4021
  "reasoning"
4022
  ],
4023
+ "context_window": 200000,
4024
  "hf_private": true
4025
  },
4026
  {
4027
+ "name": "vertex/claude-sonnet-4-5",
4028
  "type": "vision",
4029
  "input_price_per_1m": 3,
4030
  "output_price_per_1m": 15,
 
4033
  "vision",
4034
  "reasoning"
4035
  ],
4036
+ "context_window": 200000,
4037
  "hf_private": true
4038
  },
4039
  {
4040
+ "name": "vertex/claude-3-7-sonnet",
4041
  "type": "vision",
4042
  "input_price_per_1m": 3,
4043
  "output_price_per_1m": 15,
 
4046
  "vision",
4047
  "reasoning"
4048
  ],
4049
+ "context_window": 200000,
4050
  "hf_private": true
4051
  },
4052
  {
4053
+ "name": "xai/grok-4",
4054
  "type": "vision",
4055
  "input_price_per_1m": 3,
4056
  "output_price_per_1m": 15,
4057
  "currency": "USD",
4058
  "capabilities": [
4059
+ "vision"
 
4060
  ],
4061
+ "context_window": 256000,
4062
  "hf_private": true
4063
  },
4064
  {
4065
+ "name": "coding/claude-sonnet-4-20250514",
4066
  "type": "vision",
4067
  "input_price_per_1m": 3,
4068
  "output_price_per_1m": 15,
 
4075
  "hf_private": true
4076
  },
4077
  {
4078
+ "name": "bedrock/claude-sonnet-4",
4079
  "type": "vision",
4080
  "input_price_per_1m": 3,
4081
  "output_price_per_1m": 15,
 
4084
  "vision",
4085
  "reasoning"
4086
  ],
4087
+ "context_window": 200000,
4088
  "hf_private": true
4089
  },
4090
  {
 
4101
  "hf_private": true
4102
  },
4103
  {
4104
+ "name": "bedrock/claude-sonnet-4-6",
4105
  "type": "vision",
4106
  "input_price_per_1m": 3,
4107
  "output_price_per_1m": 15,
 
4110
  "vision",
4111
  "reasoning"
4112
  ],
4113
+ "context_window": 1000000,
4114
  "hf_private": true
4115
  },
4116
  {
4117
+ "name": "bedrock/claude-3-7-sonnet",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4118
  "type": "vision",
4119
  "input_price_per_1m": 3,
4120
  "output_price_per_1m": 15,
4121
  "currency": "USD",
4122
  "capabilities": [
4123
+ "vision",
4124
+ "reasoning"
4125
  ],
4126
  "context_window": 200000,
4127
  "hf_private": true
4128
  },
4129
  {
4130
+ "name": "anthropic/claude-sonnet-4",
4131
  "type": "vision",
4132
  "input_price_per_1m": 3,
4133
  "output_price_per_1m": 15,
 
4136
  "vision",
4137
  "reasoning"
4138
  ],
4139
+ "context_window": 1000000,
4140
  "hf_private": true
4141
  },
4142
  {
4143
+ "name": "anthropic/claude-sonnet-4-6",
4144
  "type": "vision",
4145
  "input_price_per_1m": 3,
4146
  "output_price_per_1m": 15,
 
4149
  "vision",
4150
  "reasoning"
4151
  ],
4152
+ "context_window": 1000000,
4153
  "hf_private": true
4154
  },
4155
  {
4156
+ "name": "anthropic/claude-sonnet-4-5",
4157
  "type": "vision",
4158
  "input_price_per_1m": 3,
4159
  "output_price_per_1m": 15,
 
4162
  "vision",
4163
  "reasoning"
4164
  ],
4165
+ "context_window": 1000000,
4166
  "hf_private": true
4167
  },
4168
  {
4169
+ "name": "together/deepseek-ai/DeepSeek-R1",
4170
  "type": "chat",
4171
+ "input_price_per_1m": 3,
4172
+ "output_price_per_1m": 7,
4173
  "currency": "USD",
4174
  "context_window": 64000,
4175
  "capabilities": [
 
4184
  "hf_status": 200
4185
  },
4186
  {
4187
+ "name": "perplexity/sonar-pro",
4188
  "type": "chat",
4189
+ "input_price_per_1m": 3,
4190
+ "output_price_per_1m": 15,
4191
  "currency": "USD",
4192
+ "context_window": 204800,
4193
  "capabilities": [
4194
+ "vision"
4195
  ],
4196
  "hf_private": true
4197
  },
4198
  {
4199
+ "name": "novita/deepseek/deepseek-r1",
4200
+ "type": "chat",
4201
+ "input_price_per_1m": 4,
4202
+ "output_price_per_1m": 4,
4203
+ "currency": "USD",
4204
+ "context_window": 64000,
4205
+ "capabilities": [
4206
+ "tools",
4207
+ "reasoning"
4208
+ ],
4209
+ "hf_id": "deepseek-ai/DeepSeek-R1",
4210
+ "size_b": 671,
4211
+ "size_source": "manual",
4212
+ "hf_private": false,
4213
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
4214
+ "hf_status": 200
4215
+ },
4216
+ {
4217
+ "name": "vertex/claude-opus-4-5",
4218
  "type": "vision",
4219
  "input_price_per_1m": 5,
4220
  "output_price_per_1m": 25,
 
4227
  "hf_private": true
4228
  },
4229
  {
4230
+ "name": "vertex/claude-opus-4-6",
4231
  "type": "vision",
4232
  "input_price_per_1m": 5,
4233
  "output_price_per_1m": 25,
 
4251
  "context_window": 128000,
4252
  "hf_private": true
4253
  },
4254
+ {
4255
+ "name": "xai/grok-3",
4256
+ "type": "chat",
4257
+ "input_price_per_1m": 5,
4258
+ "output_price_per_1m": 25,
4259
+ "currency": "USD",
4260
+ "context_window": 131072,
4261
+ "capabilities": [
4262
+ "tools"
4263
+ ],
4264
+ "hf_private": true
4265
+ },
4266
  {
4267
  "name": "bedrock/claude-opus-4-5",
4268
  "type": "vision",
 
4290
  "hf_private": true
4291
  },
4292
  {
4293
+ "name": "anthropic/claude-opus-4-5",
4294
  "type": "vision",
4295
  "input_price_per_1m": 5,
4296
  "output_price_per_1m": 25,
 
4299
  "vision",
4300
  "reasoning"
4301
  ],
4302
+ "context_window": 200000,
4303
  "hf_private": true
4304
  },
4305
  {
4306
+ "name": "anthropic/claude-opus-4-6",
4307
  "type": "vision",
4308
  "input_price_per_1m": 5,
4309
  "output_price_per_1m": 25,
 
4312
  "vision",
4313
  "reasoning"
4314
  ],
4315
+ "context_window": 1000000,
4316
  "hf_private": true
4317
  },
4318
  {
 
4329
  "hf_private": true
4330
  },
4331
  {
4332
+ "name": "openai-responses/gpt-5-pro",
4333
  "type": "vision",
4334
  "input_price_per_1m": 15,
4335
+ "output_price_per_1m": 120,
4336
  "currency": "USD",
4337
  "capabilities": [
4338
  "vision",
4339
  "reasoning"
4340
  ],
4341
+ "context_window": 400000,
4342
  "hf_private": true
4343
  },
4344
  {
4345
+ "name": "vertex/claude-opus-4",
4346
  "type": "vision",
4347
  "input_price_per_1m": 15,
4348
  "output_price_per_1m": 75,
 
4355
  "hf_private": true
4356
  },
4357
  {
4358
+ "name": "vertex/claude-opus-4-1",
4359
  "type": "vision",
4360
  "input_price_per_1m": 15,
4361
+ "output_price_per_1m": 75,
4362
  "currency": "USD",
4363
  "capabilities": [
4364
  "vision",
4365
  "reasoning"
4366
  ],
4367
+ "context_window": 200000,
4368
  "hf_private": true
4369
  },
4370
  {
 
4381
  "hf_private": true
4382
  },
4383
  {
4384
+ "name": "coding/claude-opus-4-20250514",
4385
  "type": "vision",
4386
  "input_price_per_1m": 15,
4387
  "output_price_per_1m": 75,
 
4394
  "hf_private": true
4395
  },
4396
  {
4397
+ "name": "bedrock/claude-opus-4",
4398
  "type": "vision",
4399
  "input_price_per_1m": 15,
4400
  "output_price_per_1m": 75,
 
4407
  "hf_private": true
4408
  },
4409
  {
4410
+ "name": "anthropic/claude-opus-4-1",
4411
  "type": "vision",
4412
  "input_price_per_1m": 15,
4413
  "output_price_per_1m": 75,
 
4420
  "hf_private": true
4421
  },
4422
  {
4423
+ "name": "anthropic/claude-opus-4",
4424
  "type": "vision",
4425
  "input_price_per_1m": 15,
4426
  "output_price_per_1m": 75,
 
4446
  "hf_private": true
4447
  },
4448
  {
4449
+ "name": "azure/openai-responses/gpt-5.4-pro",
4450
  "type": "vision",
4451
  "input_price_per_1m": 30,
4452
  "output_price_per_1m": 180,
 
4459
  "hf_private": true
4460
  },
4461
  {
4462
+ "name": "openai-responses/gpt-5.4-pro",
4463
  "type": "vision",
4464
  "input_price_per_1m": 30,
4465
  "output_price_per_1m": 180,
 
4472
  "hf_private": true
4473
  },
4474
  {
4475
+ "name": "openai/gpt-5.4-pro",
4476
  "type": "vision",
4477
  "input_price_per_1m": 30,
4478
  "output_price_per_1m": 180,
 
5052
  "currency": "USD",
5053
  "size_b": 405,
5054
  "flavor": "base",
5055
+ "hf_private": false,
5056
+ "hf_id": "NousResearch/Hermes-3-Llama-3.1-405B",
5057
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
5058
+ "hf_status": 200
5059
  },
5060
  {
5061
  "name": "gemma-3-27b-it",
 
5299
  "output_price_per_1m": 2,
5300
  "currency": "EUR",
5301
  "size_b": 123,
5302
+ "hf_private": false,
5303
+ "size_source": "manual",
5304
+ "hf_id": "mistralai/Devstral-2-123B-Instruct-2512",
5305
+ "capabilities": [
5306
+ "tools"
5307
+ ],
5308
+ "hf_validated_at": "2026-03-22T19:23:09.981Z",
5309
+ "hf_status": 200
5310
  },
5311
  {
5312
  "name": "whisper-large-v3",
scripts/fetch-providers.js CHANGED
@@ -248,6 +248,8 @@ const MANUAL_HF_ID_MAP = {
248
  'magistral small': 'mistralai/Magistral-Small-2506',
249
  'pixtral large': 'mistralai/Pixtral-Large-Instruct-2411',
250
  'hermes 3 llama 3.1 405b': 'NousResearch/Hermes-3-Llama-3.1-405B',
 
 
251
  };
252
 
253
  const MANUAL_OLLAMA_ID_MAP = {
 
248
  'magistral small': 'mistralai/Magistral-Small-2506',
249
  'pixtral large': 'mistralai/Pixtral-Large-Instruct-2411',
250
  'hermes 3 llama 3.1 405b': 'NousResearch/Hermes-3-Llama-3.1-405B',
251
+ 'hermes 3 llama 3.1 405b base': 'NousResearch/Hermes-3-Llama-3.1-405B',
252
+ 'devstral 2 123b instruct 2512': 'mistralai/Devstral-2-123B-Instruct-2512',
253
  };
254
 
255
  const MANUAL_OLLAMA_ID_MAP = {