CrispStrobe commited on
Commit
128b3b8
·
1 Parent(s): 901bb12

fix: resolve minified HF metadata by fetching raw config.json; improved BERT-style param estimation

Browse files
Files changed (2) hide show
  1. data/providers.json +693 -673
  2. scripts/fetch-providers.js +44 -12
data/providers.json CHANGED
@@ -133,7 +133,8 @@
133
  "input_price_per_1m": 0.015,
134
  "output_price_per_1m": 0,
135
  "currency": "USD",
136
- "hf_id": "BAAI/bge-large-en-v1.5"
 
137
  },
138
  {
139
  "name": "bge-m3",
@@ -251,7 +252,8 @@
251
  "input_price_per_1m": 0.065,
252
  "output_price_per_1m": 0,
253
  "currency": "CHF",
254
- "hf_id": "BAAI/bge-multilingual-gemma2"
 
255
  },
256
  {
257
  "name": "All MiniLM L12 v2",
@@ -277,7 +279,8 @@
277
  "input_price_per_1m": 0.006,
278
  "output_price_per_1m": 0,
279
  "currency": "CHF",
280
- "hf_id": "openai/whisper-large-v3"
 
281
  },
282
  {
283
  "name": "Photomaker V2",
@@ -342,7 +345,8 @@
342
  ],
343
  "size_b": 122.61,
344
  "hf_id": "mistralai/Mistral-Large-Instruct-2411",
345
- "hf_private": true
 
346
  },
347
  {
348
  "name": "GPT-5.4 Thinking",
@@ -484,7 +488,8 @@
484
  ],
485
  "size_b": 122.61,
486
  "hf_id": "mistralai/Mistral-Large-Instruct-2411",
487
- "hf_private": true
 
488
  },
489
  {
490
  "name": "Llama 4 Maverick",
@@ -1049,22 +1054,22 @@
1049
  "eu_endpoints": true,
1050
  "models": [
1051
  {
1052
- "name": "novita/meta-llama/llama-3.2-1b-instruct",
1053
  "type": "chat",
1054
  "input_price_per_1m": 0.02,
1055
- "output_price_per_1m": 0.02,
1056
  "currency": "USD",
1057
- "context_window": 131000,
1058
- "size_b": 1
1059
  },
1060
  {
1061
- "name": "deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
1062
  "type": "chat",
1063
  "input_price_per_1m": 0.02,
1064
- "output_price_per_1m": 0.05,
1065
  "currency": "USD",
1066
- "context_window": 131072,
1067
- "size_b": 8
1068
  },
1069
  {
1070
  "name": "openai/gpt-5-nano",
@@ -1102,26 +1107,28 @@
1102
  "hf_id": "meta-llama/Meta-Llama-3-8B-Instruct"
1103
  },
1104
  {
1105
- "name": "novita/sao10k/l3-8b-lunaris",
1106
- "type": "chat",
1107
  "input_price_per_1m": 0.05,
1108
- "output_price_per_1m": 0.05,
1109
  "currency": "USD",
1110
- "context_window": 8192,
1111
- "size_b": 8
 
 
 
1112
  },
1113
  {
1114
- "name": "novita/meta-llama/llama-3.1-8b-instruct",
1115
  "type": "chat",
1116
  "input_price_per_1m": 0.05,
1117
- "output_price_per_1m": 0.05,
1118
  "currency": "USD",
1119
- "context_window": 16384,
1120
- "size_b": 8,
1121
  "capabilities": [
1122
  "tools"
1123
  ],
1124
- "hf_id": "meta-llama/Meta-Llama-3.1-8B-Instruct"
1125
  },
1126
  {
1127
  "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
@@ -1133,28 +1140,26 @@
1133
  "size_b": 8
1134
  },
1135
  {
1136
- "name": "azure/gpt-5-nano",
1137
- "type": "vision",
1138
  "input_price_per_1m": 0.05,
1139
- "output_price_per_1m": 0.4,
1140
  "currency": "USD",
1141
- "capabilities": [
1142
- "reasoning"
1143
- ],
1144
- "context_window": 200000,
1145
- "hf_private": true
1146
  },
1147
  {
1148
- "name": "alibaba/qwen-turbo",
1149
  "type": "chat",
1150
  "input_price_per_1m": 0.05,
1151
- "output_price_per_1m": 0.2,
1152
  "currency": "USD",
1153
- "context_window": 1000000,
 
1154
  "capabilities": [
1155
  "tools"
1156
  ],
1157
- "hf_private": true
1158
  },
1159
  {
1160
  "name": "openai-responses/gpt-5-nano",
@@ -1206,27 +1211,31 @@
1206
  "size_b": 13
1207
  },
1208
  {
1209
- "name": "together/meta-llama/Meta-Llama-3-8B-Instruct-Lite",
1210
  "type": "chat",
1211
  "input_price_per_1m": 0.1,
1212
- "output_price_per_1m": 0.1,
1213
  "currency": "USD",
1214
- "context_window": 8192,
1215
- "size_b": 8
 
 
 
 
 
1216
  },
1217
  {
1218
- "name": "groq/openai/gpt-oss-20b",
1219
  "type": "chat",
1220
  "input_price_per_1m": 0.1,
1221
- "output_price_per_1m": 0.5,
1222
  "currency": "USD",
1223
  "context_window": 131072,
1224
- "size_b": 20,
1225
  "capabilities": [
1226
- "tools",
1227
- "reasoning"
1228
  ],
1229
- "hf_id": "openai/gpt-oss-20b"
 
1230
  },
1231
  {
1232
  "name": "mistral/mistral-small-2503",
@@ -1251,33 +1260,21 @@
1251
  "size_b": 24
1252
  },
1253
  {
1254
- "name": "mistral/devstral-small-latest",
1255
  "type": "chat",
1256
  "input_price_per_1m": 0.1,
1257
- "output_price_per_1m": 0.3,
1258
  "currency": "USD",
1259
  "context_window": 131072,
 
1260
  "capabilities": [
1261
- "tools"
1262
- ],
1263
- "hf_id": "mistralai/Devstral-Small-2507",
1264
- "size_b": 24
1265
- },
1266
- {
1267
- "name": "vertex/gemini-2.5-flash-lite",
1268
- "type": "vision",
1269
- "input_price_per_1m": 0.1,
1270
- "output_price_per_1m": 0.4,
1271
- "currency": "USD",
1272
- "capabilities": [
1273
- "vision",
1274
  "reasoning"
1275
  ],
1276
- "context_window": 1048576,
1277
- "hf_private": true
1278
  },
1279
  {
1280
- "name": "azure/gpt-4.1-nano",
1281
  "type": "vision",
1282
  "input_price_per_1m": 0.1,
1283
  "output_price_per_1m": 0.4,
@@ -1289,7 +1286,7 @@
1289
  "hf_private": true
1290
  },
1291
  {
1292
- "name": "azure/openai-responses/gpt-4.1-nano",
1293
  "type": "vision",
1294
  "input_price_per_1m": 0.1,
1295
  "output_price_per_1m": 0.4,
@@ -1301,7 +1298,7 @@
1301
  "hf_private": true
1302
  },
1303
  {
1304
- "name": "google/gemini-2.5-flash-lite",
1305
  "type": "vision",
1306
  "input_price_per_1m": 0.1,
1307
  "output_price_per_1m": 0.4,
@@ -1313,6 +1310,15 @@
1313
  "context_window": 1048576,
1314
  "hf_private": true
1315
  },
 
 
 
 
 
 
 
 
 
1316
  {
1317
  "name": "google/gemini-2.0-flash-001",
1318
  "type": "vision",
@@ -1326,18 +1332,17 @@
1326
  "hf_private": true
1327
  },
1328
  {
1329
- "name": "deepinfra/Qwen/Qwen3-32B",
1330
- "type": "chat",
1331
  "input_price_per_1m": 0.1,
1332
- "output_price_per_1m": 0.3,
1333
  "currency": "USD",
1334
- "context_window": 40000,
1335
- "size_b": 32,
1336
  "capabilities": [
1337
- "tools",
1338
  "reasoning"
1339
  ],
1340
- "hf_id": "Qwen/Qwen3-32B"
 
1341
  },
1342
  {
1343
  "name": "openai-responses/gpt-4.1-nano",
@@ -1411,34 +1416,6 @@
1411
  "context_window": 8192,
1412
  "size_b": 8
1413
  },
1414
- {
1415
- "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
1416
- "type": "chat",
1417
- "input_price_per_1m": 0.15,
1418
- "output_price_per_1m": 0.15,
1419
- "currency": "USD",
1420
- "context_window": 128000,
1421
- "size_b": 14,
1422
- "capabilities": [
1423
- "tools",
1424
- "reasoning"
1425
- ],
1426
- "hf_id": "deepseek-ai/DeepSeek-R1"
1427
- },
1428
- {
1429
- "name": "groq/openai/gpt-oss-120b",
1430
- "type": "chat",
1431
- "input_price_per_1m": 0.15,
1432
- "output_price_per_1m": 0.75,
1433
- "currency": "USD",
1434
- "context_window": 131072,
1435
- "size_b": 120,
1436
- "capabilities": [
1437
- "tools",
1438
- "reasoning"
1439
- ],
1440
- "hf_id": "openai/gpt-oss-120b"
1441
- },
1442
  {
1443
  "name": "mistral/mistral-small-2603",
1444
  "type": "vision",
@@ -1476,16 +1453,18 @@
1476
  "size_b": 235
1477
  },
1478
  {
1479
- "name": "openai/gpt-4o-mini",
1480
- "type": "vision",
1481
  "input_price_per_1m": 0.15,
1482
- "output_price_per_1m": 0.6,
1483
  "currency": "USD",
 
 
1484
  "capabilities": [
1485
- "vision"
 
1486
  ],
1487
- "context_window": 128000,
1488
- "hf_private": true
1489
  },
1490
  {
1491
  "name": "nebius/openai/gpt-oss-120b",
@@ -1500,6 +1479,32 @@
1500
  "size_b": 120,
1501
  "hf_id": "openai/gpt-oss-120b"
1502
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1503
  {
1504
  "name": "novita/mistralai/mistral-nemo",
1505
  "type": "chat",
@@ -1522,43 +1527,6 @@
1522
  "context_window": 131072,
1523
  "size_b": 8
1524
  },
1525
- {
1526
- "name": "together/meta-llama/LlamaGuard-2-8b",
1527
- "type": "chat",
1528
- "input_price_per_1m": 0.2,
1529
- "output_price_per_1m": 0.2,
1530
- "currency": "USD",
1531
- "context_window": 8192,
1532
- "size_b": 8
1533
- },
1534
- {
1535
- "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1536
- "type": "vision",
1537
- "input_price_per_1m": 0.2,
1538
- "output_price_per_1m": 0.85,
1539
- "currency": "USD",
1540
- "context_window": 1048576,
1541
- "size_b": 17,
1542
- "capabilities": [
1543
- "vision",
1544
- "tools"
1545
- ],
1546
- "hf_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct"
1547
- },
1548
- {
1549
- "name": "novita/qwen/qwen3-235b-a22b-fp8",
1550
- "type": "chat",
1551
- "input_price_per_1m": 0.2,
1552
- "output_price_per_1m": 0.8,
1553
- "currency": "USD",
1554
- "context_window": 128000,
1555
- "size_b": 235,
1556
- "capabilities": [
1557
- "tools",
1558
- "reasoning"
1559
- ],
1560
- "hf_id": "Qwen/Qwen3-235B-A22B"
1561
- },
1562
  {
1563
  "name": "deepinfra/Qwen/Qwen3-235B-A22B",
1564
  "type": "chat",
@@ -1601,29 +1569,57 @@
1601
  "hf_id": "Qwen/Qwen3-30B-A3B-Instruct-2507"
1602
  },
1603
  {
1604
- "name": "xai/grok-4-fast",
1605
  "type": "vision",
1606
  "input_price_per_1m": 0.2,
1607
- "output_price_per_1m": 0.5,
1608
  "currency": "USD",
1609
- "context_window": 2000000,
 
1610
  "capabilities": [
1611
  "vision",
1612
- "tools",
1613
- "reasoning"
1614
  ],
1615
- "hf_private": true
1616
  },
1617
  {
1618
- "name": "xai/grok-4-1-fast-reasoning",
1619
- "type": "vision",
1620
- "input_price_per_1m": 0.2,
1621
- "output_price_per_1m": 0.5,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1622
  "currency": "USD",
1623
  "capabilities": [
1624
  "vision"
1625
  ],
 
 
 
 
 
 
 
 
 
1626
  "context_window": 2000000,
 
 
 
 
 
1627
  "hf_private": true
1628
  },
1629
  {
@@ -1653,17 +1649,26 @@
1653
  "hf_private": true
1654
  },
1655
  {
1656
- "name": "xai/grok-code-fast-1",
1657
  "type": "vision",
1658
  "input_price_per_1m": 0.2,
1659
- "output_price_per_1m": 1.5,
1660
  "currency": "USD",
1661
  "capabilities": [
1662
  "vision"
1663
  ],
1664
- "context_window": 256000,
1665
  "hf_private": true
1666
  },
 
 
 
 
 
 
 
 
 
1667
  {
1668
  "name": "openai-responses/gpt-5.4-nano",
1669
  "type": "vision",
@@ -1691,52 +1696,52 @@
1691
  "hf_private": true
1692
  },
1693
  {
1694
- "name": "deepinfra/Qwen/Qwen2.5-72B-Instruct",
1695
- "type": "vision",
1696
  "input_price_per_1m": 0.23,
1697
- "output_price_per_1m": 0.4,
1698
  "currency": "USD",
1699
- "context_window": 131072,
1700
- "size_b": 72,
1701
  "capabilities": [
1702
- "vision"
1703
  ],
1704
- "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct"
1705
  },
1706
  {
1707
- "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct",
1708
  "type": "chat",
1709
  "input_price_per_1m": 0.23,
1710
  "output_price_per_1m": 0.4,
1711
  "currency": "USD",
1712
- "context_window": 131072,
1713
- "size_b": 70,
1714
- "capabilities": [
1715
- "tools"
1716
- ],
1717
- "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
1718
  },
1719
  {
1720
- "name": "deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1721
  "type": "chat",
1722
  "input_price_per_1m": 0.23,
1723
- "output_price_per_1m": 0.69,
1724
  "currency": "USD",
1725
- "context_window": 64000,
1726
  "size_b": 70,
1727
  "capabilities": [
1728
- "reasoning"
1729
  ],
1730
- "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B"
1731
  },
1732
  {
1733
- "name": "deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct",
1734
- "type": "chat",
1735
  "input_price_per_1m": 0.23,
1736
  "output_price_per_1m": 0.4,
1737
  "currency": "USD",
1738
- "context_window": 130815,
1739
- "size_b": 70
 
 
 
 
1740
  },
1741
  {
1742
  "name": "mistral/open-mistral-7b",
@@ -1748,27 +1753,27 @@
1748
  "size_b": 7
1749
  },
1750
  {
1751
- "name": "vertex/gemini-3.1-flash-lite-preview",
1752
  "type": "vision",
1753
  "input_price_per_1m": 0.25,
1754
- "output_price_per_1m": 1.5,
1755
  "currency": "USD",
1756
  "capabilities": [
1757
- "vision"
1758
  ],
1759
- "context_window": 1048576,
1760
  "hf_private": true
1761
  },
1762
  {
1763
- "name": "azure/gpt-5-mini",
1764
  "type": "vision",
1765
  "input_price_per_1m": 0.25,
1766
- "output_price_per_1m": 2,
1767
  "currency": "USD",
1768
  "capabilities": [
1769
- "reasoning"
1770
  ],
1771
- "context_window": 200000,
1772
  "hf_private": true
1773
  },
1774
  {
@@ -1832,57 +1837,51 @@
1832
  "hf_private": true
1833
  },
1834
  {
1835
- "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
1836
  "type": "chat",
1837
  "input_price_per_1m": 0.3,
1838
- "output_price_per_1m": 0.3,
1839
  "currency": "USD",
1840
- "context_window": 32768,
1841
- "size_b": 7
 
 
 
 
 
1842
  },
1843
  {
1844
- "name": "novita/minimax-m2.7",
1845
- "type": "vision",
1846
  "input_price_per_1m": 0.3,
1847
- "output_price_per_1m": 1.2,
1848
  "currency": "USD",
1849
- "capabilities": [
1850
- "vision",
1851
- "reasoning"
1852
- ],
1853
- "context_window": 200000,
1854
- "hf_id": "MiniMaxAI/MiniMax-M2.7",
1855
  "hf_private": true
1856
  },
1857
  {
1858
- "name": "novita/deepseek/deepseek-r1-distill-qwen-32b",
1859
  "type": "chat",
1860
  "input_price_per_1m": 0.3,
1861
- "output_price_per_1m": 0.3,
1862
  "currency": "USD",
1863
- "context_window": 12800,
1864
- "size_b": 32,
1865
- "capabilities": [
1866
- "reasoning"
1867
- ],
1868
- "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
1869
  },
1870
  {
1871
- "name": "novita/MiniMax-M2.7",
1872
  "type": "vision",
1873
  "input_price_per_1m": 0.3,
1874
- "output_price_per_1m": 1.2,
1875
  "currency": "USD",
1876
  "capabilities": [
1877
- "vision",
1878
- "reasoning"
1879
  ],
1880
- "context_window": 200000,
1881
- "hf_id": "MiniMaxAI/MiniMax-M2.7",
1882
  "hf_private": true
1883
  },
1884
  {
1885
- "name": "coding/gemini-2.5-flash",
1886
  "type": "vision",
1887
  "input_price_per_1m": 0.3,
1888
  "output_price_per_1m": 2.5,
@@ -1895,16 +1894,7 @@
1895
  "hf_private": true
1896
  },
1897
  {
1898
- "name": "mistral/codestral-latest",
1899
- "type": "chat",
1900
- "input_price_per_1m": 0.3,
1901
- "output_price_per_1m": 0.9,
1902
- "currency": "USD",
1903
- "context_window": 131072,
1904
- "hf_private": true
1905
- },
1906
- {
1907
- "name": "vertex/gemini-2.5-flash",
1908
  "type": "vision",
1909
  "input_price_per_1m": 0.3,
1910
  "output_price_per_1m": 2.5,
@@ -1917,64 +1907,70 @@
1917
  "hf_private": true
1918
  },
1919
  {
1920
- "name": "vertex/gemini-2.5-flash-image",
1921
- "type": "vision",
1922
  "input_price_per_1m": 0.3,
1923
- "output_price_per_1m": 2.5,
1924
  "currency": "USD",
1925
  "capabilities": [
1926
- "vision",
1927
  "reasoning"
1928
  ],
1929
- "context_window": 1048576,
1930
- "hf_private": true
 
1931
  },
1932
  {
1933
- "name": "parasail/parasail-gemma3-27b-it",
1934
  "type": "chat",
1935
  "input_price_per_1m": 0.3,
1936
- "output_price_per_1m": 0.5,
1937
  "currency": "USD",
1938
- "context_window": 128000,
1939
- "size_b": 27
 
 
 
 
1940
  },
1941
  {
1942
- "name": "google/gemini-2.5-flash",
1943
- "type": "vision",
1944
  "input_price_per_1m": 0.3,
1945
- "output_price_per_1m": 2.5,
1946
  "currency": "USD",
 
 
1947
  "capabilities": [
1948
- "vision",
1949
  "reasoning"
1950
  ],
1951
- "context_window": 1048576,
1952
- "hf_private": true
1953
  },
1954
  {
1955
- "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
1956
- "type": "chat",
1957
  "input_price_per_1m": 0.3,
1958
- "output_price_per_1m": 1,
1959
  "currency": "USD",
1960
- "context_window": 163840,
1961
  "capabilities": [
1962
- "tools",
1963
  "reasoning"
1964
  ],
1965
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
1966
- "size_b": 671
 
1967
  },
1968
  {
1969
- "name": "alibaba/qwen3-coder-flash",
1970
  "type": "vision",
1971
  "input_price_per_1m": 0.3,
1972
- "output_price_per_1m": 1.5,
1973
  "currency": "USD",
1974
  "capabilities": [
1975
- "vision"
 
1976
  ],
1977
- "context_window": 1048576,
 
1978
  "hf_private": true
1979
  },
1980
  {
@@ -2032,33 +2028,42 @@
2032
  "hf_private": true
2033
  },
2034
  {
2035
- "name": "nebius/deepseek-ai/DeepSeek-V3.2",
2036
- "type": "chat",
2037
  "input_price_per_1m": 0.3,
2038
- "output_price_per_1m": 0.45,
2039
  "currency": "USD",
2040
  "capabilities": [
 
2041
  "reasoning"
2042
  ],
2043
- "context_window": 164000,
2044
- "hf_id": "deepseek-ai/DeepSeek-V3.2",
2045
- "size_b": 685.4
2046
  },
2047
  {
2048
- "name": "nebius/minimax/minimax-m2.1",
2049
  "type": "chat",
2050
  "input_price_per_1m": 0.3,
2051
- "output_price_per_1m": 1.2,
2052
  "currency": "USD",
2053
- "capabilities": [
2054
- "reasoning"
2055
- ],
2056
- "context_window": 200000,
2057
- "hf_id": "MiniMaxAI/MiniMax-M2.1",
2058
- "size_b": 228.7
2059
  },
2060
  {
2061
- "name": "deepinfra/meta-llama/Llama-3.2-90B-Vision-Instruct",
 
 
 
 
 
 
 
 
 
 
 
 
 
2062
  "type": "chat",
2063
  "input_price_per_1m": 0.35,
2064
  "output_price_per_1m": 0.4,
@@ -2093,35 +2098,37 @@
2093
  "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
2094
  },
2095
  {
2096
- "name": "novita/deepseek/deepseek-v3-0324",
2097
  "type": "chat",
2098
  "input_price_per_1m": 0.4,
2099
- "output_price_per_1m": 1.3,
2100
  "currency": "USD",
2101
- "context_window": 128000,
 
2102
  "capabilities": [
2103
- "tools",
2104
- "reasoning"
2105
  ],
2106
- "size_b": 685,
2107
- "hf_id": "deepseek-ai/DeepSeek-V3-0324"
2108
  },
2109
  {
2110
- "name": "novita/deepseek/deepseek-v3-turbo",
2111
  "type": "chat",
2112
  "input_price_per_1m": 0.4,
2113
- "output_price_per_1m": 1.3,
2114
  "currency": "USD",
2115
- "context_window": 128000,
2116
  "hf_private": true
2117
  },
2118
  {
2119
- "name": "mistral/mistral-medium-latest",
2120
  "type": "chat",
2121
  "input_price_per_1m": 0.4,
2122
  "output_price_per_1m": 2,
2123
  "currency": "USD",
2124
  "context_window": 131072,
 
 
 
2125
  "hf_private": true
2126
  },
2127
  {
@@ -2134,19 +2141,19 @@
2134
  "hf_private": true
2135
  },
2136
  {
2137
- "name": "mistral/devstral-medium-2507",
2138
- "type": "chat",
2139
  "input_price_per_1m": 0.4,
2140
- "output_price_per_1m": 2,
2141
  "currency": "USD",
2142
- "context_window": 131072,
2143
  "capabilities": [
2144
- "tools"
2145
  ],
 
2146
  "hf_private": true
2147
  },
2148
  {
2149
- "name": "azure/gpt-4.1-mini",
2150
  "type": "vision",
2151
  "input_price_per_1m": 0.4,
2152
  "output_price_per_1m": 1.6,
@@ -2158,24 +2165,24 @@
2158
  "hf_private": true
2159
  },
2160
  {
2161
- "name": "azure/openai-responses/gpt-4.1-mini",
2162
- "type": "vision",
2163
  "input_price_per_1m": 0.4,
2164
- "output_price_per_1m": 1.6,
2165
  "currency": "USD",
 
2166
  "capabilities": [
2167
- "vision"
2168
  ],
2169
- "context_window": 1047576,
2170
  "hf_private": true
2171
  },
2172
  {
2173
- "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2174
  "type": "chat",
2175
  "input_price_per_1m": 0.4,
2176
- "output_price_per_1m": 1.6,
2177
  "currency": "USD",
2178
- "context_window": 262144,
2179
  "size_b": 480,
2180
  "capabilities": [
2181
  "tools"
@@ -2183,15 +2190,39 @@
2183
  "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct"
2184
  },
2185
  {
2186
- "name": "alibaba/qwen-plus",
2187
  "type": "chat",
2188
  "input_price_per_1m": 0.4,
2189
- "output_price_per_1m": 1.2,
2190
  "currency": "USD",
2191
- "context_window": 131072,
2192
  "capabilities": [
2193
- "tools"
2194
  ],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2195
  "hf_private": true
2196
  },
2197
  {
@@ -2218,32 +2249,6 @@
2218
  "context_window": 1047576,
2219
  "hf_private": true
2220
  },
2221
- {
2222
- "name": "nebius/zai-org/GLM-4.7",
2223
- "type": "chat",
2224
- "input_price_per_1m": 0.4,
2225
- "output_price_per_1m": 2,
2226
- "currency": "USD",
2227
- "capabilities": [
2228
- "reasoning"
2229
- ],
2230
- "context_window": 200000,
2231
- "hf_id": "zai-org/GLM-4.7",
2232
- "size_b": 358.3
2233
- },
2234
- {
2235
- "name": "nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2236
- "type": "chat",
2237
- "input_price_per_1m": 0.4,
2238
- "output_price_per_1m": 1.8,
2239
- "currency": "USD",
2240
- "context_window": 262000,
2241
- "size_b": 480,
2242
- "capabilities": [
2243
- "tools"
2244
- ],
2245
- "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct"
2246
- },
2247
  {
2248
  "name": "mistral/mistral-large-latest",
2249
  "type": "chat",
@@ -2256,19 +2261,6 @@
2256
  ],
2257
  "hf_private": true
2258
  },
2259
- {
2260
- "name": "vertex/gemini-3.1-flash-image-preview",
2261
- "type": "vision",
2262
- "input_price_per_1m": 0.5,
2263
- "output_price_per_1m": 2,
2264
- "currency": "USD",
2265
- "capabilities": [
2266
- "vision",
2267
- "reasoning"
2268
- ],
2269
- "context_window": 131072,
2270
- "hf_private": true
2271
- },
2272
  {
2273
  "name": "vertex/gemini-3-flash-preview",
2274
  "type": "vision",
@@ -2283,7 +2275,7 @@
2283
  "hf_private": true
2284
  },
2285
  {
2286
- "name": "google/gemini-3.1-flash-image-preview",
2287
  "type": "vision",
2288
  "input_price_per_1m": 0.5,
2289
  "output_price_per_1m": 2,
@@ -2295,19 +2287,6 @@
2295
  "context_window": 131072,
2296
  "hf_private": true
2297
  },
2298
- {
2299
- "name": "google/gemini-3-flash-preview",
2300
- "type": "vision",
2301
- "input_price_per_1m": 0.5,
2302
- "output_price_per_1m": 3,
2303
- "currency": "USD",
2304
- "capabilities": [
2305
- "vision",
2306
- "reasoning"
2307
- ],
2308
- "context_window": 1048576,
2309
- "hf_private": true
2310
- },
2311
  {
2312
  "name": "nebius/moonshotai/kimi-k2.5",
2313
  "type": "vision",
@@ -2349,6 +2328,32 @@
2349
  "hf_id": "moonshotai/Kimi-K2-Instruct",
2350
  "size_b": 1026.5
2351
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2352
  {
2353
  "name": "novita/meta-llama/llama-3-70b-instruct",
2354
  "type": "chat",
@@ -2402,21 +2407,7 @@
2402
  "size_b": 1026.5
2403
  },
2404
  {
2405
- "name": "novita/zai-org/glm-4.6",
2406
- "type": "chat",
2407
- "input_price_per_1m": 0.6,
2408
- "output_price_per_1m": 2.2,
2409
- "currency": "USD",
2410
- "context_window": 204800,
2411
- "capabilities": [
2412
- "tools",
2413
- "reasoning"
2414
- ],
2415
- "hf_id": "zai-org/GLM-4.6",
2416
- "size_b": 356.8
2417
- },
2418
- {
2419
- "name": "novita/zai-org/glm-4.5",
2420
  "type": "chat",
2421
  "input_price_per_1m": 0.6,
2422
  "output_price_per_1m": 2.2,
@@ -2468,20 +2459,6 @@
2468
  "hf_id": "zai-org/GLM-4.6",
2469
  "size_b": 356.8
2470
  },
2471
- {
2472
- "name": "deepinfra/zai-org/GLM-4.5",
2473
- "type": "chat",
2474
- "input_price_per_1m": 0.6,
2475
- "output_price_per_1m": 2.2,
2476
- "currency": "USD",
2477
- "context_window": 131072,
2478
- "capabilities": [
2479
- "tools",
2480
- "reasoning"
2481
- ],
2482
- "hf_id": "zai-org/GLM-4.5",
2483
- "size_b": 358.3
2484
- },
2485
  {
2486
  "name": "alibaba/qwen3.5",
2487
  "type": "vision",
@@ -2497,35 +2474,35 @@
2497
  "hf_id": "Qwen/Qwen3.5-9B"
2498
  },
2499
  {
2500
- "name": "minimaxi/MiniMax-M2.7-highspeed",
2501
  "type": "vision",
2502
  "input_price_per_1m": 0.6,
2503
- "output_price_per_1m": 2.4,
2504
  "currency": "USD",
2505
  "capabilities": [
2506
  "vision",
2507
  "reasoning"
2508
  ],
2509
- "context_window": 200000,
2510
- "hf_id": "MiniMaxAI/MiniMax-M2.7",
2511
- "hf_private": true
2512
  },
2513
  {
2514
- "name": "minimaxi/MiniMax-M2.5-highspeed",
2515
- "type": "vision",
2516
  "input_price_per_1m": 0.6,
2517
- "output_price_per_1m": 2.4,
2518
  "currency": "USD",
 
2519
  "capabilities": [
2520
- "vision",
2521
  "reasoning"
2522
  ],
2523
- "context_window": 200000,
2524
- "hf_id": "MiniMaxAI/MiniMax-M2.5",
2525
- "size_b": 228.7
2526
  },
2527
  {
2528
- "name": "moonshot/kimi-k2-0711-preview",
2529
  "type": "chat",
2530
  "input_price_per_1m": 0.6,
2531
  "output_price_per_1m": 2.5,
@@ -2534,76 +2511,104 @@
2534
  "capabilities": [
2535
  "tools"
2536
  ],
2537
- "hf_id": "moonshotai/Kimi-K2-Instruct",
2538
  "size_b": 1026.5
2539
  },
2540
  {
2541
- "name": "moonshot/kimi-k2.5",
2542
- "type": "vision",
2543
  "input_price_per_1m": 0.6,
2544
- "output_price_per_1m": 3,
2545
  "currency": "USD",
 
2546
  "capabilities": [
2547
- "vision",
2548
- "reasoning"
2549
  ],
2550
- "context_window": 262144,
2551
- "hf_id": "moonshotai/Kimi-K2.5",
2552
- "size_b": 1058.6
2553
  },
2554
  {
2555
- "name": "moonshot/kimi-k2-thinking-turbo",
2556
  "type": "chat",
2557
  "input_price_per_1m": 0.6,
2558
  "output_price_per_1m": 2.5,
2559
  "currency": "USD",
2560
  "context_window": 131072,
 
 
 
 
 
 
 
 
 
 
 
 
 
2561
  "capabilities": [
2562
  "tools",
2563
  "reasoning"
2564
  ],
2565
- "hf_id": "moonshotai/Kimi-K2-Thinking",
2566
- "size_b": 1058.1
2567
  },
2568
  {
2569
- "name": "moonshot/kimi-k2-0905-preview",
2570
  "type": "chat",
2571
  "input_price_per_1m": 0.6,
2572
- "output_price_per_1m": 2.5,
2573
  "currency": "USD",
2574
  "context_window": 131072,
2575
  "capabilities": [
2576
- "tools"
 
2577
  ],
2578
- "hf_id": "moonshotai/Kimi-K2-Instruct-0905",
2579
- "size_b": 1026.5
2580
  },
2581
  {
2582
- "name": "moonshot/kimi-k2-thinking",
2583
  "type": "chat",
2584
  "input_price_per_1m": 0.6,
2585
- "output_price_per_1m": 2.5,
2586
  "currency": "USD",
2587
- "context_window": 131072,
2588
  "capabilities": [
2589
- "tools"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2590
  ],
2591
- "hf_id": "moonshotai/Kimi-K2-Instruct",
2592
- "size_b": 1026.5
 
2593
  },
2594
  {
2595
- "name": "nebius/zai-org/GLM-4.5",
2596
- "type": "chat",
2597
  "input_price_per_1m": 0.6,
2598
- "output_price_per_1m": 2.2,
2599
  "currency": "USD",
2600
- "context_window": 128000,
2601
  "capabilities": [
2602
- "tools",
2603
  "reasoning"
2604
  ],
2605
- "hf_id": "zai-org/GLM-4.5",
2606
- "size_b": 358.3
 
2607
  },
2608
  {
2609
  "name": "novita/microsoft/wizardlm-2-8x22b",
@@ -2627,6 +2632,18 @@
2627
  "context_window": 400000,
2628
  "hf_private": true
2629
  },
 
 
 
 
 
 
 
 
 
 
 
 
2630
  {
2631
  "name": "novita/deepseek/deepseek-prover-v2-671b",
2632
  "type": "chat",
@@ -2650,18 +2667,6 @@
2650
  "hf_id": "deepseek-ai/DeepSeek-R1",
2651
  "size_b": 671
2652
  },
2653
- {
2654
- "name": "parasail/parasail-qwen25-vl-72b-instruct",
2655
- "type": "vision",
2656
- "input_price_per_1m": 0.7,
2657
- "output_price_per_1m": 0.7,
2658
- "currency": "USD",
2659
- "capabilities": [
2660
- "vision"
2661
- ],
2662
- "context_window": 32768,
2663
- "size_b": 72
2664
- },
2665
  {
2666
  "name": "openai-responses/gpt-5.4-mini",
2667
  "type": "vision",
@@ -2688,6 +2693,29 @@
2688
  "context_window": 400000,
2689
  "hf_private": true
2690
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2691
  {
2692
  "name": "novita/deepseek/deepseek-r1-distill-llama-70b",
2693
  "type": "chat",
@@ -2715,27 +2743,18 @@
2715
  "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct"
2716
  },
2717
  {
2718
- "name": "deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct",
2719
- "type": "chat",
2720
- "input_price_per_1m": 0.8,
2721
- "output_price_per_1m": 0.8,
2722
- "currency": "USD",
2723
- "context_window": 130815,
2724
- "size_b": 405
2725
- },
2726
- {
2727
- "name": "nebius/deepseek-ai/DeepSeek-R1-0528",
2728
  "type": "chat",
2729
- "input_price_per_1m": 0.8,
2730
- "output_price_per_1m": 2.4,
2731
  "currency": "USD",
2732
- "context_window": 164000,
2733
  "capabilities": [
2734
  "tools",
2735
  "reasoning"
2736
  ],
2737
- "hf_id": "deepseek-ai/DeepSeek-R1-0528",
2738
- "size_b": 684.5
2739
  },
2740
  {
2741
  "name": "deepinfra/deepseek-ai/DeepSeek-V3",
@@ -2751,20 +2770,6 @@
2751
  "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2752
  "size_b": 671
2753
  },
2754
- {
2755
- "name": "deepinfra/deepseek-ai/DeepSeek-R1",
2756
- "type": "chat",
2757
- "input_price_per_1m": 0.85,
2758
- "output_price_per_1m": 2.5,
2759
- "currency": "USD",
2760
- "context_window": 64000,
2761
- "capabilities": [
2762
- "tools",
2763
- "reasoning"
2764
- ],
2765
- "hf_id": "deepseek-ai/DeepSeek-R1",
2766
- "size_b": 671
2767
- },
2768
  {
2769
  "name": "alibaba/qwen3-max",
2770
  "type": "vision",
@@ -2823,39 +2828,24 @@
2823
  "hf_private": true
2824
  },
2825
  {
2826
- "name": "novita/GLM-5",
2827
- "type": "chat",
2828
- "input_price_per_1m": 1,
2829
- "output_price_per_1m": 3.2,
2830
- "currency": "USD",
2831
- "capabilities": [
2832
- "reasoning"
2833
- ],
2834
- "context_window": 202800,
2835
- "hf_id": "zai-org/GLM-5",
2836
- "size_b": 753.9
2837
- },
2838
- {
2839
- "name": "zai/GLM-5",
2840
  "type": "vision",
2841
  "input_price_per_1m": 1,
2842
- "output_price_per_1m": 3.2,
2843
  "currency": "USD",
2844
  "capabilities": [
2845
- "vision",
2846
- "reasoning"
2847
  ],
2848
  "context_window": 200000,
2849
- "hf_id": "zai-org/GLM-5",
2850
- "size_b": 753.9
2851
  },
2852
  {
2853
- "name": "groq/moonshotai/kimi-k2-instruct",
2854
  "type": "chat",
2855
  "input_price_per_1m": 1,
2856
  "output_price_per_1m": 3,
2857
  "currency": "USD",
2858
- "context_window": 131072,
2859
  "capabilities": [
2860
  "tools"
2861
  ],
@@ -2863,12 +2853,12 @@
2863
  "size_b": 1026.5
2864
  },
2865
  {
2866
- "name": "groq/moonshotai/Kimi-K2-Instruct-0905",
2867
  "type": "chat",
2868
  "input_price_per_1m": 1,
2869
  "output_price_per_1m": 3,
2870
  "currency": "USD",
2871
- "context_window": 256000,
2872
  "capabilities": [
2873
  "tools"
2874
  ],
@@ -2876,43 +2866,45 @@
2876
  "size_b": 1026.5
2877
  },
2878
  {
2879
- "name": "anthropic/claude-haiku-4-5",
2880
  "type": "vision",
2881
  "input_price_per_1m": 1,
2882
- "output_price_per_1m": 5,
2883
  "currency": "USD",
 
2884
  "capabilities": [
2885
  "vision"
2886
  ],
2887
- "context_window": 200000,
2888
  "hf_private": true
2889
  },
2890
  {
2891
- "name": "vertex/claude-haiku-4-5",
2892
  "type": "vision",
2893
  "input_price_per_1m": 1,
2894
- "output_price_per_1m": 5,
2895
  "currency": "USD",
2896
  "capabilities": [
2897
- "vision"
 
2898
  ],
2899
  "context_window": 200000,
2900
- "hf_private": true
 
2901
  },
2902
  {
2903
- "name": "perplexity/sonar",
2904
  "type": "vision",
2905
  "input_price_per_1m": 1,
2906
- "output_price_per_1m": 1,
2907
  "currency": "USD",
2908
- "context_window": 131072,
2909
  "capabilities": [
2910
  "vision"
2911
  ],
 
2912
  "hf_private": true
2913
  },
2914
  {
2915
- "name": "alibaba/qwen3-coder-plus",
2916
  "type": "vision",
2917
  "input_price_per_1m": 1,
2918
  "output_price_per_1m": 5,
@@ -2920,9 +2912,22 @@
2920
  "capabilities": [
2921
  "vision"
2922
  ],
2923
- "context_window": 1048576,
2924
  "hf_private": true
2925
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
2926
  {
2927
  "name": "bedrock/claude-haiku-4-5",
2928
  "type": "vision",
@@ -2996,15 +3001,6 @@
2996
  "context_window": 200000,
2997
  "hf_private": true
2998
  },
2999
- {
3000
- "name": "together/Qwen/Qwen2.5-72B-Instruct-Turbo",
3001
- "type": "chat",
3002
- "input_price_per_1m": 1.2,
3003
- "output_price_per_1m": 1.2,
3004
- "currency": "USD",
3005
- "context_window": 32768,
3006
- "size_b": 72
3007
- },
3008
  {
3009
  "name": "moonshot/kimi-k2-turbo-preview",
3010
  "type": "chat",
@@ -3019,30 +3015,36 @@
3019
  "size_b": 1026.5
3020
  },
3021
  {
3022
- "name": "together/deepseek-ai/DeepSeek-V3",
3023
  "type": "chat",
 
 
 
 
 
 
 
 
 
3024
  "input_price_per_1m": 1.25,
3025
- "output_price_per_1m": 1.25,
3026
  "currency": "USD",
3027
- "context_window": 131072,
3028
  "capabilities": [
3029
- "tools",
3030
  "reasoning"
3031
  ],
3032
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3033
- "size_b": 671
3034
  },
3035
  {
3036
- "name": "coding/gemini-2.5-pro",
3037
  "type": "vision",
3038
  "input_price_per_1m": 1.25,
3039
  "output_price_per_1m": 10,
3040
  "currency": "USD",
3041
  "capabilities": [
3042
- "vision",
3043
  "reasoning"
3044
  ],
3045
- "context_window": 1048576,
3046
  "hf_private": true
3047
  },
3048
  {
@@ -3059,28 +3061,31 @@
3059
  "hf_private": true
3060
  },
3061
  {
3062
- "name": "azure/gpt-5.1",
3063
  "type": "vision",
3064
  "input_price_per_1m": 1.25,
3065
  "output_price_per_1m": 10,
3066
  "currency": "USD",
3067
  "capabilities": [
 
3068
  "reasoning"
3069
  ],
3070
- "context_window": 200000,
3071
  "hf_private": true
3072
  },
3073
  {
3074
- "name": "azure/gpt-5",
3075
- "type": "vision",
3076
  "input_price_per_1m": 1.25,
3077
- "output_price_per_1m": 10,
3078
  "currency": "USD",
 
3079
  "capabilities": [
 
3080
  "reasoning"
3081
  ],
3082
- "context_window": 200000,
3083
- "hf_private": true
3084
  },
3085
  {
3086
  "name": "google/gemini-2.5-pro",
@@ -3096,7 +3101,7 @@
3096
  "hf_private": true
3097
  },
3098
  {
3099
- "name": "openai-responses/gpt-5-codex",
3100
  "type": "vision",
3101
  "input_price_per_1m": 1.25,
3102
  "output_price_per_1m": 10,
@@ -3109,7 +3114,7 @@
3109
  "hf_private": true
3110
  },
3111
  {
3112
- "name": "openai-responses/gpt-5",
3113
  "type": "vision",
3114
  "input_price_per_1m": 1.25,
3115
  "output_price_per_1m": 10,
@@ -3122,7 +3127,7 @@
3122
  "hf_private": true
3123
  },
3124
  {
3125
- "name": "openai-responses/gpt-5.1-codex",
3126
  "type": "vision",
3127
  "input_price_per_1m": 1.25,
3128
  "output_price_per_1m": 10,
@@ -3135,7 +3140,7 @@
3135
  "hf_private": true
3136
  },
3137
  {
3138
- "name": "openai-responses/gpt-5.1",
3139
  "type": "vision",
3140
  "input_price_per_1m": 1.25,
3141
  "output_price_per_1m": 10,
@@ -3148,7 +3153,7 @@
3148
  "hf_private": true
3149
  },
3150
  {
3151
- "name": "openai/gpt-5-chat",
3152
  "type": "vision",
3153
  "input_price_per_1m": 1.25,
3154
  "output_price_per_1m": 10,
@@ -3157,11 +3162,11 @@
3157
  "vision",
3158
  "reasoning"
3159
  ],
3160
- "context_window": 128000,
3161
  "hf_private": true
3162
  },
3163
  {
3164
- "name": "openai/gpt-5.1",
3165
  "type": "vision",
3166
  "input_price_per_1m": 1.25,
3167
  "output_price_per_1m": 10,
@@ -3170,11 +3175,11 @@
3170
  "vision",
3171
  "reasoning"
3172
  ],
3173
- "context_window": 400000,
3174
  "hf_private": true
3175
  },
3176
  {
3177
- "name": "openai/gpt-5.1-chat",
3178
  "type": "vision",
3179
  "input_price_per_1m": 1.25,
3180
  "output_price_per_1m": 10,
@@ -3187,7 +3192,7 @@
3187
  "hf_private": true
3188
  },
3189
  {
3190
- "name": "novita/sao10k/l3-70b-euryale-v2.1",
3191
  "type": "chat",
3192
  "input_price_per_1m": 1.48,
3193
  "output_price_per_1m": 1.48,
@@ -3196,7 +3201,7 @@
3196
  "size_b": 70
3197
  },
3198
  {
3199
- "name": "novita/sao10k/l31-70b-euryale-v2.2",
3200
  "type": "chat",
3201
  "input_price_per_1m": 1.48,
3202
  "output_price_per_1m": 1.48,
@@ -3216,6 +3221,18 @@
3216
  ],
3217
  "hf_private": true
3218
  },
 
 
 
 
 
 
 
 
 
 
 
 
3219
  {
3220
  "name": "azure/gpt-5.3-codex",
3221
  "type": "vision",
@@ -3243,15 +3260,16 @@
3243
  "hf_private": true
3244
  },
3245
  {
3246
- "name": "azure/gpt-5.2",
3247
  "type": "vision",
3248
  "input_price_per_1m": 1.75,
3249
  "output_price_per_1m": 14,
3250
  "currency": "USD",
3251
  "capabilities": [
 
3252
  "reasoning"
3253
  ],
3254
- "context_window": 200000,
3255
  "hf_private": true
3256
  },
3257
  {
@@ -3280,19 +3298,6 @@
3280
  "context_window": 400000,
3281
  "hf_private": true
3282
  },
3283
- {
3284
- "name": "openai-responses/gpt-5.3-chat",
3285
- "type": "vision",
3286
- "input_price_per_1m": 1.75,
3287
- "output_price_per_1m": 14,
3288
- "currency": "USD",
3289
- "capabilities": [
3290
- "vision",
3291
- "reasoning"
3292
- ],
3293
- "context_window": 128000,
3294
- "hf_private": true
3295
- },
3296
  {
3297
  "name": "openai-responses/gpt-5.2",
3298
  "type": "vision",
@@ -3307,7 +3312,7 @@
3307
  "hf_private": true
3308
  },
3309
  {
3310
- "name": "openai/gpt-5.3-chat",
3311
  "type": "vision",
3312
  "input_price_per_1m": 1.75,
3313
  "output_price_per_1m": 14,
@@ -3316,11 +3321,11 @@
3316
  "vision",
3317
  "reasoning"
3318
  ],
3319
- "context_window": 128000,
3320
  "hf_private": true
3321
  },
3322
  {
3323
- "name": "openai/gpt-5.2",
3324
  "type": "vision",
3325
  "input_price_per_1m": 1.75,
3326
  "output_price_per_1m": 14,
@@ -3329,11 +3334,11 @@
3329
  "vision",
3330
  "reasoning"
3331
  ],
3332
- "context_window": 400000,
3333
  "hf_private": true
3334
  },
3335
  {
3336
- "name": "openai/gpt-5.2-chat",
3337
  "type": "vision",
3338
  "input_price_per_1m": 1.75,
3339
  "output_price_per_1m": 14,
@@ -3355,46 +3360,20 @@
3355
  "hf_private": true
3356
  },
3357
  {
3358
- "name": "vertex/gemini-3-pro-preview",
3359
- "type": "vision",
3360
- "input_price_per_1m": 2,
3361
- "output_price_per_1m": 12,
3362
- "currency": "USD",
3363
- "capabilities": [
3364
- "vision",
3365
- "reasoning"
3366
- ],
3367
- "context_window": 1048576,
3368
- "hf_private": true
3369
- },
3370
- {
3371
- "name": "vertex/gemini-3.1-pro-preview",
3372
- "type": "vision",
3373
- "input_price_per_1m": 2,
3374
- "output_price_per_1m": 12,
3375
- "currency": "USD",
3376
- "capabilities": [
3377
- "vision",
3378
- "reasoning"
3379
- ],
3380
- "context_window": 1048576,
3381
- "hf_private": true
3382
- },
3383
- {
3384
- "name": "vertex/gemini-3-pro-image-preview",
3385
  "type": "vision",
3386
  "input_price_per_1m": 2,
3387
- "output_price_per_1m": 12,
3388
  "currency": "USD",
 
3389
  "capabilities": [
3390
  "vision",
3391
  "reasoning"
3392
  ],
3393
- "context_window": 1048576,
3394
  "hf_private": true
3395
  },
3396
  {
3397
- "name": "azure/openai-responses/gpt-4.1",
3398
  "type": "vision",
3399
  "input_price_per_1m": 2,
3400
  "output_price_per_1m": 8,
@@ -3406,7 +3385,7 @@
3406
  "hf_private": true
3407
  },
3408
  {
3409
- "name": "azure/gpt-4.1",
3410
  "type": "vision",
3411
  "input_price_per_1m": 2,
3412
  "output_price_per_1m": 8,
@@ -3418,20 +3397,20 @@
3418
  "hf_private": true
3419
  },
3420
  {
3421
- "name": "perplexity/sonar-reasoning-pro",
3422
  "type": "vision",
3423
  "input_price_per_1m": 2,
3424
- "output_price_per_1m": 8,
3425
  "currency": "USD",
3426
- "context_window": 131072,
3427
  "capabilities": [
3428
  "vision",
3429
  "reasoning"
3430
  ],
 
3431
  "hf_private": true
3432
  },
3433
  {
3434
- "name": "google/gemini-3-pro-preview",
3435
  "type": "vision",
3436
  "input_price_per_1m": 2,
3437
  "output_price_per_1m": 12,
@@ -3444,7 +3423,7 @@
3444
  "hf_private": true
3445
  },
3446
  {
3447
- "name": "google/gemini-3.1-pro-preview",
3448
  "type": "vision",
3449
  "input_price_per_1m": 2,
3450
  "output_price_per_1m": 12,
@@ -3456,6 +3435,15 @@
3456
  "context_window": 1048576,
3457
  "hf_private": true
3458
  },
 
 
 
 
 
 
 
 
 
3459
  {
3460
  "name": "xai/grok-2-1212",
3461
  "type": "chat",
@@ -3479,19 +3467,33 @@
3479
  "hf_private": true
3480
  },
3481
  {
3482
- "name": "openai-responses/gpt-4.1",
3483
  "type": "vision",
3484
  "input_price_per_1m": 2,
3485
- "output_price_per_1m": 8,
3486
  "currency": "USD",
3487
  "capabilities": [
3488
- "vision"
 
3489
  ],
3490
- "context_window": 1047576,
3491
  "hf_private": true
3492
  },
3493
  {
3494
- "name": "openai/gpt-4.1",
 
 
 
 
 
 
 
 
 
 
 
 
 
3495
  "type": "vision",
3496
  "input_price_per_1m": 2,
3497
  "output_price_per_1m": 8,
@@ -3516,12 +3518,15 @@
3516
  "hf_private": true
3517
  },
3518
  {
3519
- "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3520
- "type": "chat",
3521
  "input_price_per_1m": 2,
3522
- "output_price_per_1m": 6,
3523
  "currency": "USD",
3524
- "context_window": 128000,
 
 
 
3525
  "hf_private": true
3526
  },
3527
  {
@@ -3563,20 +3568,7 @@
3563
  "hf_private": true
3564
  },
3565
  {
3566
- "name": "openai/gpt-5.4",
3567
- "type": "vision",
3568
- "input_price_per_1m": 2.5,
3569
- "output_price_per_1m": 15,
3570
- "currency": "USD",
3571
- "capabilities": [
3572
- "vision",
3573
- "reasoning"
3574
- ],
3575
- "context_window": 1050000,
3576
- "hf_private": true
3577
- },
3578
- {
3579
- "name": "openai/gpt-4o-2024-05-13",
3580
  "type": "vision",
3581
  "input_price_per_1m": 2.5,
3582
  "output_price_per_1m": 10,
@@ -3588,15 +3580,16 @@
3588
  "hf_private": true
3589
  },
3590
  {
3591
- "name": "openai/gpt-4o-2024-08-06",
3592
  "type": "vision",
3593
  "input_price_per_1m": 2.5,
3594
- "output_price_per_1m": 10,
3595
  "currency": "USD",
3596
  "capabilities": [
3597
- "vision"
 
3598
  ],
3599
- "context_window": 128000,
3600
  "hf_private": true
3601
  },
3602
  {
@@ -3612,30 +3605,15 @@
3612
  "hf_private": true
3613
  },
3614
  {
3615
- "name": "together/deepseek-ai/DeepSeek-R1",
3616
- "type": "chat",
3617
- "input_price_per_1m": 3,
3618
- "output_price_per_1m": 7,
3619
- "currency": "USD",
3620
- "context_window": 64000,
3621
- "capabilities": [
3622
- "tools",
3623
- "reasoning"
3624
- ],
3625
- "hf_id": "deepseek-ai/DeepSeek-R1",
3626
- "size_b": 671
3627
- },
3628
- {
3629
- "name": "coding/claude-sonnet-4-20250514",
3630
  "type": "vision",
3631
- "input_price_per_1m": 3,
3632
- "output_price_per_1m": 15,
3633
  "currency": "USD",
3634
  "capabilities": [
3635
- "vision",
3636
- "reasoning"
3637
  ],
3638
- "context_window": 200000,
3639
  "hf_private": true
3640
  },
3641
  {
@@ -3678,15 +3656,15 @@
3678
  "hf_private": true
3679
  },
3680
  {
3681
- "name": "vertex/claude-3-5-sonnet",
3682
  "type": "vision",
3683
  "input_price_per_1m": 3,
3684
  "output_price_per_1m": 15,
3685
  "currency": "USD",
 
3686
  "capabilities": [
3687
  "vision"
3688
  ],
3689
- "context_window": 200000,
3690
  "hf_private": true
3691
  },
3692
  {
@@ -3729,15 +3707,15 @@
3729
  "hf_private": true
3730
  },
3731
  {
3732
- "name": "perplexity/sonar-pro",
3733
  "type": "vision",
3734
  "input_price_per_1m": 3,
3735
  "output_price_per_1m": 15,
3736
  "currency": "USD",
3737
- "context_window": 204800,
3738
  "capabilities": [
3739
  "vision"
3740
  ],
 
3741
  "hf_private": true
3742
  },
3743
  {
@@ -3753,7 +3731,7 @@
3753
  "hf_private": true
3754
  },
3755
  {
3756
- "name": "bedrock/claude-3-7-sonnet",
3757
  "type": "vision",
3758
  "input_price_per_1m": 3,
3759
  "output_price_per_1m": 15,
@@ -3766,7 +3744,21 @@
3766
  "hf_private": true
3767
  },
3768
  {
3769
- "name": "bedrock/claude-sonnet-4-6",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3770
  "type": "vision",
3771
  "input_price_per_1m": 3,
3772
  "output_price_per_1m": 15,
@@ -3775,11 +3767,11 @@
3775
  "vision",
3776
  "reasoning"
3777
  ],
3778
- "context_window": 1000000,
3779
  "hf_private": true
3780
  },
3781
  {
3782
- "name": "bedrock/claude-sonnet-4-5",
3783
  "type": "vision",
3784
  "input_price_per_1m": 3,
3785
  "output_price_per_1m": 15,
@@ -3792,7 +3784,7 @@
3792
  "hf_private": true
3793
  },
3794
  {
3795
- "name": "bedrock/claude-sonnet-4",
3796
  "type": "vision",
3797
  "input_price_per_1m": 3,
3798
  "output_price_per_1m": 15,
@@ -3804,6 +3796,19 @@
3804
  "context_window": 200000,
3805
  "hf_private": true
3806
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
3807
  {
3808
  "name": "novita/deepseek/deepseek-r1",
3809
  "type": "chat",
@@ -3819,7 +3824,7 @@
3819
  "size_b": 671
3820
  },
3821
  {
3822
- "name": "anthropic/claude-opus-4-6",
3823
  "type": "vision",
3824
  "input_price_per_1m": 5,
3825
  "output_price_per_1m": 25,
@@ -3828,11 +3833,11 @@
3828
  "vision",
3829
  "reasoning"
3830
  ],
3831
- "context_window": 1000000,
3832
  "hf_private": true
3833
  },
3834
  {
3835
- "name": "anthropic/claude-opus-4-5",
3836
  "type": "vision",
3837
  "input_price_per_1m": 5,
3838
  "output_price_per_1m": 25,
@@ -3841,11 +3846,11 @@
3841
  "vision",
3842
  "reasoning"
3843
  ],
3844
- "context_window": 200000,
3845
  "hf_private": true
3846
  },
3847
  {
3848
- "name": "vertex/claude-opus-4-5",
3849
  "type": "vision",
3850
  "input_price_per_1m": 5,
3851
  "output_price_per_1m": 25,
@@ -3854,11 +3859,11 @@
3854
  "vision",
3855
  "reasoning"
3856
  ],
3857
- "context_window": 200000,
3858
  "hf_private": true
3859
  },
3860
  {
3861
- "name": "vertex/claude-opus-4-6",
3862
  "type": "vision",
3863
  "input_price_per_1m": 5,
3864
  "output_price_per_1m": 25,
@@ -3867,7 +3872,7 @@
3867
  "vision",
3868
  "reasoning"
3869
  ],
3870
- "context_window": 1000000,
3871
  "hf_private": true
3872
  },
3873
  {
@@ -3934,7 +3939,7 @@
3934
  "hf_private": true
3935
  },
3936
  {
3937
- "name": "coding/claude-opus-4-20250514",
3938
  "type": "vision",
3939
  "input_price_per_1m": 15,
3940
  "output_price_per_1m": 75,
@@ -3947,7 +3952,7 @@
3947
  "hf_private": true
3948
  },
3949
  {
3950
- "name": "anthropic/claude-opus-4",
3951
  "type": "vision",
3952
  "input_price_per_1m": 15,
3953
  "output_price_per_1m": 75,
@@ -3960,7 +3965,7 @@
3960
  "hf_private": true
3961
  },
3962
  {
3963
- "name": "anthropic/claude-opus-4-1",
3964
  "type": "vision",
3965
  "input_price_per_1m": 15,
3966
  "output_price_per_1m": 75,
@@ -3973,7 +3978,7 @@
3973
  "hf_private": true
3974
  },
3975
  {
3976
- "name": "vertex/claude-opus-4",
3977
  "type": "vision",
3978
  "input_price_per_1m": 15,
3979
  "output_price_per_1m": 75,
@@ -3986,7 +3991,7 @@
3986
  "hf_private": true
3987
  },
3988
  {
3989
- "name": "vertex/claude-opus-4-1",
3990
  "type": "vision",
3991
  "input_price_per_1m": 15,
3992
  "output_price_per_1m": 75,
@@ -4410,7 +4415,8 @@
4410
  "output_price_per_1m": 1.5,
4411
  "currency": "USD",
4412
  "flavor": "base",
4413
- "hf_id": "deepseek-ai/DeepSeek-V3"
 
4414
  },
4415
  {
4416
  "name": "DeepSeek-V3 (base)",
@@ -4419,7 +4425,8 @@
4419
  "output_price_per_1m": 1.5,
4420
  "currency": "USD",
4421
  "flavor": "base",
4422
- "hf_id": "deepseek-ai/DeepSeek-V3"
 
4423
  },
4424
  {
4425
  "name": "Llama-3.3-70B-Instruct (fast)",
@@ -4671,7 +4678,8 @@
4671
  "input_price_per_1m": 0.01,
4672
  "output_price_per_1m": 0,
4673
  "currency": "USD",
4674
- "hf_id": "BAAI/bge-multilingual-gemma2"
 
4675
  },
4676
  {
4677
  "name": "bge-en-icl",
@@ -4764,7 +4772,8 @@
4764
  "input_price_per_1m": 0.003,
4765
  "output_price_per_1m": 0,
4766
  "currency": "EUR",
4767
- "hf_id": "openai/whisper-large-v3"
 
4768
  },
4769
  {
4770
  "name": "holo2-30b-a3b",
@@ -4864,7 +4873,8 @@
4864
  "input_price_per_1m": 0.1,
4865
  "output_price_per_1m": 0,
4866
  "currency": "EUR",
4867
- "hf_id": "BAAI/bge-multilingual-gemma2"
 
4868
  },
4869
  {
4870
  "name": "llama-3.1-8b-instruct",
@@ -4924,7 +4934,8 @@
4924
  ],
4925
  "size_b": 122.61,
4926
  "hf_id": "mistralai/Mistral-Large-Instruct-2411",
4927
- "hf_private": true
 
4928
  },
4929
  {
4930
  "name": "Mistral Small 4",
@@ -5180,7 +5191,8 @@
5180
  "tools"
5181
  ],
5182
  "hf_id": "mistralai/Mistral-Nemo-Instruct-2407",
5183
- "size_b": 12
 
5184
  },
5185
  {
5186
  "name": "Mistral 7B",
@@ -5202,7 +5214,8 @@
5202
  "capabilities": [
5203
  "tools"
5204
  ],
5205
- "hf_id": "mistralai/Mixtral-8x7B-Instruct-v0.1"
 
5206
  },
5207
  {
5208
  "name": "Mixtral 8x22B",
@@ -5215,7 +5228,8 @@
5215
  "capabilities": [
5216
  "tools"
5217
  ],
5218
- "hf_id": "mistralai/Mixtral-8x22B-Instruct-v0.1"
 
5219
  }
5220
  ]
5221
  },
@@ -6741,7 +6755,8 @@
6741
  "hf_id": "MiniMaxAI/MiniMax-Text-01",
6742
  "capabilities": [
6743
  "vision"
6744
- ]
 
6745
  },
6746
  {
6747
  "name": "qwen/qwen-2.5-vl-7b-instruct",
@@ -6888,7 +6903,8 @@
6888
  "capabilities": [
6889
  "tools",
6890
  "reasoning"
6891
- ]
 
6892
  },
6893
  {
6894
  "name": "inception/mercury",
@@ -7065,7 +7081,8 @@
7065
  "capabilities": [
7066
  "tools",
7067
  "reasoning"
7068
- ]
 
7069
  },
7070
  {
7071
  "name": "baidu/ernie-4.5-300b-a47b",
@@ -7312,7 +7329,8 @@
7312
  "hf_id": "deepseek-ai/DeepSeek-V3.2-Speciale",
7313
  "capabilities": [
7314
  "reasoning"
7315
- ]
 
7316
  },
7317
  {
7318
  "name": "moonshotai/kimi-k2-0905",
@@ -9600,7 +9618,8 @@
9600
  "input_price_per_1m": 0.111,
9601
  "output_price_per_1m": 0,
9602
  "currency": "USD",
9603
- "hf_id": "openai/whisper-large-v3"
 
9604
  },
9605
  {
9606
  "name": "Whisper Large v3 Turbo",
@@ -9608,7 +9627,8 @@
9608
  "input_price_per_1m": 0.04,
9609
  "output_price_per_1m": 0,
9610
  "currency": "USD",
9611
- "hf_id": "openai/whisper-large-v3-turbo"
 
9612
  }
9613
  ]
9614
  },
 
133
  "input_price_per_1m": 0.015,
134
  "output_price_per_1m": 0,
135
  "currency": "USD",
136
+ "hf_id": "BAAI/bge-large-en-v1.5",
137
+ "size_b": 0.33
138
  },
139
  {
140
  "name": "bge-m3",
 
252
  "input_price_per_1m": 0.065,
253
  "output_price_per_1m": 0,
254
  "currency": "CHF",
255
+ "hf_id": "BAAI/bge-multilingual-gemma2",
256
+ "size_b": 7.4
257
  },
258
  {
259
  "name": "All MiniLM L12 v2",
 
279
  "input_price_per_1m": 0.006,
280
  "output_price_per_1m": 0,
281
  "currency": "CHF",
282
+ "hf_id": "openai/whisper-large-v3",
283
+ "size_b": 0.7
284
  },
285
  {
286
  "name": "Photomaker V2",
 
345
  ],
346
  "size_b": 122.61,
347
  "hf_id": "mistralai/Mistral-Large-Instruct-2411",
348
+ "hf_private": true,
349
+ "ollama_id": "mistral-large"
350
  },
351
  {
352
  "name": "GPT-5.4 Thinking",
 
488
  ],
489
  "size_b": 122.61,
490
  "hf_id": "mistralai/Mistral-Large-Instruct-2411",
491
+ "hf_private": true,
492
+ "ollama_id": "mistral-large"
493
  },
494
  {
495
  "name": "Llama 4 Maverick",
 
1054
  "eu_endpoints": true,
1055
  "models": [
1056
  {
1057
+ "name": "deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
1058
  "type": "chat",
1059
  "input_price_per_1m": 0.02,
1060
+ "output_price_per_1m": 0.05,
1061
  "currency": "USD",
1062
+ "context_window": 131072,
1063
+ "size_b": 8
1064
  },
1065
  {
1066
+ "name": "novita/meta-llama/llama-3.2-1b-instruct",
1067
  "type": "chat",
1068
  "input_price_per_1m": 0.02,
1069
+ "output_price_per_1m": 0.02,
1070
  "currency": "USD",
1071
+ "context_window": 131000,
1072
+ "size_b": 1
1073
  },
1074
  {
1075
  "name": "openai/gpt-5-nano",
 
1107
  "hf_id": "meta-llama/Meta-Llama-3-8B-Instruct"
1108
  },
1109
  {
1110
+ "name": "azure/gpt-5-nano",
1111
+ "type": "vision",
1112
  "input_price_per_1m": 0.05,
1113
+ "output_price_per_1m": 0.4,
1114
  "currency": "USD",
1115
+ "capabilities": [
1116
+ "reasoning"
1117
+ ],
1118
+ "context_window": 200000,
1119
+ "hf_private": true
1120
  },
1121
  {
1122
+ "name": "alibaba/qwen-turbo",
1123
  "type": "chat",
1124
  "input_price_per_1m": 0.05,
1125
+ "output_price_per_1m": 0.2,
1126
  "currency": "USD",
1127
+ "context_window": 1000000,
 
1128
  "capabilities": [
1129
  "tools"
1130
  ],
1131
+ "hf_private": true
1132
  },
1133
  {
1134
  "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
 
1140
  "size_b": 8
1141
  },
1142
  {
1143
+ "name": "novita/sao10k/l3-8b-lunaris",
1144
+ "type": "chat",
1145
  "input_price_per_1m": 0.05,
1146
+ "output_price_per_1m": 0.05,
1147
  "currency": "USD",
1148
+ "context_window": 8192,
1149
+ "size_b": 8
 
 
 
1150
  },
1151
  {
1152
+ "name": "novita/meta-llama/llama-3.1-8b-instruct",
1153
  "type": "chat",
1154
  "input_price_per_1m": 0.05,
1155
+ "output_price_per_1m": 0.05,
1156
  "currency": "USD",
1157
+ "context_window": 16384,
1158
+ "size_b": 8,
1159
  "capabilities": [
1160
  "tools"
1161
  ],
1162
+ "hf_id": "meta-llama/Meta-Llama-3.1-8B-Instruct"
1163
  },
1164
  {
1165
  "name": "openai-responses/gpt-5-nano",
 
1211
  "size_b": 13
1212
  },
1213
  {
1214
+ "name": "deepinfra/Qwen/Qwen3-32B",
1215
  "type": "chat",
1216
  "input_price_per_1m": 0.1,
1217
+ "output_price_per_1m": 0.3,
1218
  "currency": "USD",
1219
+ "context_window": 40000,
1220
+ "size_b": 32,
1221
+ "capabilities": [
1222
+ "tools",
1223
+ "reasoning"
1224
+ ],
1225
+ "hf_id": "Qwen/Qwen3-32B"
1226
  },
1227
  {
1228
+ "name": "mistral/devstral-small-latest",
1229
  "type": "chat",
1230
  "input_price_per_1m": 0.1,
1231
+ "output_price_per_1m": 0.3,
1232
  "currency": "USD",
1233
  "context_window": 131072,
 
1234
  "capabilities": [
1235
+ "tools"
 
1236
  ],
1237
+ "hf_id": "mistralai/Devstral-Small-2507",
1238
+ "size_b": 24
1239
  },
1240
  {
1241
  "name": "mistral/mistral-small-2503",
 
1260
  "size_b": 24
1261
  },
1262
  {
1263
+ "name": "groq/openai/gpt-oss-20b",
1264
  "type": "chat",
1265
  "input_price_per_1m": 0.1,
1266
+ "output_price_per_1m": 0.5,
1267
  "currency": "USD",
1268
  "context_window": 131072,
1269
+ "size_b": 20,
1270
  "capabilities": [
1271
+ "tools",
 
 
 
 
 
 
 
 
 
 
 
 
1272
  "reasoning"
1273
  ],
1274
+ "hf_id": "openai/gpt-oss-20b"
 
1275
  },
1276
  {
1277
+ "name": "azure/openai-responses/gpt-4.1-nano",
1278
  "type": "vision",
1279
  "input_price_per_1m": 0.1,
1280
  "output_price_per_1m": 0.4,
 
1286
  "hf_private": true
1287
  },
1288
  {
1289
+ "name": "azure/gpt-4.1-nano",
1290
  "type": "vision",
1291
  "input_price_per_1m": 0.1,
1292
  "output_price_per_1m": 0.4,
 
1298
  "hf_private": true
1299
  },
1300
  {
1301
+ "name": "vertex/gemini-2.5-flash-lite",
1302
  "type": "vision",
1303
  "input_price_per_1m": 0.1,
1304
  "output_price_per_1m": 0.4,
 
1310
  "context_window": 1048576,
1311
  "hf_private": true
1312
  },
1313
+ {
1314
+ "name": "together/meta-llama/Meta-Llama-3-8B-Instruct-Lite",
1315
+ "type": "chat",
1316
+ "input_price_per_1m": 0.1,
1317
+ "output_price_per_1m": 0.1,
1318
+ "currency": "USD",
1319
+ "context_window": 8192,
1320
+ "size_b": 8
1321
+ },
1322
  {
1323
  "name": "google/gemini-2.0-flash-001",
1324
  "type": "vision",
 
1332
  "hf_private": true
1333
  },
1334
  {
1335
+ "name": "google/gemini-2.5-flash-lite",
1336
+ "type": "vision",
1337
  "input_price_per_1m": 0.1,
1338
+ "output_price_per_1m": 0.4,
1339
  "currency": "USD",
 
 
1340
  "capabilities": [
1341
+ "vision",
1342
  "reasoning"
1343
  ],
1344
+ "context_window": 1048576,
1345
+ "hf_private": true
1346
  },
1347
  {
1348
  "name": "openai-responses/gpt-4.1-nano",
 
1416
  "context_window": 8192,
1417
  "size_b": 8
1418
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1419
  {
1420
  "name": "mistral/mistral-small-2603",
1421
  "type": "vision",
 
1453
  "size_b": 235
1454
  },
1455
  {
1456
+ "name": "groq/openai/gpt-oss-120b",
1457
+ "type": "chat",
1458
  "input_price_per_1m": 0.15,
1459
+ "output_price_per_1m": 0.75,
1460
  "currency": "USD",
1461
+ "context_window": 131072,
1462
+ "size_b": 120,
1463
  "capabilities": [
1464
+ "tools",
1465
+ "reasoning"
1466
  ],
1467
+ "hf_id": "openai/gpt-oss-120b"
 
1468
  },
1469
  {
1470
  "name": "nebius/openai/gpt-oss-120b",
 
1479
  "size_b": 120,
1480
  "hf_id": "openai/gpt-oss-120b"
1481
  },
1482
+ {
1483
+ "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
1484
+ "type": "chat",
1485
+ "input_price_per_1m": 0.15,
1486
+ "output_price_per_1m": 0.15,
1487
+ "currency": "USD",
1488
+ "context_window": 128000,
1489
+ "size_b": 14,
1490
+ "capabilities": [
1491
+ "tools",
1492
+ "reasoning"
1493
+ ],
1494
+ "hf_id": "deepseek-ai/DeepSeek-R1"
1495
+ },
1496
+ {
1497
+ "name": "openai/gpt-4o-mini",
1498
+ "type": "vision",
1499
+ "input_price_per_1m": 0.15,
1500
+ "output_price_per_1m": 0.6,
1501
+ "currency": "USD",
1502
+ "capabilities": [
1503
+ "vision"
1504
+ ],
1505
+ "context_window": 128000,
1506
+ "hf_private": true
1507
+ },
1508
  {
1509
  "name": "novita/mistralai/mistral-nemo",
1510
  "type": "chat",
 
1527
  "context_window": 131072,
1528
  "size_b": 8
1529
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1530
  {
1531
  "name": "deepinfra/Qwen/Qwen3-235B-A22B",
1532
  "type": "chat",
 
1569
  "hf_id": "Qwen/Qwen3-30B-A3B-Instruct-2507"
1570
  },
1571
  {
1572
+ "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1573
  "type": "vision",
1574
  "input_price_per_1m": 0.2,
1575
+ "output_price_per_1m": 0.85,
1576
  "currency": "USD",
1577
+ "context_window": 1048576,
1578
+ "size_b": 17,
1579
  "capabilities": [
1580
  "vision",
1581
+ "tools"
 
1582
  ],
1583
+ "hf_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct"
1584
  },
1585
  {
1586
+ "name": "novita/qwen/qwen3-235b-a22b-fp8",
1587
+ "type": "chat",
1588
+ "input_price_per_1m": 0.2,
1589
+ "output_price_per_1m": 0.8,
1590
+ "currency": "USD",
1591
+ "context_window": 128000,
1592
+ "size_b": 235,
1593
+ "capabilities": [
1594
+ "tools",
1595
+ "reasoning"
1596
+ ],
1597
+ "hf_id": "Qwen/Qwen3-235B-A22B"
1598
+ },
1599
+ {
1600
+ "name": "xai/grok-code-fast-1",
1601
+ "type": "vision",
1602
+ "input_price_per_1m": 0.2,
1603
+ "output_price_per_1m": 1.5,
1604
  "currency": "USD",
1605
  "capabilities": [
1606
  "vision"
1607
  ],
1608
+ "context_window": 256000,
1609
+ "hf_private": true
1610
+ },
1611
+ {
1612
+ "name": "xai/grok-4-fast",
1613
+ "type": "vision",
1614
+ "input_price_per_1m": 0.2,
1615
+ "output_price_per_1m": 0.5,
1616
+ "currency": "USD",
1617
  "context_window": 2000000,
1618
+ "capabilities": [
1619
+ "vision",
1620
+ "tools",
1621
+ "reasoning"
1622
+ ],
1623
  "hf_private": true
1624
  },
1625
  {
 
1649
  "hf_private": true
1650
  },
1651
  {
1652
+ "name": "xai/grok-4-1-fast-reasoning",
1653
  "type": "vision",
1654
  "input_price_per_1m": 0.2,
1655
+ "output_price_per_1m": 0.5,
1656
  "currency": "USD",
1657
  "capabilities": [
1658
  "vision"
1659
  ],
1660
+ "context_window": 2000000,
1661
  "hf_private": true
1662
  },
1663
+ {
1664
+ "name": "together/meta-llama/LlamaGuard-2-8b",
1665
+ "type": "chat",
1666
+ "input_price_per_1m": 0.2,
1667
+ "output_price_per_1m": 0.2,
1668
+ "currency": "USD",
1669
+ "context_window": 8192,
1670
+ "size_b": 8
1671
+ },
1672
  {
1673
  "name": "openai-responses/gpt-5.4-nano",
1674
  "type": "vision",
 
1696
  "hf_private": true
1697
  },
1698
  {
1699
+ "name": "deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1700
+ "type": "chat",
1701
  "input_price_per_1m": 0.23,
1702
+ "output_price_per_1m": 0.69,
1703
  "currency": "USD",
1704
+ "context_window": 64000,
1705
+ "size_b": 70,
1706
  "capabilities": [
1707
+ "reasoning"
1708
  ],
1709
+ "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B"
1710
  },
1711
  {
1712
+ "name": "deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct",
1713
  "type": "chat",
1714
  "input_price_per_1m": 0.23,
1715
  "output_price_per_1m": 0.4,
1716
  "currency": "USD",
1717
+ "context_window": 130815,
1718
+ "size_b": 70
 
 
 
 
1719
  },
1720
  {
1721
+ "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct",
1722
  "type": "chat",
1723
  "input_price_per_1m": 0.23,
1724
+ "output_price_per_1m": 0.4,
1725
  "currency": "USD",
1726
+ "context_window": 131072,
1727
  "size_b": 70,
1728
  "capabilities": [
1729
+ "tools"
1730
  ],
1731
+ "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
1732
  },
1733
  {
1734
+ "name": "deepinfra/Qwen/Qwen2.5-72B-Instruct",
1735
+ "type": "vision",
1736
  "input_price_per_1m": 0.23,
1737
  "output_price_per_1m": 0.4,
1738
  "currency": "USD",
1739
+ "context_window": 131072,
1740
+ "size_b": 72,
1741
+ "capabilities": [
1742
+ "vision"
1743
+ ],
1744
+ "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct"
1745
  },
1746
  {
1747
  "name": "mistral/open-mistral-7b",
 
1753
  "size_b": 7
1754
  },
1755
  {
1756
+ "name": "azure/gpt-5-mini",
1757
  "type": "vision",
1758
  "input_price_per_1m": 0.25,
1759
+ "output_price_per_1m": 2,
1760
  "currency": "USD",
1761
  "capabilities": [
1762
+ "reasoning"
1763
  ],
1764
+ "context_window": 200000,
1765
  "hf_private": true
1766
  },
1767
  {
1768
+ "name": "vertex/gemini-3.1-flash-lite-preview",
1769
  "type": "vision",
1770
  "input_price_per_1m": 0.25,
1771
+ "output_price_per_1m": 1.5,
1772
  "currency": "USD",
1773
  "capabilities": [
1774
+ "vision"
1775
  ],
1776
+ "context_window": 1048576,
1777
  "hf_private": true
1778
  },
1779
  {
 
1837
  "hf_private": true
1838
  },
1839
  {
1840
+ "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
1841
  "type": "chat",
1842
  "input_price_per_1m": 0.3,
1843
+ "output_price_per_1m": 1,
1844
  "currency": "USD",
1845
+ "context_window": 163840,
1846
+ "capabilities": [
1847
+ "tools",
1848
+ "reasoning"
1849
+ ],
1850
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
1851
+ "size_b": 671
1852
  },
1853
  {
1854
+ "name": "mistral/codestral-latest",
1855
+ "type": "chat",
1856
  "input_price_per_1m": 0.3,
1857
+ "output_price_per_1m": 0.9,
1858
  "currency": "USD",
1859
+ "context_window": 131072,
 
 
 
 
 
1860
  "hf_private": true
1861
  },
1862
  {
1863
+ "name": "parasail/parasail-gemma3-27b-it",
1864
  "type": "chat",
1865
  "input_price_per_1m": 0.3,
1866
+ "output_price_per_1m": 0.5,
1867
  "currency": "USD",
1868
+ "context_window": 128000,
1869
+ "size_b": 27
 
 
 
 
1870
  },
1871
  {
1872
+ "name": "alibaba/qwen3-coder-flash",
1873
  "type": "vision",
1874
  "input_price_per_1m": 0.3,
1875
+ "output_price_per_1m": 1.5,
1876
  "currency": "USD",
1877
  "capabilities": [
1878
+ "vision"
 
1879
  ],
1880
+ "context_window": 1048576,
 
1881
  "hf_private": true
1882
  },
1883
  {
1884
+ "name": "vertex/gemini-2.5-flash",
1885
  "type": "vision",
1886
  "input_price_per_1m": 0.3,
1887
  "output_price_per_1m": 2.5,
 
1894
  "hf_private": true
1895
  },
1896
  {
1897
+ "name": "vertex/gemini-2.5-flash-image",
 
 
 
 
 
 
 
 
 
1898
  "type": "vision",
1899
  "input_price_per_1m": 0.3,
1900
  "output_price_per_1m": 2.5,
 
1907
  "hf_private": true
1908
  },
1909
  {
1910
+ "name": "nebius/deepseek-ai/DeepSeek-V3.2",
1911
+ "type": "chat",
1912
  "input_price_per_1m": 0.3,
1913
+ "output_price_per_1m": 0.45,
1914
  "currency": "USD",
1915
  "capabilities": [
 
1916
  "reasoning"
1917
  ],
1918
+ "context_window": 164000,
1919
+ "hf_id": "deepseek-ai/DeepSeek-V3.2",
1920
+ "size_b": 685.4
1921
  },
1922
  {
1923
+ "name": "nebius/minimax/minimax-m2.1",
1924
  "type": "chat",
1925
  "input_price_per_1m": 0.3,
1926
+ "output_price_per_1m": 1.2,
1927
  "currency": "USD",
1928
+ "capabilities": [
1929
+ "reasoning"
1930
+ ],
1931
+ "context_window": 200000,
1932
+ "hf_id": "MiniMaxAI/MiniMax-M2.1",
1933
+ "size_b": 228.7
1934
  },
1935
  {
1936
+ "name": "novita/deepseek/deepseek-r1-distill-qwen-32b",
1937
+ "type": "chat",
1938
  "input_price_per_1m": 0.3,
1939
+ "output_price_per_1m": 0.3,
1940
  "currency": "USD",
1941
+ "context_window": 12800,
1942
+ "size_b": 32,
1943
  "capabilities": [
 
1944
  "reasoning"
1945
  ],
1946
+ "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
 
1947
  },
1948
  {
1949
+ "name": "novita/MiniMax-M2.7",
1950
+ "type": "vision",
1951
  "input_price_per_1m": 0.3,
1952
+ "output_price_per_1m": 1.2,
1953
  "currency": "USD",
 
1954
  "capabilities": [
1955
+ "vision",
1956
  "reasoning"
1957
  ],
1958
+ "context_window": 200000,
1959
+ "hf_id": "MiniMaxAI/MiniMax-M2.7",
1960
+ "hf_private": true
1961
  },
1962
  {
1963
+ "name": "novita/minimax-m2.7",
1964
  "type": "vision",
1965
  "input_price_per_1m": 0.3,
1966
+ "output_price_per_1m": 1.2,
1967
  "currency": "USD",
1968
  "capabilities": [
1969
+ "vision",
1970
+ "reasoning"
1971
  ],
1972
+ "context_window": 200000,
1973
+ "hf_id": "MiniMaxAI/MiniMax-M2.7",
1974
  "hf_private": true
1975
  },
1976
  {
 
2028
  "hf_private": true
2029
  },
2030
  {
2031
+ "name": "coding/gemini-2.5-flash",
2032
+ "type": "vision",
2033
  "input_price_per_1m": 0.3,
2034
+ "output_price_per_1m": 2.5,
2035
  "currency": "USD",
2036
  "capabilities": [
2037
+ "vision",
2038
  "reasoning"
2039
  ],
2040
+ "context_window": 1048576,
2041
+ "hf_private": true
 
2042
  },
2043
  {
2044
+ "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
2045
  "type": "chat",
2046
  "input_price_per_1m": 0.3,
2047
+ "output_price_per_1m": 0.3,
2048
  "currency": "USD",
2049
+ "context_window": 32768,
2050
+ "size_b": 7
 
 
 
 
2051
  },
2052
  {
2053
+ "name": "google/gemini-2.5-flash",
2054
+ "type": "vision",
2055
+ "input_price_per_1m": 0.3,
2056
+ "output_price_per_1m": 2.5,
2057
+ "currency": "USD",
2058
+ "capabilities": [
2059
+ "vision",
2060
+ "reasoning"
2061
+ ],
2062
+ "context_window": 1048576,
2063
+ "hf_private": true
2064
+ },
2065
+ {
2066
+ "name": "deepinfra/meta-llama/Llama-3.2-90B-Vision-Instruct",
2067
  "type": "chat",
2068
  "input_price_per_1m": 0.35,
2069
  "output_price_per_1m": 0.4,
 
2098
  "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
2099
  },
2100
  {
2101
+ "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2102
  "type": "chat",
2103
  "input_price_per_1m": 0.4,
2104
+ "output_price_per_1m": 1.6,
2105
  "currency": "USD",
2106
+ "context_window": 262144,
2107
+ "size_b": 480,
2108
  "capabilities": [
2109
+ "tools"
 
2110
  ],
2111
+ "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct"
 
2112
  },
2113
  {
2114
+ "name": "mistral/mistral-medium-latest",
2115
  "type": "chat",
2116
  "input_price_per_1m": 0.4,
2117
+ "output_price_per_1m": 2,
2118
  "currency": "USD",
2119
+ "context_window": 131072,
2120
  "hf_private": true
2121
  },
2122
  {
2123
+ "name": "mistral/devstral-medium-2507",
2124
  "type": "chat",
2125
  "input_price_per_1m": 0.4,
2126
  "output_price_per_1m": 2,
2127
  "currency": "USD",
2128
  "context_window": 131072,
2129
+ "capabilities": [
2130
+ "tools"
2131
+ ],
2132
  "hf_private": true
2133
  },
2134
  {
 
2141
  "hf_private": true
2142
  },
2143
  {
2144
+ "name": "azure/gpt-4.1-mini",
2145
+ "type": "vision",
2146
  "input_price_per_1m": 0.4,
2147
+ "output_price_per_1m": 1.6,
2148
  "currency": "USD",
 
2149
  "capabilities": [
2150
+ "vision"
2151
  ],
2152
+ "context_window": 1047576,
2153
  "hf_private": true
2154
  },
2155
  {
2156
+ "name": "azure/openai-responses/gpt-4.1-mini",
2157
  "type": "vision",
2158
  "input_price_per_1m": 0.4,
2159
  "output_price_per_1m": 1.6,
 
2165
  "hf_private": true
2166
  },
2167
  {
2168
+ "name": "alibaba/qwen-plus",
2169
+ "type": "chat",
2170
  "input_price_per_1m": 0.4,
2171
+ "output_price_per_1m": 1.2,
2172
  "currency": "USD",
2173
+ "context_window": 131072,
2174
  "capabilities": [
2175
+ "tools"
2176
  ],
 
2177
  "hf_private": true
2178
  },
2179
  {
2180
+ "name": "nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2181
  "type": "chat",
2182
  "input_price_per_1m": 0.4,
2183
+ "output_price_per_1m": 1.8,
2184
  "currency": "USD",
2185
+ "context_window": 262000,
2186
  "size_b": 480,
2187
  "capabilities": [
2188
  "tools"
 
2190
  "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct"
2191
  },
2192
  {
2193
+ "name": "nebius/zai-org/GLM-4.7",
2194
  "type": "chat",
2195
  "input_price_per_1m": 0.4,
2196
+ "output_price_per_1m": 2,
2197
  "currency": "USD",
 
2198
  "capabilities": [
2199
+ "reasoning"
2200
  ],
2201
+ "context_window": 200000,
2202
+ "hf_id": "zai-org/GLM-4.7",
2203
+ "size_b": 358.3
2204
+ },
2205
+ {
2206
+ "name": "novita/deepseek/deepseek-v3-0324",
2207
+ "type": "chat",
2208
+ "input_price_per_1m": 0.4,
2209
+ "output_price_per_1m": 1.3,
2210
+ "currency": "USD",
2211
+ "context_window": 128000,
2212
+ "capabilities": [
2213
+ "tools",
2214
+ "reasoning"
2215
+ ],
2216
+ "size_b": 685,
2217
+ "hf_id": "deepseek-ai/DeepSeek-V3-0324"
2218
+ },
2219
+ {
2220
+ "name": "novita/deepseek/deepseek-v3-turbo",
2221
+ "type": "chat",
2222
+ "input_price_per_1m": 0.4,
2223
+ "output_price_per_1m": 1.3,
2224
+ "currency": "USD",
2225
+ "context_window": 128000,
2226
  "hf_private": true
2227
  },
2228
  {
 
2249
  "context_window": 1047576,
2250
  "hf_private": true
2251
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2252
  {
2253
  "name": "mistral/mistral-large-latest",
2254
  "type": "chat",
 
2261
  ],
2262
  "hf_private": true
2263
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
2264
  {
2265
  "name": "vertex/gemini-3-flash-preview",
2266
  "type": "vision",
 
2275
  "hf_private": true
2276
  },
2277
  {
2278
+ "name": "vertex/gemini-3.1-flash-image-preview",
2279
  "type": "vision",
2280
  "input_price_per_1m": 0.5,
2281
  "output_price_per_1m": 2,
 
2287
  "context_window": 131072,
2288
  "hf_private": true
2289
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
2290
  {
2291
  "name": "nebius/moonshotai/kimi-k2.5",
2292
  "type": "vision",
 
2328
  "hf_id": "moonshotai/Kimi-K2-Instruct",
2329
  "size_b": 1026.5
2330
  },
2331
+ {
2332
+ "name": "google/gemini-3.1-flash-image-preview",
2333
+ "type": "vision",
2334
+ "input_price_per_1m": 0.5,
2335
+ "output_price_per_1m": 2,
2336
+ "currency": "USD",
2337
+ "capabilities": [
2338
+ "vision",
2339
+ "reasoning"
2340
+ ],
2341
+ "context_window": 131072,
2342
+ "hf_private": true
2343
+ },
2344
+ {
2345
+ "name": "google/gemini-3-flash-preview",
2346
+ "type": "vision",
2347
+ "input_price_per_1m": 0.5,
2348
+ "output_price_per_1m": 3,
2349
+ "currency": "USD",
2350
+ "capabilities": [
2351
+ "vision",
2352
+ "reasoning"
2353
+ ],
2354
+ "context_window": 1048576,
2355
+ "hf_private": true
2356
+ },
2357
  {
2358
  "name": "novita/meta-llama/llama-3-70b-instruct",
2359
  "type": "chat",
 
2407
  "size_b": 1026.5
2408
  },
2409
  {
2410
+ "name": "deepinfra/zai-org/GLM-4.5",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2411
  "type": "chat",
2412
  "input_price_per_1m": 0.6,
2413
  "output_price_per_1m": 2.2,
 
2459
  "hf_id": "zai-org/GLM-4.6",
2460
  "size_b": 356.8
2461
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2462
  {
2463
  "name": "alibaba/qwen3.5",
2464
  "type": "vision",
 
2474
  "hf_id": "Qwen/Qwen3.5-9B"
2475
  },
2476
  {
2477
+ "name": "moonshot/kimi-k2.5",
2478
  "type": "vision",
2479
  "input_price_per_1m": 0.6,
2480
+ "output_price_per_1m": 3,
2481
  "currency": "USD",
2482
  "capabilities": [
2483
  "vision",
2484
  "reasoning"
2485
  ],
2486
+ "context_window": 262144,
2487
+ "hf_id": "moonshotai/Kimi-K2.5",
2488
+ "size_b": 1058.6
2489
  },
2490
  {
2491
+ "name": "moonshot/kimi-k2-thinking-turbo",
2492
+ "type": "chat",
2493
  "input_price_per_1m": 0.6,
2494
+ "output_price_per_1m": 2.5,
2495
  "currency": "USD",
2496
+ "context_window": 131072,
2497
  "capabilities": [
2498
+ "tools",
2499
  "reasoning"
2500
  ],
2501
+ "hf_id": "moonshotai/Kimi-K2-Thinking",
2502
+ "size_b": 1058.1
 
2503
  },
2504
  {
2505
+ "name": "moonshot/kimi-k2-0905-preview",
2506
  "type": "chat",
2507
  "input_price_per_1m": 0.6,
2508
  "output_price_per_1m": 2.5,
 
2511
  "capabilities": [
2512
  "tools"
2513
  ],
2514
+ "hf_id": "moonshotai/Kimi-K2-Instruct-0905",
2515
  "size_b": 1026.5
2516
  },
2517
  {
2518
+ "name": "moonshot/kimi-k2-thinking",
2519
+ "type": "chat",
2520
  "input_price_per_1m": 0.6,
2521
+ "output_price_per_1m": 2.5,
2522
  "currency": "USD",
2523
+ "context_window": 131072,
2524
  "capabilities": [
2525
+ "tools"
 
2526
  ],
2527
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2528
+ "size_b": 1026.5
 
2529
  },
2530
  {
2531
+ "name": "moonshot/kimi-k2-0711-preview",
2532
  "type": "chat",
2533
  "input_price_per_1m": 0.6,
2534
  "output_price_per_1m": 2.5,
2535
  "currency": "USD",
2536
  "context_window": 131072,
2537
+ "capabilities": [
2538
+ "tools"
2539
+ ],
2540
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2541
+ "size_b": 1026.5
2542
+ },
2543
+ {
2544
+ "name": "nebius/zai-org/GLM-4.5",
2545
+ "type": "chat",
2546
+ "input_price_per_1m": 0.6,
2547
+ "output_price_per_1m": 2.2,
2548
+ "currency": "USD",
2549
+ "context_window": 128000,
2550
  "capabilities": [
2551
  "tools",
2552
  "reasoning"
2553
  ],
2554
+ "hf_id": "zai-org/GLM-4.5",
2555
+ "size_b": 358.3
2556
  },
2557
  {
2558
+ "name": "novita/zai-org/glm-4.5",
2559
  "type": "chat",
2560
  "input_price_per_1m": 0.6,
2561
+ "output_price_per_1m": 2.2,
2562
  "currency": "USD",
2563
  "context_window": 131072,
2564
  "capabilities": [
2565
+ "tools",
2566
+ "reasoning"
2567
  ],
2568
+ "hf_id": "zai-org/GLM-4.5",
2569
+ "size_b": 358.3
2570
  },
2571
  {
2572
+ "name": "novita/zai-org/glm-4.6",
2573
  "type": "chat",
2574
  "input_price_per_1m": 0.6,
2575
+ "output_price_per_1m": 2.2,
2576
  "currency": "USD",
2577
+ "context_window": 204800,
2578
  "capabilities": [
2579
+ "tools",
2580
+ "reasoning"
2581
+ ],
2582
+ "hf_id": "zai-org/GLM-4.6",
2583
+ "size_b": 356.8
2584
+ },
2585
+ {
2586
+ "name": "minimaxi/MiniMax-M2.7-highspeed",
2587
+ "type": "vision",
2588
+ "input_price_per_1m": 0.6,
2589
+ "output_price_per_1m": 2.4,
2590
+ "currency": "USD",
2591
+ "capabilities": [
2592
+ "vision",
2593
+ "reasoning"
2594
  ],
2595
+ "context_window": 200000,
2596
+ "hf_id": "MiniMaxAI/MiniMax-M2.7",
2597
+ "hf_private": true
2598
  },
2599
  {
2600
+ "name": "minimaxi/MiniMax-M2.5-highspeed",
2601
+ "type": "vision",
2602
  "input_price_per_1m": 0.6,
2603
+ "output_price_per_1m": 2.4,
2604
  "currency": "USD",
 
2605
  "capabilities": [
2606
+ "vision",
2607
  "reasoning"
2608
  ],
2609
+ "context_window": 200000,
2610
+ "hf_id": "MiniMaxAI/MiniMax-M2.5",
2611
+ "size_b": 228.7
2612
  },
2613
  {
2614
  "name": "novita/microsoft/wizardlm-2-8x22b",
 
2632
  "context_window": 400000,
2633
  "hf_private": true
2634
  },
2635
+ {
2636
+ "name": "parasail/parasail-qwen25-vl-72b-instruct",
2637
+ "type": "vision",
2638
+ "input_price_per_1m": 0.7,
2639
+ "output_price_per_1m": 0.7,
2640
+ "currency": "USD",
2641
+ "capabilities": [
2642
+ "vision"
2643
+ ],
2644
+ "context_window": 32768,
2645
+ "size_b": 72
2646
+ },
2647
  {
2648
  "name": "novita/deepseek/deepseek-prover-v2-671b",
2649
  "type": "chat",
 
2667
  "hf_id": "deepseek-ai/DeepSeek-R1",
2668
  "size_b": 671
2669
  },
 
 
 
 
 
 
 
 
 
 
 
 
2670
  {
2671
  "name": "openai-responses/gpt-5.4-mini",
2672
  "type": "vision",
 
2693
  "context_window": 400000,
2694
  "hf_private": true
2695
  },
2696
+ {
2697
+ "name": "deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct",
2698
+ "type": "chat",
2699
+ "input_price_per_1m": 0.8,
2700
+ "output_price_per_1m": 0.8,
2701
+ "currency": "USD",
2702
+ "context_window": 130815,
2703
+ "size_b": 405
2704
+ },
2705
+ {
2706
+ "name": "nebius/deepseek-ai/DeepSeek-R1-0528",
2707
+ "type": "chat",
2708
+ "input_price_per_1m": 0.8,
2709
+ "output_price_per_1m": 2.4,
2710
+ "currency": "USD",
2711
+ "context_window": 164000,
2712
+ "capabilities": [
2713
+ "tools",
2714
+ "reasoning"
2715
+ ],
2716
+ "hf_id": "deepseek-ai/DeepSeek-R1-0528",
2717
+ "size_b": 684.5
2718
+ },
2719
  {
2720
  "name": "novita/deepseek/deepseek-r1-distill-llama-70b",
2721
  "type": "chat",
 
2743
  "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct"
2744
  },
2745
  {
2746
+ "name": "deepinfra/deepseek-ai/DeepSeek-R1",
 
 
 
 
 
 
 
 
 
2747
  "type": "chat",
2748
+ "input_price_per_1m": 0.85,
2749
+ "output_price_per_1m": 2.5,
2750
  "currency": "USD",
2751
+ "context_window": 64000,
2752
  "capabilities": [
2753
  "tools",
2754
  "reasoning"
2755
  ],
2756
+ "hf_id": "deepseek-ai/DeepSeek-R1",
2757
+ "size_b": 671
2758
  },
2759
  {
2760
  "name": "deepinfra/deepseek-ai/DeepSeek-V3",
 
2770
  "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2771
  "size_b": 671
2772
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2773
  {
2774
  "name": "alibaba/qwen3-max",
2775
  "type": "vision",
 
2828
  "hf_private": true
2829
  },
2830
  {
2831
+ "name": "anthropic/claude-haiku-4-5",
 
 
 
 
 
 
 
 
 
 
 
 
 
2832
  "type": "vision",
2833
  "input_price_per_1m": 1,
2834
+ "output_price_per_1m": 5,
2835
  "currency": "USD",
2836
  "capabilities": [
2837
+ "vision"
 
2838
  ],
2839
  "context_window": 200000,
2840
+ "hf_private": true
 
2841
  },
2842
  {
2843
+ "name": "groq/moonshotai/Kimi-K2-Instruct-0905",
2844
  "type": "chat",
2845
  "input_price_per_1m": 1,
2846
  "output_price_per_1m": 3,
2847
  "currency": "USD",
2848
+ "context_window": 256000,
2849
  "capabilities": [
2850
  "tools"
2851
  ],
 
2853
  "size_b": 1026.5
2854
  },
2855
  {
2856
+ "name": "groq/moonshotai/kimi-k2-instruct",
2857
  "type": "chat",
2858
  "input_price_per_1m": 1,
2859
  "output_price_per_1m": 3,
2860
  "currency": "USD",
2861
+ "context_window": 131072,
2862
  "capabilities": [
2863
  "tools"
2864
  ],
 
2866
  "size_b": 1026.5
2867
  },
2868
  {
2869
+ "name": "perplexity/sonar",
2870
  "type": "vision",
2871
  "input_price_per_1m": 1,
2872
+ "output_price_per_1m": 1,
2873
  "currency": "USD",
2874
+ "context_window": 131072,
2875
  "capabilities": [
2876
  "vision"
2877
  ],
 
2878
  "hf_private": true
2879
  },
2880
  {
2881
+ "name": "zai/GLM-5",
2882
  "type": "vision",
2883
  "input_price_per_1m": 1,
2884
+ "output_price_per_1m": 3.2,
2885
  "currency": "USD",
2886
  "capabilities": [
2887
+ "vision",
2888
+ "reasoning"
2889
  ],
2890
  "context_window": 200000,
2891
+ "hf_id": "zai-org/GLM-5",
2892
+ "size_b": 753.9
2893
  },
2894
  {
2895
+ "name": "alibaba/qwen3-coder-plus",
2896
  "type": "vision",
2897
  "input_price_per_1m": 1,
2898
+ "output_price_per_1m": 5,
2899
  "currency": "USD",
 
2900
  "capabilities": [
2901
  "vision"
2902
  ],
2903
+ "context_window": 1048576,
2904
  "hf_private": true
2905
  },
2906
  {
2907
+ "name": "vertex/claude-haiku-4-5",
2908
  "type": "vision",
2909
  "input_price_per_1m": 1,
2910
  "output_price_per_1m": 5,
 
2912
  "capabilities": [
2913
  "vision"
2914
  ],
2915
+ "context_window": 200000,
2916
  "hf_private": true
2917
  },
2918
+ {
2919
+ "name": "novita/GLM-5",
2920
+ "type": "chat",
2921
+ "input_price_per_1m": 1,
2922
+ "output_price_per_1m": 3.2,
2923
+ "currency": "USD",
2924
+ "capabilities": [
2925
+ "reasoning"
2926
+ ],
2927
+ "context_window": 202800,
2928
+ "hf_id": "zai-org/GLM-5",
2929
+ "size_b": 753.9
2930
+ },
2931
  {
2932
  "name": "bedrock/claude-haiku-4-5",
2933
  "type": "vision",
 
3001
  "context_window": 200000,
3002
  "hf_private": true
3003
  },
 
 
 
 
 
 
 
 
 
3004
  {
3005
  "name": "moonshot/kimi-k2-turbo-preview",
3006
  "type": "chat",
 
3015
  "size_b": 1026.5
3016
  },
3017
  {
3018
+ "name": "together/Qwen/Qwen2.5-72B-Instruct-Turbo",
3019
  "type": "chat",
3020
+ "input_price_per_1m": 1.2,
3021
+ "output_price_per_1m": 1.2,
3022
+ "currency": "USD",
3023
+ "context_window": 32768,
3024
+ "size_b": 72
3025
+ },
3026
+ {
3027
+ "name": "azure/gpt-5",
3028
+ "type": "vision",
3029
  "input_price_per_1m": 1.25,
3030
+ "output_price_per_1m": 10,
3031
  "currency": "USD",
 
3032
  "capabilities": [
 
3033
  "reasoning"
3034
  ],
3035
+ "context_window": 200000,
3036
+ "hf_private": true
3037
  },
3038
  {
3039
+ "name": "azure/gpt-5.1",
3040
  "type": "vision",
3041
  "input_price_per_1m": 1.25,
3042
  "output_price_per_1m": 10,
3043
  "currency": "USD",
3044
  "capabilities": [
 
3045
  "reasoning"
3046
  ],
3047
+ "context_window": 200000,
3048
  "hf_private": true
3049
  },
3050
  {
 
3061
  "hf_private": true
3062
  },
3063
  {
3064
+ "name": "coding/gemini-2.5-pro",
3065
  "type": "vision",
3066
  "input_price_per_1m": 1.25,
3067
  "output_price_per_1m": 10,
3068
  "currency": "USD",
3069
  "capabilities": [
3070
+ "vision",
3071
  "reasoning"
3072
  ],
3073
+ "context_window": 1048576,
3074
  "hf_private": true
3075
  },
3076
  {
3077
+ "name": "together/deepseek-ai/DeepSeek-V3",
3078
+ "type": "chat",
3079
  "input_price_per_1m": 1.25,
3080
+ "output_price_per_1m": 1.25,
3081
  "currency": "USD",
3082
+ "context_window": 131072,
3083
  "capabilities": [
3084
+ "tools",
3085
  "reasoning"
3086
  ],
3087
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3088
+ "size_b": 671
3089
  },
3090
  {
3091
  "name": "google/gemini-2.5-pro",
 
3101
  "hf_private": true
3102
  },
3103
  {
3104
+ "name": "openai-responses/gpt-5.1",
3105
  "type": "vision",
3106
  "input_price_per_1m": 1.25,
3107
  "output_price_per_1m": 10,
 
3114
  "hf_private": true
3115
  },
3116
  {
3117
+ "name": "openai-responses/gpt-5.1-codex",
3118
  "type": "vision",
3119
  "input_price_per_1m": 1.25,
3120
  "output_price_per_1m": 10,
 
3127
  "hf_private": true
3128
  },
3129
  {
3130
+ "name": "openai-responses/gpt-5",
3131
  "type": "vision",
3132
  "input_price_per_1m": 1.25,
3133
  "output_price_per_1m": 10,
 
3140
  "hf_private": true
3141
  },
3142
  {
3143
+ "name": "openai-responses/gpt-5-codex",
3144
  "type": "vision",
3145
  "input_price_per_1m": 1.25,
3146
  "output_price_per_1m": 10,
 
3153
  "hf_private": true
3154
  },
3155
  {
3156
+ "name": "openai/gpt-5.1",
3157
  "type": "vision",
3158
  "input_price_per_1m": 1.25,
3159
  "output_price_per_1m": 10,
 
3162
  "vision",
3163
  "reasoning"
3164
  ],
3165
+ "context_window": 400000,
3166
  "hf_private": true
3167
  },
3168
  {
3169
+ "name": "openai/gpt-5.1-chat",
3170
  "type": "vision",
3171
  "input_price_per_1m": 1.25,
3172
  "output_price_per_1m": 10,
 
3175
  "vision",
3176
  "reasoning"
3177
  ],
3178
+ "context_window": 128000,
3179
  "hf_private": true
3180
  },
3181
  {
3182
+ "name": "openai/gpt-5-chat",
3183
  "type": "vision",
3184
  "input_price_per_1m": 1.25,
3185
  "output_price_per_1m": 10,
 
3192
  "hf_private": true
3193
  },
3194
  {
3195
+ "name": "novita/sao10k/l31-70b-euryale-v2.2",
3196
  "type": "chat",
3197
  "input_price_per_1m": 1.48,
3198
  "output_price_per_1m": 1.48,
 
3201
  "size_b": 70
3202
  },
3203
  {
3204
+ "name": "novita/sao10k/l3-70b-euryale-v2.1",
3205
  "type": "chat",
3206
  "input_price_per_1m": 1.48,
3207
  "output_price_per_1m": 1.48,
 
3221
  ],
3222
  "hf_private": true
3223
  },
3224
+ {
3225
+ "name": "azure/gpt-5.2",
3226
+ "type": "vision",
3227
+ "input_price_per_1m": 1.75,
3228
+ "output_price_per_1m": 14,
3229
+ "currency": "USD",
3230
+ "capabilities": [
3231
+ "reasoning"
3232
+ ],
3233
+ "context_window": 200000,
3234
+ "hf_private": true
3235
+ },
3236
  {
3237
  "name": "azure/gpt-5.3-codex",
3238
  "type": "vision",
 
3260
  "hf_private": true
3261
  },
3262
  {
3263
+ "name": "openai-responses/gpt-5.3-chat",
3264
  "type": "vision",
3265
  "input_price_per_1m": 1.75,
3266
  "output_price_per_1m": 14,
3267
  "currency": "USD",
3268
  "capabilities": [
3269
+ "vision",
3270
  "reasoning"
3271
  ],
3272
+ "context_window": 128000,
3273
  "hf_private": true
3274
  },
3275
  {
 
3298
  "context_window": 400000,
3299
  "hf_private": true
3300
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
3301
  {
3302
  "name": "openai-responses/gpt-5.2",
3303
  "type": "vision",
 
3312
  "hf_private": true
3313
  },
3314
  {
3315
+ "name": "openai/gpt-5.2",
3316
  "type": "vision",
3317
  "input_price_per_1m": 1.75,
3318
  "output_price_per_1m": 14,
 
3321
  "vision",
3322
  "reasoning"
3323
  ],
3324
+ "context_window": 400000,
3325
  "hf_private": true
3326
  },
3327
  {
3328
+ "name": "openai/gpt-5.2-chat",
3329
  "type": "vision",
3330
  "input_price_per_1m": 1.75,
3331
  "output_price_per_1m": 14,
 
3334
  "vision",
3335
  "reasoning"
3336
  ],
3337
+ "context_window": 128000,
3338
  "hf_private": true
3339
  },
3340
  {
3341
+ "name": "openai/gpt-5.3-chat",
3342
  "type": "vision",
3343
  "input_price_per_1m": 1.75,
3344
  "output_price_per_1m": 14,
 
3360
  "hf_private": true
3361
  },
3362
  {
3363
+ "name": "perplexity/sonar-reasoning-pro",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3364
  "type": "vision",
3365
  "input_price_per_1m": 2,
3366
+ "output_price_per_1m": 8,
3367
  "currency": "USD",
3368
+ "context_window": 131072,
3369
  "capabilities": [
3370
  "vision",
3371
  "reasoning"
3372
  ],
 
3373
  "hf_private": true
3374
  },
3375
  {
3376
+ "name": "azure/gpt-4.1",
3377
  "type": "vision",
3378
  "input_price_per_1m": 2,
3379
  "output_price_per_1m": 8,
 
3385
  "hf_private": true
3386
  },
3387
  {
3388
+ "name": "azure/openai-responses/gpt-4.1",
3389
  "type": "vision",
3390
  "input_price_per_1m": 2,
3391
  "output_price_per_1m": 8,
 
3397
  "hf_private": true
3398
  },
3399
  {
3400
+ "name": "vertex/gemini-3.1-pro-preview",
3401
  "type": "vision",
3402
  "input_price_per_1m": 2,
3403
+ "output_price_per_1m": 12,
3404
  "currency": "USD",
 
3405
  "capabilities": [
3406
  "vision",
3407
  "reasoning"
3408
  ],
3409
+ "context_window": 1048576,
3410
  "hf_private": true
3411
  },
3412
  {
3413
+ "name": "vertex/gemini-3-pro-preview",
3414
  "type": "vision",
3415
  "input_price_per_1m": 2,
3416
  "output_price_per_1m": 12,
 
3423
  "hf_private": true
3424
  },
3425
  {
3426
+ "name": "vertex/gemini-3-pro-image-preview",
3427
  "type": "vision",
3428
  "input_price_per_1m": 2,
3429
  "output_price_per_1m": 12,
 
3435
  "context_window": 1048576,
3436
  "hf_private": true
3437
  },
3438
+ {
3439
+ "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3440
+ "type": "chat",
3441
+ "input_price_per_1m": 2,
3442
+ "output_price_per_1m": 6,
3443
+ "currency": "USD",
3444
+ "context_window": 128000,
3445
+ "hf_private": true
3446
+ },
3447
  {
3448
  "name": "xai/grok-2-1212",
3449
  "type": "chat",
 
3467
  "hf_private": true
3468
  },
3469
  {
3470
+ "name": "google/gemini-3-pro-preview",
3471
  "type": "vision",
3472
  "input_price_per_1m": 2,
3473
+ "output_price_per_1m": 12,
3474
  "currency": "USD",
3475
  "capabilities": [
3476
+ "vision",
3477
+ "reasoning"
3478
  ],
3479
+ "context_window": 1048576,
3480
  "hf_private": true
3481
  },
3482
  {
3483
+ "name": "google/gemini-3.1-pro-preview",
3484
+ "type": "vision",
3485
+ "input_price_per_1m": 2,
3486
+ "output_price_per_1m": 12,
3487
+ "currency": "USD",
3488
+ "capabilities": [
3489
+ "vision",
3490
+ "reasoning"
3491
+ ],
3492
+ "context_window": 1048576,
3493
+ "hf_private": true
3494
+ },
3495
+ {
3496
+ "name": "openai-responses/gpt-4.1",
3497
  "type": "vision",
3498
  "input_price_per_1m": 2,
3499
  "output_price_per_1m": 8,
 
3518
  "hf_private": true
3519
  },
3520
  {
3521
+ "name": "openai/gpt-4.1",
3522
+ "type": "vision",
3523
  "input_price_per_1m": 2,
3524
+ "output_price_per_1m": 8,
3525
  "currency": "USD",
3526
+ "capabilities": [
3527
+ "vision"
3528
+ ],
3529
+ "context_window": 1047576,
3530
  "hf_private": true
3531
  },
3532
  {
 
3568
  "hf_private": true
3569
  },
3570
  {
3571
+ "name": "openai/gpt-4o-2024-08-06",
 
 
 
 
 
 
 
 
 
 
 
 
 
3572
  "type": "vision",
3573
  "input_price_per_1m": 2.5,
3574
  "output_price_per_1m": 10,
 
3580
  "hf_private": true
3581
  },
3582
  {
3583
+ "name": "openai/gpt-5.4",
3584
  "type": "vision",
3585
  "input_price_per_1m": 2.5,
3586
+ "output_price_per_1m": 15,
3587
  "currency": "USD",
3588
  "capabilities": [
3589
+ "vision",
3590
+ "reasoning"
3591
  ],
3592
+ "context_window": 1050000,
3593
  "hf_private": true
3594
  },
3595
  {
 
3605
  "hf_private": true
3606
  },
3607
  {
3608
+ "name": "openai/gpt-4o-2024-05-13",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3609
  "type": "vision",
3610
+ "input_price_per_1m": 2.5,
3611
+ "output_price_per_1m": 10,
3612
  "currency": "USD",
3613
  "capabilities": [
3614
+ "vision"
 
3615
  ],
3616
+ "context_window": 128000,
3617
  "hf_private": true
3618
  },
3619
  {
 
3656
  "hf_private": true
3657
  },
3658
  {
3659
+ "name": "perplexity/sonar-pro",
3660
  "type": "vision",
3661
  "input_price_per_1m": 3,
3662
  "output_price_per_1m": 15,
3663
  "currency": "USD",
3664
+ "context_window": 204800,
3665
  "capabilities": [
3666
  "vision"
3667
  ],
 
3668
  "hf_private": true
3669
  },
3670
  {
 
3707
  "hf_private": true
3708
  },
3709
  {
3710
+ "name": "vertex/claude-3-5-sonnet",
3711
  "type": "vision",
3712
  "input_price_per_1m": 3,
3713
  "output_price_per_1m": 15,
3714
  "currency": "USD",
 
3715
  "capabilities": [
3716
  "vision"
3717
  ],
3718
+ "context_window": 200000,
3719
  "hf_private": true
3720
  },
3721
  {
 
3731
  "hf_private": true
3732
  },
3733
  {
3734
+ "name": "coding/claude-sonnet-4-20250514",
3735
  "type": "vision",
3736
  "input_price_per_1m": 3,
3737
  "output_price_per_1m": 15,
 
3744
  "hf_private": true
3745
  },
3746
  {
3747
+ "name": "together/deepseek-ai/DeepSeek-R1",
3748
+ "type": "chat",
3749
+ "input_price_per_1m": 3,
3750
+ "output_price_per_1m": 7,
3751
+ "currency": "USD",
3752
+ "context_window": 64000,
3753
+ "capabilities": [
3754
+ "tools",
3755
+ "reasoning"
3756
+ ],
3757
+ "hf_id": "deepseek-ai/DeepSeek-R1",
3758
+ "size_b": 671
3759
+ },
3760
+ {
3761
+ "name": "bedrock/claude-sonnet-4",
3762
  "type": "vision",
3763
  "input_price_per_1m": 3,
3764
  "output_price_per_1m": 15,
 
3767
  "vision",
3768
  "reasoning"
3769
  ],
3770
+ "context_window": 200000,
3771
  "hf_private": true
3772
  },
3773
  {
3774
+ "name": "bedrock/claude-3-7-sonnet",
3775
  "type": "vision",
3776
  "input_price_per_1m": 3,
3777
  "output_price_per_1m": 15,
 
3784
  "hf_private": true
3785
  },
3786
  {
3787
+ "name": "bedrock/claude-sonnet-4-5",
3788
  "type": "vision",
3789
  "input_price_per_1m": 3,
3790
  "output_price_per_1m": 15,
 
3796
  "context_window": 200000,
3797
  "hf_private": true
3798
  },
3799
+ {
3800
+ "name": "bedrock/claude-sonnet-4-6",
3801
+ "type": "vision",
3802
+ "input_price_per_1m": 3,
3803
+ "output_price_per_1m": 15,
3804
+ "currency": "USD",
3805
+ "capabilities": [
3806
+ "vision",
3807
+ "reasoning"
3808
+ ],
3809
+ "context_window": 1000000,
3810
+ "hf_private": true
3811
+ },
3812
  {
3813
  "name": "novita/deepseek/deepseek-r1",
3814
  "type": "chat",
 
3824
  "size_b": 671
3825
  },
3826
  {
3827
+ "name": "anthropic/claude-opus-4-5",
3828
  "type": "vision",
3829
  "input_price_per_1m": 5,
3830
  "output_price_per_1m": 25,
 
3833
  "vision",
3834
  "reasoning"
3835
  ],
3836
+ "context_window": 200000,
3837
  "hf_private": true
3838
  },
3839
  {
3840
+ "name": "anthropic/claude-opus-4-6",
3841
  "type": "vision",
3842
  "input_price_per_1m": 5,
3843
  "output_price_per_1m": 25,
 
3846
  "vision",
3847
  "reasoning"
3848
  ],
3849
+ "context_window": 1000000,
3850
  "hf_private": true
3851
  },
3852
  {
3853
+ "name": "vertex/claude-opus-4-6",
3854
  "type": "vision",
3855
  "input_price_per_1m": 5,
3856
  "output_price_per_1m": 25,
 
3859
  "vision",
3860
  "reasoning"
3861
  ],
3862
+ "context_window": 1000000,
3863
  "hf_private": true
3864
  },
3865
  {
3866
+ "name": "vertex/claude-opus-4-5",
3867
  "type": "vision",
3868
  "input_price_per_1m": 5,
3869
  "output_price_per_1m": 25,
 
3872
  "vision",
3873
  "reasoning"
3874
  ],
3875
+ "context_window": 200000,
3876
  "hf_private": true
3877
  },
3878
  {
 
3939
  "hf_private": true
3940
  },
3941
  {
3942
+ "name": "anthropic/claude-opus-4",
3943
  "type": "vision",
3944
  "input_price_per_1m": 15,
3945
  "output_price_per_1m": 75,
 
3952
  "hf_private": true
3953
  },
3954
  {
3955
+ "name": "anthropic/claude-opus-4-1",
3956
  "type": "vision",
3957
  "input_price_per_1m": 15,
3958
  "output_price_per_1m": 75,
 
3965
  "hf_private": true
3966
  },
3967
  {
3968
+ "name": "vertex/claude-opus-4",
3969
  "type": "vision",
3970
  "input_price_per_1m": 15,
3971
  "output_price_per_1m": 75,
 
3978
  "hf_private": true
3979
  },
3980
  {
3981
+ "name": "vertex/claude-opus-4-1",
3982
  "type": "vision",
3983
  "input_price_per_1m": 15,
3984
  "output_price_per_1m": 75,
 
3991
  "hf_private": true
3992
  },
3993
  {
3994
+ "name": "coding/claude-opus-4-20250514",
3995
  "type": "vision",
3996
  "input_price_per_1m": 15,
3997
  "output_price_per_1m": 75,
 
4415
  "output_price_per_1m": 1.5,
4416
  "currency": "USD",
4417
  "flavor": "base",
4418
+ "hf_id": "deepseek-ai/DeepSeek-V3",
4419
+ "size_b": 30.8
4420
  },
4421
  {
4422
  "name": "DeepSeek-V3 (base)",
 
4425
  "output_price_per_1m": 1.5,
4426
  "currency": "USD",
4427
  "flavor": "base",
4428
+ "hf_id": "deepseek-ai/DeepSeek-V3",
4429
+ "size_b": 30.8
4430
  },
4431
  {
4432
  "name": "Llama-3.3-70B-Instruct (fast)",
 
4678
  "input_price_per_1m": 0.01,
4679
  "output_price_per_1m": 0,
4680
  "currency": "USD",
4681
+ "hf_id": "BAAI/bge-multilingual-gemma2",
4682
+ "size_b": 7.4
4683
  },
4684
  {
4685
  "name": "bge-en-icl",
 
4772
  "input_price_per_1m": 0.003,
4773
  "output_price_per_1m": 0,
4774
  "currency": "EUR",
4775
+ "hf_id": "openai/whisper-large-v3",
4776
+ "size_b": 0.7
4777
  },
4778
  {
4779
  "name": "holo2-30b-a3b",
 
4873
  "input_price_per_1m": 0.1,
4874
  "output_price_per_1m": 0,
4875
  "currency": "EUR",
4876
+ "hf_id": "BAAI/bge-multilingual-gemma2",
4877
+ "size_b": 7.4
4878
  },
4879
  {
4880
  "name": "llama-3.1-8b-instruct",
 
4934
  ],
4935
  "size_b": 122.61,
4936
  "hf_id": "mistralai/Mistral-Large-Instruct-2411",
4937
+ "hf_private": true,
4938
+ "ollama_id": "mistral-large"
4939
  },
4940
  {
4941
  "name": "Mistral Small 4",
 
5191
  "tools"
5192
  ],
5193
  "hf_id": "mistralai/Mistral-Nemo-Instruct-2407",
5194
+ "size_b": 12,
5195
+ "ollama_id": "mistral-nemo"
5196
  },
5197
  {
5198
  "name": "Mistral 7B",
 
5214
  "capabilities": [
5215
  "tools"
5216
  ],
5217
+ "hf_id": "mistralai/Mixtral-8x7B-Instruct-v0.1",
5218
+ "ollama_id": "mixtral"
5219
  },
5220
  {
5221
  "name": "Mixtral 8x22B",
 
5228
  "capabilities": [
5229
  "tools"
5230
  ],
5231
+ "hf_id": "mistralai/Mixtral-8x22B-Instruct-v0.1",
5232
+ "ollama_id": "mixtral-8x22b"
5233
  }
5234
  ]
5235
  },
 
6755
  "hf_id": "MiniMaxAI/MiniMax-Text-01",
6756
  "capabilities": [
6757
  "vision"
6758
+ ],
6759
+ "size_b": 366.1
6760
  },
6761
  {
6762
  "name": "qwen/qwen-2.5-vl-7b-instruct",
 
6903
  "capabilities": [
6904
  "tools",
6905
  "reasoning"
6906
+ ],
6907
+ "size_b": 30.8
6908
  },
6909
  {
6910
  "name": "inception/mercury",
 
7081
  "capabilities": [
7082
  "tools",
7083
  "reasoning"
7084
+ ],
7085
+ "size_b": 30.8
7086
  },
7087
  {
7088
  "name": "baidu/ernie-4.5-300b-a47b",
 
7329
  "hf_id": "deepseek-ai/DeepSeek-V3.2-Speciale",
7330
  "capabilities": [
7331
  "reasoning"
7332
+ ],
7333
+ "size_b": 30.8
7334
  },
7335
  {
7336
  "name": "moonshotai/kimi-k2-0905",
 
9618
  "input_price_per_1m": 0.111,
9619
  "output_price_per_1m": 0,
9620
  "currency": "USD",
9621
+ "hf_id": "openai/whisper-large-v3",
9622
+ "size_b": 0.7
9623
  },
9624
  {
9625
  "name": "Whisper Large v3 Turbo",
 
9627
  "input_price_per_1m": 0.04,
9628
  "output_price_per_1m": 0,
9629
  "currency": "USD",
9630
+ "hf_id": "openai/whisper-large-v3-turbo",
9631
+ "size_b": 0.7
9632
  }
9633
  ]
9634
  },
scripts/fetch-providers.js CHANGED
@@ -81,7 +81,7 @@ function updateProviderModels(providers, providerName, models) {
81
  const normName = (s) =>
82
  s.toLowerCase().replace(/[-_.:]/g, ' ').replace(/[^a-z0-9 ]/g, '').replace(/\s+/g, ' ').trim();
83
 
84
- // Build an index of normalized OpenRouter model-part → { capabilities, type, size_b, hf_id, hf_private }
85
  // Only includes entries that carry non-trivial capability data.
86
  function buildOrIndex(orProvider) {
87
  if (!orProvider) return [];
@@ -96,6 +96,7 @@ function buildOrIndex(orProvider) {
96
  type: m.type,
97
  size_b: m.size_b,
98
  hf_id: m.hf_id,
 
99
  hf_private: m.hf_private,
100
  });
101
  }
@@ -103,7 +104,7 @@ function buildOrIndex(orProvider) {
103
  }
104
 
105
  // For a given model name, find the best matching OpenRouter index entry.
106
- // Returns { capabilities, type, size_b, hf_id, hf_private } or null.
107
  function findOrMatch(modelName, orIndex) {
108
  // Use the model part (after last '/') for matching, strip :region/@suffix
109
  const raw = modelName.replace(/@[^/]+$/, '').replace(/:[^/]+$/, '');
@@ -163,11 +164,20 @@ function estimateParams(config) {
163
  const l = config.num_hidden_layers || config.n_layer;
164
  const v = config.vocab_size;
165
  const i = config.intermediate_size || config.d_ff;
 
166
 
167
  if (h && l && v) {
168
- // Basic transformer param estimation: Layers * (Embedding + Attention + MLP)
169
  const intermediate = i || (4 * h);
170
- const params = (v * h) + l * (4 * (h * h) + 2 * (h * intermediate));
 
 
 
 
 
 
 
 
 
171
  return params;
172
  }
173
  return null;
@@ -179,24 +189,31 @@ async function fetchHFSize(hfId) {
179
  const token = process.env.HF_TOKEN;
180
  const headers = token ? { Authorization: `Bearer ${token}` } : {};
181
  try {
182
- // Limit to 1 retry for technical metadata lookups
183
  const data = await getJson(`https://huggingface.co/api/models/${hfId}`, { headers, retries: 1 });
184
 
185
- // Check various common metadata locations for total parameters
186
  let params = data.safetensors?.total || data.config?.total_parameters || data.config?.model_type_params;
187
 
188
- // Fallback: cardData
189
  if (!params && data.cardData?.model_details?.parameters) {
190
  const match = data.cardData.model_details.parameters.match(/([\d.]+)\s*[Bb]/);
191
  if (match) params = parseFloat(match[1]) * 1_000_000_000;
192
  }
193
 
194
- // Fallback: vLLM-style estimation from config
195
- if (!params && data.config) {
196
- params = estimateParams(data.config);
 
 
 
 
197
  }
198
 
199
- if (!params) return { error: 'No parameter data in Hub metadata' };
 
 
 
 
200
 
201
  const b = params / 1_000_000_000;
202
  // Keep 2 decimals for small models (<1B), 1 decimal for others
@@ -242,13 +259,16 @@ const EMBEDDER_KEYWORDS = ['embed', 'bge', 'gte', 'e5', 'stella', 'minilm', 'mul
242
  const MANUAL_HF_ID_MAP = {
243
  'all minilm l12 v2': 'sentence-transformers/all-MiniLM-L12-v2',
244
  'whisper v3': 'openai/whisper-large-v3',
245
- 'whisper v3 large': 'openai/whisper-large-v3',
246
  'whisper large v3': 'openai/whisper-large-v3',
 
247
  'whisper large v3 turbo': 'openai/whisper-large-v3-turbo',
248
  'step 3 5 flash': 'stepfun-ai/Step-3.5-Flash',
249
  'bge m3': 'BAAI/bge-m3',
250
  'bge en icl': 'BAAI/bge-en-icl',
 
 
251
  'lightonocr 2': 'lightonai/LightOnOCR-2-1B',
 
252
  'sdxl': 'stabilityai/stable-diffusion-xl-base-1.0',
253
  'flux 1 schnell': 'black-forest-labs/FLUX.1-schnell',
254
  'flux schnell': 'black-forest-labs/FLUX.1-schnell',
@@ -261,10 +281,13 @@ const MANUAL_HF_ID_MAP = {
261
  // Qwen
262
  'qwen turbo': 'Alibaba/Qwen-Turbo',
263
  'alibaba qwen turbo': 'Alibaba/Qwen-Turbo',
 
264
  'qwen plus': 'Alibaba/Qwen-Plus',
265
  'alibaba qwen plus': 'Alibaba/Qwen-Plus',
 
266
  'qwen max': 'Alibaba/Qwen-Max',
267
  'alibaba qwen max': 'Alibaba/Qwen-Max',
 
268
  'qwen 3 coder flash': 'Qwen/Qwen2.5-Coder-7B-Instruct',
269
  'qwen3 coder flash': 'Qwen/Qwen2.5-Coder-7B-Instruct',
270
  'qwen 3 coder plus': 'Qwen/Qwen2.5-Coder-32B-Instruct',
@@ -341,6 +364,15 @@ const MANUAL_OLLAMA_ID_MAP = {
341
  'gemma 2 27b': 'gemma2:27b',
342
  'qwen 2 5 coder 7b': 'qwen2.5-coder:7b',
343
  'qwen 2 5 coder 32b': 'qwen2.5-coder:32b',
 
 
 
 
 
 
 
 
 
344
  };
345
 
346
  const PROPRIETARY_KEYWORDS = [
 
81
  const normName = (s) =>
82
  s.toLowerCase().replace(/[-_.:]/g, ' ').replace(/[^a-z0-9 ]/g, '').replace(/\s+/g, ' ').trim();
83
 
84
+ // Build an index of normalized OpenRouter model-part → { capabilities, type, size_b, hf_id, ollama_id, hf_private }
85
  // Only includes entries that carry non-trivial capability data.
86
  function buildOrIndex(orProvider) {
87
  if (!orProvider) return [];
 
96
  type: m.type,
97
  size_b: m.size_b,
98
  hf_id: m.hf_id,
99
+ ollama_id: m.ollama_id,
100
  hf_private: m.hf_private,
101
  });
102
  }
 
104
  }
105
 
106
  // For a given model name, find the best matching OpenRouter index entry.
107
+ // Returns metadata object or null.
108
  function findOrMatch(modelName, orIndex) {
109
  // Use the model part (after last '/') for matching, strip :region/@suffix
110
  const raw = modelName.replace(/@[^/]+$/, '').replace(/:[^/]+$/, '');
 
164
  const l = config.num_hidden_layers || config.n_layer;
165
  const v = config.vocab_size;
166
  const i = config.intermediate_size || config.d_ff;
167
+ const numExperts = config.num_local_experts || config.n_experts || 1;
168
 
169
  if (h && l && v) {
 
170
  const intermediate = i || (4 * h);
171
+ // Embedding parameters
172
+ const vocabParams = v * h;
173
+ const posParams = (config.max_position_embeddings || 512) * h;
174
+ const typeParams = (config.type_vocab_size || 0) * h;
175
+ const embedParams = vocabParams + posParams + typeParams;
176
+
177
+ // Layer parameters (Attention + MLP)
178
+ const mlpParams = 2 * h * intermediate * numExperts;
179
+ const attentionParams = 4 * (h * h);
180
+ const params = embedParams + l * (attentionParams + mlpParams);
181
  return params;
182
  }
183
  return null;
 
189
  const token = process.env.HF_TOKEN;
190
  const headers = token ? { Authorization: `Bearer ${token}` } : {};
191
  try {
192
+ // 1. Get top-level metadata
193
  const data = await getJson(`https://huggingface.co/api/models/${hfId}`, { headers, retries: 1 });
194
 
 
195
  let params = data.safetensors?.total || data.config?.total_parameters || data.config?.model_type_params;
196
 
197
+ // 2. Fallback: cardData
198
  if (!params && data.cardData?.model_details?.parameters) {
199
  const match = data.cardData.model_details.parameters.match(/([\d.]+)\s*[Bb]/);
200
  if (match) params = parseFloat(match[1]) * 1_000_000_000;
201
  }
202
 
203
+ // 3. Fallback: vLLM-style estimation from config
204
+ // If the API config is "minified", fetch the raw config.json file
205
+ let config = data.config;
206
+ if (!params && (!config || !config.hidden_size)) {
207
+ try {
208
+ config = await getJson(`https://huggingface.co/${hfId}/raw/main/config.json`, { headers, retries: 1 });
209
+ } catch (e) { /* ignore raw config fetch failure */ }
210
  }
211
 
212
+ if (!params && config) {
213
+ params = estimateParams(config);
214
+ }
215
+
216
+ if (!params) return { error: 'No parameter data' };
217
 
218
  const b = params / 1_000_000_000;
219
  // Keep 2 decimals for small models (<1B), 1 decimal for others
 
259
  const MANUAL_HF_ID_MAP = {
260
  'all minilm l12 v2': 'sentence-transformers/all-MiniLM-L12-v2',
261
  'whisper v3': 'openai/whisper-large-v3',
 
262
  'whisper large v3': 'openai/whisper-large-v3',
263
+ 'whisper v3 large': 'openai/whisper-large-v3',
264
  'whisper large v3 turbo': 'openai/whisper-large-v3-turbo',
265
  'step 3 5 flash': 'stepfun-ai/Step-3.5-Flash',
266
  'bge m3': 'BAAI/bge-m3',
267
  'bge en icl': 'BAAI/bge-en-icl',
268
+ 'bge large en v1 5': 'BAAI/bge-large-en-v1.5',
269
+ 'bge multilingual gemma2': 'BAAI/bge-multilingual-gemma2',
270
  'lightonocr 2': 'lightonai/LightOnOCR-2-1B',
271
+
272
  'sdxl': 'stabilityai/stable-diffusion-xl-base-1.0',
273
  'flux 1 schnell': 'black-forest-labs/FLUX.1-schnell',
274
  'flux schnell': 'black-forest-labs/FLUX.1-schnell',
 
281
  // Qwen
282
  'qwen turbo': 'Alibaba/Qwen-Turbo',
283
  'alibaba qwen turbo': 'Alibaba/Qwen-Turbo',
284
+ 'qwen qwen turbo': 'Alibaba/Qwen-Turbo',
285
  'qwen plus': 'Alibaba/Qwen-Plus',
286
  'alibaba qwen plus': 'Alibaba/Qwen-Plus',
287
+ 'qwen qwen plus': 'Alibaba/Qwen-Plus',
288
  'qwen max': 'Alibaba/Qwen-Max',
289
  'alibaba qwen max': 'Alibaba/Qwen-Max',
290
+ 'qwen qwen max': 'Alibaba/Qwen-Max',
291
  'qwen 3 coder flash': 'Qwen/Qwen2.5-Coder-7B-Instruct',
292
  'qwen3 coder flash': 'Qwen/Qwen2.5-Coder-7B-Instruct',
293
  'qwen 3 coder plus': 'Qwen/Qwen2.5-Coder-32B-Instruct',
 
364
  'gemma 2 27b': 'gemma2:27b',
365
  'qwen 2 5 coder 7b': 'qwen2.5-coder:7b',
366
  'qwen 2 5 coder 32b': 'qwen2.5-coder:32b',
367
+ 'mistral large 2411': 'mistral-large',
368
+ 'mistral large 3': 'mistral-large',
369
+ 'phi 3 5 mini': 'phi3.5',
370
+ 'phi 3 5 vision': 'phi3.5-vision',
371
+ 'qwen 2 5 7b': 'qwen2.5:7b',
372
+ 'qwen 2 5 72b': 'qwen2.5:72b',
373
+ 'mistral nemo': 'mistral-nemo',
374
+ 'mixtral 8x7b': 'mixtral',
375
+ 'mixtral 8x22b': 'mixtral-8x22b',
376
  };
377
 
378
  const PROPRIETARY_KEYWORDS = [