CrispStrobe commited on
Commit
bffabba
Β·
1 Parent(s): ab19dc2

fix: optimize HF Hub lookups with smart merging, limited retries, and detailed logging

Browse files
Files changed (2) hide show
  1. data/providers.json +725 -666
  2. scripts/fetch-providers.js +55 -14
data/providers.json CHANGED
@@ -133,7 +133,9 @@
133
  "type": "embedding",
134
  "input_price_per_1m": 0.02,
135
  "output_price_per_1m": 0,
136
- "currency": "USD"
 
 
137
  }
138
  ],
139
  "lastUpdated": "2026-03-02T04:54:46.028Z"
@@ -1036,13 +1038,26 @@
1036
  "hf_id": "meta-llama/Meta-Llama-3-8B-Instruct"
1037
  },
1038
  {
1039
- "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
1040
  "type": "chat",
1041
  "input_price_per_1m": 0.05,
1042
- "output_price_per_1m": 0.05,
1043
  "currency": "USD",
1044
- "context_window": 8192,
1045
- "size_b": 8
 
 
 
 
 
 
 
 
 
 
 
 
 
1046
  },
1047
  {
1048
  "name": "novita/meta-llama/llama-3.1-8b-instruct",
@@ -1067,38 +1082,25 @@
1067
  "size_b": 8
1068
  },
1069
  {
1070
- "name": "openai-responses/gpt-5-nano",
1071
- "type": "vision",
1072
  "input_price_per_1m": 0.05,
1073
- "output_price_per_1m": 0.4,
1074
  "currency": "USD",
1075
- "capabilities": [
1076
- "vision",
1077
- "reasoning"
1078
- ],
1079
- "context_window": 400000
1080
  },
1081
  {
1082
- "name": "azure/gpt-5-nano",
1083
  "type": "vision",
1084
  "input_price_per_1m": 0.05,
1085
  "output_price_per_1m": 0.4,
1086
  "currency": "USD",
1087
  "capabilities": [
 
1088
  "reasoning"
1089
  ],
1090
- "context_window": 200000
1091
- },
1092
- {
1093
- "name": "alibaba/qwen-turbo",
1094
- "type": "chat",
1095
- "input_price_per_1m": 0.05,
1096
- "output_price_per_1m": 0.2,
1097
- "currency": "USD",
1098
- "context_window": 1000000,
1099
- "capabilities": [
1100
- "tools"
1101
- ]
1102
  },
1103
  {
1104
  "name": "together/meta-llama/Llama-3.2-3B-Instruct-Turbo",
@@ -1110,21 +1112,21 @@
1110
  "size_b": 3
1111
  },
1112
  {
1113
- "name": "deepinfra/microsoft/phi-4",
1114
  "type": "chat",
1115
  "input_price_per_1m": 0.07,
1116
- "output_price_per_1m": 0.14,
1117
  "currency": "USD",
1118
- "context_window": 16384
 
1119
  },
1120
  {
1121
- "name": "deepinfra/Qwen/Qwen2.5-Coder-32B-Instruct",
1122
  "type": "chat",
1123
  "input_price_per_1m": 0.07,
1124
- "output_price_per_1m": 0.16,
1125
  "currency": "USD",
1126
- "context_window": 16384,
1127
- "size_b": 32
1128
  },
1129
  {
1130
  "name": "novita/gryphe/mythomax-l2-13b",
@@ -1136,16 +1138,18 @@
1136
  "size_b": 13
1137
  },
1138
  {
1139
- "name": "vertex/gemini-2.5-flash-lite",
1140
- "type": "vision",
1141
  "input_price_per_1m": 0.1,
1142
- "output_price_per_1m": 0.4,
1143
  "currency": "USD",
 
 
1144
  "capabilities": [
1145
- "vision",
1146
  "reasoning"
1147
  ],
1148
- "context_window": 1048576
1149
  },
1150
  {
1151
  "name": "openai/gpt-4.1-nano",
@@ -1159,27 +1163,30 @@
1159
  "context_window": 1047576
1160
  },
1161
  {
1162
- "name": "mistral/devstral-small-latest",
1163
- "type": "chat",
1164
  "input_price_per_1m": 0.1,
1165
- "output_price_per_1m": 0.3,
1166
  "currency": "USD",
1167
- "context_window": 131072,
1168
  "capabilities": [
1169
- "tools"
1170
  ],
1171
- "hf_id": "mistralai/Devstral-Small-2507"
1172
  },
1173
  {
1174
- "name": "mistral/mistral-small-2503",
1175
- "type": "chat",
1176
  "input_price_per_1m": 0.1,
1177
- "output_price_per_1m": 0.3,
1178
  "currency": "USD",
1179
- "context_window": 32768
 
 
 
 
1180
  },
1181
  {
1182
- "name": "mistral/devstral-small-2507",
1183
  "type": "chat",
1184
  "input_price_per_1m": 0.1,
1185
  "output_price_per_1m": 0.3,
@@ -1191,41 +1198,27 @@
1191
  "hf_id": "mistralai/Devstral-Small-2507"
1192
  },
1193
  {
1194
- "name": "openai-responses/gpt-4.1-nano",
1195
- "type": "vision",
1196
- "input_price_per_1m": 0.1,
1197
- "output_price_per_1m": 0.4,
1198
- "currency": "USD",
1199
- "capabilities": [
1200
- "vision"
1201
- ],
1202
- "context_window": 1047576
1203
- },
1204
- {
1205
- "name": "together/meta-llama/Meta-Llama-3-8B-Instruct-Lite",
1206
  "type": "chat",
1207
  "input_price_per_1m": 0.1,
1208
- "output_price_per_1m": 0.1,
1209
  "currency": "USD",
1210
- "context_window": 8192,
1211
- "size_b": 8
1212
  },
1213
  {
1214
- "name": "deepinfra/Qwen/Qwen3-32B",
1215
  "type": "chat",
1216
  "input_price_per_1m": 0.1,
1217
  "output_price_per_1m": 0.3,
1218
  "currency": "USD",
1219
- "context_window": 40000,
1220
- "size_b": 32,
1221
  "capabilities": [
1222
- "tools",
1223
- "reasoning"
1224
  ],
1225
- "hf_id": "Qwen/Qwen3-32B"
1226
  },
1227
  {
1228
- "name": "google/gemini-2.5-flash-lite",
1229
  "type": "vision",
1230
  "input_price_per_1m": 0.1,
1231
  "output_price_per_1m": 0.4,
@@ -1237,7 +1230,7 @@
1237
  "context_window": 1048576
1238
  },
1239
  {
1240
- "name": "google/gemini-2.0-flash-001",
1241
  "type": "vision",
1242
  "input_price_per_1m": 0.1,
1243
  "output_price_per_1m": 0.4,
@@ -1245,10 +1238,10 @@
1245
  "capabilities": [
1246
  "vision"
1247
  ],
1248
- "context_window": 1048576
1249
  },
1250
  {
1251
- "name": "azure/openai-responses/gpt-4.1-nano",
1252
  "type": "vision",
1253
  "input_price_per_1m": 0.1,
1254
  "output_price_per_1m": 0.4,
@@ -1259,7 +1252,16 @@
1259
  "context_window": 1047576
1260
  },
1261
  {
1262
- "name": "azure/gpt-4.1-nano",
 
 
 
 
 
 
 
 
 
1263
  "type": "vision",
1264
  "input_price_per_1m": 0.1,
1265
  "output_price_per_1m": 0.4,
@@ -1270,18 +1272,18 @@
1270
  "context_window": 1047576
1271
  },
1272
  {
1273
- "name": "groq/openai/gpt-oss-20b",
1274
  "type": "chat",
1275
  "input_price_per_1m": 0.1,
1276
- "output_price_per_1m": 0.5,
1277
  "currency": "USD",
1278
- "context_window": 131072,
1279
- "size_b": 20,
1280
  "capabilities": [
1281
  "tools",
1282
  "reasoning"
1283
  ],
1284
- "hf_id": "openai/gpt-oss-20b"
1285
  },
1286
  {
1287
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo",
@@ -1331,18 +1333,18 @@
1331
  "size_b": 8
1332
  },
1333
  {
1334
- "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
1335
  "type": "chat",
1336
  "input_price_per_1m": 0.15,
1337
- "output_price_per_1m": 0.15,
1338
  "currency": "USD",
1339
- "context_window": 128000,
1340
- "size_b": 14,
1341
  "capabilities": [
1342
  "tools",
1343
  "reasoning"
1344
  ],
1345
- "hf_id": "deepseek-ai/DeepSeek-R1"
1346
  },
1347
  {
1348
  "name": "openai/gpt-4o-mini",
@@ -1356,16 +1358,26 @@
1356
  "context_window": 128000
1357
  },
1358
  {
1359
- "name": "mistral/mistral-small-latest",
1360
- "type": "vision",
1361
  "input_price_per_1m": 0.15,
1362
  "output_price_per_1m": 0.6,
1363
  "currency": "USD",
1364
  "capabilities": [
1365
- "vision",
1366
  "reasoning"
1367
  ],
1368
- "context_window": 256000
 
 
 
 
 
 
 
 
 
 
 
1369
  },
1370
  {
1371
  "name": "mistral/mistral-small-2603",
@@ -1382,40 +1394,30 @@
1382
  "hf_id": "mistralai/Mistral-Small-4-119B-2603"
1383
  },
1384
  {
1385
- "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1386
- "type": "chat",
1387
- "input_price_per_1m": 0.15,
1388
- "output_price_per_1m": 0.85,
1389
- "currency": "USD",
1390
- "context_window": 262144,
1391
- "size_b": 235
1392
- },
1393
- {
1394
- "name": "nebius/openai/gpt-oss-120b",
1395
- "type": "chat",
1396
  "input_price_per_1m": 0.15,
1397
  "output_price_per_1m": 0.6,
1398
  "currency": "USD",
1399
  "capabilities": [
 
1400
  "reasoning"
1401
  ],
1402
- "context_window": 131000,
1403
- "size_b": 120,
1404
- "hf_id": "openai/gpt-oss-120b"
1405
  },
1406
  {
1407
- "name": "groq/openai/gpt-oss-120b",
1408
  "type": "chat",
1409
  "input_price_per_1m": 0.15,
1410
- "output_price_per_1m": 0.75,
1411
  "currency": "USD",
1412
- "context_window": 131072,
1413
- "size_b": 120,
1414
  "capabilities": [
1415
  "tools",
1416
  "reasoning"
1417
  ],
1418
- "hf_id": "openai/gpt-oss-120b"
1419
  },
1420
  {
1421
  "name": "novita/mistralai/mistral-nemo",
@@ -1439,18 +1441,29 @@
1439
  "size_b": 8
1440
  },
1441
  {
1442
- "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1443
  "type": "vision",
1444
  "input_price_per_1m": 0.2,
1445
- "output_price_per_1m": 0.85,
1446
  "currency": "USD",
1447
- "context_window": 1048576,
1448
- "size_b": 17,
1449
  "capabilities": [
1450
  "vision",
1451
- "tools"
1452
  ],
1453
- "hf_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct"
 
 
 
 
 
 
 
 
 
 
 
 
 
1454
  },
1455
  {
1456
  "name": "novita/qwen/qwen3-235b-a22b-fp8",
@@ -1467,44 +1480,34 @@
1467
  "hf_id": "Qwen/Qwen3-235B-A22B"
1468
  },
1469
  {
1470
- "name": "openai/gpt-5.4-nano",
1471
  "type": "vision",
1472
  "input_price_per_1m": 0.2,
1473
- "output_price_per_1m": 1.25,
1474
  "currency": "USD",
 
 
1475
  "capabilities": [
1476
  "vision",
1477
- "reasoning"
1478
  ],
1479
- "context_window": 400000
1480
  },
1481
  {
1482
- "name": "openai-responses/gpt-5.4-nano",
1483
  "type": "vision",
1484
  "input_price_per_1m": 0.2,
1485
- "output_price_per_1m": 1.25,
1486
  "currency": "USD",
 
1487
  "capabilities": [
1488
  "vision",
1489
- "reasoning"
1490
- ],
1491
- "context_window": 400000
1492
- },
1493
- {
1494
- "name": "xai/grok-4-fast-non-reasoning",
1495
- "type": "vision",
1496
- "input_price_per_1m": 0.2,
1497
- "output_price_per_1m": 0.5,
1498
- "currency": "USD",
1499
- "context_window": 2000000,
1500
- "capabilities": [
1501
- "vision",
1502
- "tools",
1503
  "reasoning"
1504
  ]
1505
  },
1506
  {
1507
- "name": "xai/grok-4-1-fast-non-reasoning",
1508
  "type": "vision",
1509
  "input_price_per_1m": 0.2,
1510
  "output_price_per_1m": 0.5,
@@ -1515,15 +1518,15 @@
1515
  "context_window": 2000000
1516
  },
1517
  {
1518
- "name": "xai/grok-code-fast-1",
1519
  "type": "vision",
1520
  "input_price_per_1m": 0.2,
1521
- "output_price_per_1m": 1.5,
1522
  "currency": "USD",
1523
  "capabilities": [
1524
  "vision"
1525
  ],
1526
- "context_window": 256000
1527
  },
1528
  {
1529
  "name": "xai/grok-4-fast",
@@ -1539,15 +1542,15 @@
1539
  ]
1540
  },
1541
  {
1542
- "name": "xai/grok-4-1-fast-reasoning",
1543
  "type": "vision",
1544
  "input_price_per_1m": 0.2,
1545
- "output_price_per_1m": 0.5,
1546
  "currency": "USD",
1547
  "capabilities": [
1548
  "vision"
1549
  ],
1550
- "context_window": 2000000
1551
  },
1552
  {
1553
  "name": "together/meta-llama/LlamaGuard-2-8b",
@@ -1559,18 +1562,16 @@
1559
  "size_b": 8
1560
  },
1561
  {
1562
- "name": "deepinfra/zai-org/GLM-4.5-Air",
1563
- "type": "chat",
1564
  "input_price_per_1m": 0.2,
1565
- "output_price_per_1m": 1.1,
1566
  "currency": "USD",
1567
- "context_window": 131072,
1568
  "capabilities": [
1569
- "tools",
1570
  "reasoning"
1571
  ],
1572
- "hf_id": "zai-org/GLM-4.5-Air",
1573
- "size_b": 110.5
1574
  },
1575
  {
1576
  "name": "deepinfra/Qwen/Qwen3-235B-A22B",
@@ -1587,17 +1588,31 @@
1587
  "hf_id": "Qwen/Qwen3-235B-A22B"
1588
  },
1589
  {
1590
- "name": "alibaba/qwen3-30b-a3b-instruct-2507",
1591
- "type": "vision",
1592
  "input_price_per_1m": 0.2,
1593
- "output_price_per_1m": 0.8,
1594
  "currency": "USD",
 
1595
  "capabilities": [
1596
- "vision"
 
1597
  ],
 
 
 
 
 
 
 
 
 
1598
  "context_window": 131072,
1599
- "size_b": 30,
1600
- "hf_id": "Qwen/Qwen3-30B-A3B-Instruct-2507"
 
 
 
1601
  },
1602
  {
1603
  "name": "deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
@@ -1635,20 +1650,7 @@
1635
  "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct"
1636
  },
1637
  {
1638
- "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct",
1639
- "type": "chat",
1640
- "input_price_per_1m": 0.23,
1641
- "output_price_per_1m": 0.4,
1642
- "currency": "USD",
1643
- "context_window": 131072,
1644
- "size_b": 70,
1645
- "capabilities": [
1646
- "tools"
1647
- ],
1648
- "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
1649
- },
1650
- {
1651
- "name": "vertex/gemini-3.1-flash-lite-preview",
1652
  "type": "vision",
1653
  "input_price_per_1m": 0.25,
1654
  "output_price_per_1m": 1.5,
@@ -1668,38 +1670,38 @@
1668
  "size_b": 7
1669
  },
1670
  {
1671
- "name": "openai-responses/gpt-5-mini",
1672
  "type": "vision",
1673
  "input_price_per_1m": 0.25,
1674
- "output_price_per_1m": 2,
1675
  "currency": "USD",
1676
  "capabilities": [
1677
- "vision",
1678
- "reasoning"
1679
  ],
1680
- "context_window": 400000
1681
  },
1682
  {
1683
- "name": "google/gemini-3.1-flash-lite-preview",
1684
  "type": "vision",
1685
  "input_price_per_1m": 0.25,
1686
- "output_price_per_1m": 1.5,
1687
  "currency": "USD",
1688
  "capabilities": [
1689
- "vision"
1690
  ],
1691
- "context_window": 1048576
1692
  },
1693
  {
1694
- "name": "azure/gpt-5-mini",
1695
  "type": "vision",
1696
  "input_price_per_1m": 0.25,
1697
  "output_price_per_1m": 2,
1698
  "currency": "USD",
1699
  "capabilities": [
 
1700
  "reasoning"
1701
  ],
1702
- "context_window": 200000
1703
  },
1704
  {
1705
  "name": "novita/deepseek/deepseek-v3.2",
@@ -1711,7 +1713,8 @@
1711
  "reasoning"
1712
  ],
1713
  "context_window": 163840,
1714
- "hf_id": "deepseek-ai/DeepSeek-V3.2"
 
1715
  },
1716
  {
1717
  "name": "deepseek/deepseek-chat",
@@ -1734,46 +1737,53 @@
1734
  "context_window": 128000
1735
  },
1736
  {
1737
- "name": "novita/minimax-m2.7",
1738
- "type": "vision",
1739
  "input_price_per_1m": 0.3,
1740
  "output_price_per_1m": 1.2,
1741
  "currency": "USD",
1742
  "capabilities": [
1743
- "vision",
1744
  "reasoning"
1745
  ],
1746
  "context_window": 200000,
1747
- "hf_id": "MiniMaxAI/MiniMax-M2.7"
 
1748
  },
1749
  {
1750
- "name": "novita/deepseek/deepseek-r1-distill-qwen-32b",
1751
  "type": "chat",
1752
  "input_price_per_1m": 0.3,
1753
- "output_price_per_1m": 0.3,
1754
  "currency": "USD",
1755
- "context_window": 12800,
1756
- "size_b": 32,
1757
  "capabilities": [
1758
  "reasoning"
1759
  ],
1760
- "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
 
 
1761
  },
1762
  {
1763
- "name": "novita/MiniMax-M2.7",
 
 
 
 
 
 
 
 
 
1764
  "type": "vision",
1765
  "input_price_per_1m": 0.3,
1766
- "output_price_per_1m": 1.2,
1767
  "currency": "USD",
1768
  "capabilities": [
1769
- "vision",
1770
- "reasoning"
1771
  ],
1772
- "context_window": 200000,
1773
- "hf_id": "MiniMaxAI/MiniMax-M2.7"
1774
  },
1775
  {
1776
- "name": "vertex/gemini-2.5-flash",
1777
  "type": "vision",
1778
  "input_price_per_1m": 0.3,
1779
  "output_price_per_1m": 2.5,
@@ -1785,7 +1795,15 @@
1785
  "context_window": 1048576
1786
  },
1787
  {
1788
- "name": "vertex/gemini-2.5-flash-image",
 
 
 
 
 
 
 
 
1789
  "type": "vision",
1790
  "input_price_per_1m": 0.3,
1791
  "output_price_per_1m": 2.5,
@@ -1797,7 +1815,7 @@
1797
  "context_window": 1048576
1798
  },
1799
  {
1800
- "name": "coding/gemini-2.5-flash",
1801
  "type": "vision",
1802
  "input_price_per_1m": 0.3,
1803
  "output_price_per_1m": 2.5,
@@ -1809,90 +1827,71 @@
1809
  "context_window": 1048576
1810
  },
1811
  {
1812
- "name": "mistral/codestral-latest",
1813
- "type": "chat",
1814
- "input_price_per_1m": 0.3,
1815
- "output_price_per_1m": 0.9,
1816
- "currency": "USD",
1817
- "context_window": 131072
1818
- },
1819
- {
1820
- "name": "xai/grok-3-mini",
1821
- "type": "chat",
1822
  "input_price_per_1m": 0.3,
1823
- "output_price_per_1m": 0.5,
1824
  "currency": "USD",
1825
  "capabilities": [
 
1826
  "reasoning"
1827
  ],
1828
- "context_window": 131072
 
1829
  },
1830
  {
1831
- "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
1832
  "type": "chat",
1833
  "input_price_per_1m": 0.3,
1834
  "output_price_per_1m": 0.3,
1835
  "currency": "USD",
1836
- "context_window": 32768,
1837
- "size_b": 7
1838
- },
1839
- {
1840
- "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
1841
- "type": "chat",
1842
- "input_price_per_1m": 0.3,
1843
- "output_price_per_1m": 1,
1844
- "currency": "USD",
1845
- "context_window": 163840,
1846
  "capabilities": [
1847
- "tools",
1848
  "reasoning"
1849
  ],
1850
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus"
1851
- },
1852
- {
1853
- "name": "parasail/parasail-gemma3-27b-it",
1854
- "type": "chat",
1855
- "input_price_per_1m": 0.3,
1856
- "output_price_per_1m": 0.5,
1857
- "currency": "USD",
1858
- "context_window": 128000,
1859
- "size_b": 27
1860
  },
1861
  {
1862
- "name": "google/gemini-2.5-flash",
1863
  "type": "vision",
1864
  "input_price_per_1m": 0.3,
1865
- "output_price_per_1m": 2.5,
1866
  "currency": "USD",
1867
  "capabilities": [
1868
  "vision",
1869
  "reasoning"
1870
  ],
1871
- "context_window": 1048576
 
1872
  },
1873
  {
1874
- "name": "nebius/deepseek-ai/DeepSeek-V3.2",
1875
  "type": "chat",
1876
  "input_price_per_1m": 0.3,
1877
- "output_price_per_1m": 0.45,
1878
  "currency": "USD",
 
1879
  "capabilities": [
 
1880
  "reasoning"
1881
  ],
1882
- "context_window": 164000,
1883
- "hf_id": "deepseek-ai/DeepSeek-V3.2"
1884
  },
1885
  {
1886
- "name": "nebius/minimax/minimax-m2.1",
1887
- "type": "chat",
1888
  "input_price_per_1m": 0.3,
1889
  "output_price_per_1m": 1.2,
1890
  "currency": "USD",
1891
  "capabilities": [
 
1892
  "reasoning"
1893
  ],
1894
  "context_window": 200000,
1895
- "hf_id": "MiniMaxAI/MiniMax-M2.1"
 
1896
  },
1897
  {
1898
  "name": "minimaxi/MiniMax-M2.7",
@@ -1908,41 +1907,49 @@
1908
  "hf_id": "MiniMaxAI/MiniMax-M2.7"
1909
  },
1910
  {
1911
- "name": "minimaxi/MiniMax-M2",
1912
  "type": "chat",
1913
  "input_price_per_1m": 0.3,
1914
- "output_price_per_1m": 1.2,
1915
  "currency": "USD",
1916
- "context_window": 200000,
1917
  "capabilities": [
1918
- "tools",
1919
  "reasoning"
1920
  ],
1921
- "hf_id": "MiniMaxAI/MiniMax-M2"
1922
  },
1923
  {
1924
- "name": "minimaxi/MiniMax-M2.5",
 
 
 
 
 
 
 
 
 
1925
  "type": "vision",
1926
  "input_price_per_1m": 0.3,
1927
- "output_price_per_1m": 1.2,
1928
  "currency": "USD",
1929
  "capabilities": [
1930
  "vision",
1931
  "reasoning"
1932
  ],
1933
- "context_window": 200000,
1934
- "hf_id": "MiniMaxAI/MiniMax-M2.5"
1935
  },
1936
  {
1937
- "name": "alibaba/qwen3-coder-flash",
1938
- "type": "vision",
1939
  "input_price_per_1m": 0.3,
1940
- "output_price_per_1m": 1.5,
1941
  "currency": "USD",
 
1942
  "capabilities": [
1943
- "vision"
 
1944
  ],
1945
- "context_window": 1048576
1946
  },
1947
  {
1948
  "name": "deepinfra/meta-llama/Llama-3.2-90B-Vision-Instruct",
@@ -1980,51 +1987,47 @@
1980
  "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
1981
  },
1982
  {
1983
- "name": "novita/deepseek/deepseek-v3-0324",
1984
- "type": "chat",
1985
  "input_price_per_1m": 0.4,
1986
- "output_price_per_1m": 1.3,
1987
  "currency": "USD",
1988
- "context_window": 128000,
1989
  "capabilities": [
1990
- "tools",
1991
- "reasoning"
1992
  ],
1993
- "size_b": 685,
1994
- "hf_id": "deepseek-ai/DeepSeek-V3-0324"
1995
- },
1996
- {
1997
- "name": "novita/deepseek/deepseek-v3-turbo",
1998
- "type": "chat",
1999
- "input_price_per_1m": 0.4,
2000
- "output_price_per_1m": 1.3,
2001
- "currency": "USD",
2002
- "context_window": 128000
2003
  },
2004
  {
2005
- "name": "openai/gpt-4.1-mini",
2006
- "type": "vision",
2007
  "input_price_per_1m": 0.4,
2008
- "output_price_per_1m": 1.6,
2009
  "currency": "USD",
 
 
2010
  "capabilities": [
2011
- "vision"
2012
  ],
2013
- "context_window": 1047576
2014
  },
2015
  {
2016
- "name": "mistral/devstral-latest",
2017
  "type": "chat",
2018
  "input_price_per_1m": 0.4,
2019
  "output_price_per_1m": 2,
2020
  "currency": "USD",
2021
- "context_window": 256000
 
 
 
 
 
2022
  },
2023
  {
2024
- "name": "mistral/devstral-medium-2507",
2025
  "type": "chat",
2026
  "input_price_per_1m": 0.4,
2027
- "output_price_per_1m": 2,
2028
  "currency": "USD",
2029
  "context_window": 131072,
2030
  "capabilities": [
@@ -2040,28 +2043,23 @@
2040
  "context_window": 131072
2041
  },
2042
  {
2043
- "name": "openai-responses/gpt-4.1-mini",
2044
- "type": "vision",
2045
  "input_price_per_1m": 0.4,
2046
- "output_price_per_1m": 1.6,
2047
  "currency": "USD",
 
2048
  "capabilities": [
2049
- "vision"
2050
- ],
2051
- "context_window": 1047576
2052
  },
2053
  {
2054
- "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2055
  "type": "chat",
2056
  "input_price_per_1m": 0.4,
2057
- "output_price_per_1m": 1.6,
2058
  "currency": "USD",
2059
- "context_window": 262144,
2060
- "size_b": 480,
2061
- "capabilities": [
2062
- "tools"
2063
- ],
2064
- "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct"
2065
  },
2066
  {
2067
  "name": "azure/gpt-4.1-mini",
@@ -2086,75 +2084,91 @@
2086
  "context_window": 1047576
2087
  },
2088
  {
2089
- "name": "nebius/zai-org/GLM-4.7",
2090
  "type": "chat",
2091
  "input_price_per_1m": 0.4,
2092
- "output_price_per_1m": 2,
2093
  "currency": "USD",
 
2094
  "capabilities": [
 
2095
  "reasoning"
2096
  ],
2097
- "context_window": 200000,
2098
- "hf_id": "zai-org/GLM-4.7"
2099
  },
2100
  {
2101
- "name": "nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2102
  "type": "chat",
2103
  "input_price_per_1m": 0.4,
2104
- "output_price_per_1m": 1.8,
 
 
 
 
 
 
 
 
2105
  "currency": "USD",
2106
- "context_window": 262000,
2107
- "size_b": 480,
2108
  "capabilities": [
2109
- "tools"
2110
  ],
2111
- "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct"
2112
  },
2113
  {
2114
- "name": "alibaba/qwen-plus",
2115
  "type": "chat",
2116
  "input_price_per_1m": 0.4,
2117
- "output_price_per_1m": 1.2,
2118
  "currency": "USD",
2119
- "context_window": 131072,
 
2120
  "capabilities": [
2121
  "tools"
2122
- ]
 
2123
  },
2124
  {
2125
- "name": "vertex/gemini-3.1-flash-image-preview",
2126
- "type": "vision",
2127
  "input_price_per_1m": 0.5,
2128
- "output_price_per_1m": 2,
2129
  "currency": "USD",
 
2130
  "capabilities": [
2131
- "vision",
2132
  "reasoning"
2133
  ],
2134
- "context_window": 131072
 
2135
  },
2136
  {
2137
- "name": "vertex/gemini-3-flash-preview",
2138
- "type": "vision",
2139
  "input_price_per_1m": 0.5,
2140
- "output_price_per_1m": 3,
2141
  "currency": "USD",
 
2142
  "capabilities": [
2143
- "vision",
2144
- "reasoning"
2145
  ],
2146
- "context_window": 1048576
 
2147
  },
2148
  {
2149
- "name": "mistral/mistral-large-latest",
2150
- "type": "chat",
2151
  "input_price_per_1m": 0.5,
2152
- "output_price_per_1m": 1.5,
2153
  "currency": "USD",
2154
- "context_window": 131072,
2155
  "capabilities": [
2156
- "tools"
2157
- ]
 
 
 
 
2158
  },
2159
  {
2160
  "name": "google/gemini-3.1-flash-image-preview",
@@ -2181,44 +2195,39 @@
2181
  "context_window": 1048576
2182
  },
2183
  {
2184
- "name": "nebius/moonshotai/Kimi-K2-Instruct",
2185
  "type": "chat",
2186
  "input_price_per_1m": 0.5,
2187
- "output_price_per_1m": 2.4,
2188
  "currency": "USD",
2189
- "context_window": 131000,
2190
  "capabilities": [
2191
  "tools"
2192
- ],
2193
- "hf_id": "moonshotai/Kimi-K2-Instruct"
2194
  },
2195
  {
2196
- "name": "nebius/deepseek-ai/DeepSeek-V3-0324",
2197
- "type": "chat",
2198
  "input_price_per_1m": 0.5,
2199
- "output_price_per_1m": 1.5,
2200
  "currency": "USD",
2201
- "context_window": 128000,
2202
  "capabilities": [
2203
- "tools",
2204
  "reasoning"
2205
  ],
2206
- "size_b": 685,
2207
- "hf_id": "deepseek-ai/DeepSeek-V3-0324"
2208
  },
2209
  {
2210
- "name": "nebius/moonshotai/kimi-k2.5",
2211
  "type": "vision",
2212
  "input_price_per_1m": 0.5,
2213
- "output_price_per_1m": 2.5,
2214
  "currency": "USD",
2215
  "capabilities": [
2216
  "vision",
2217
  "reasoning"
2218
  ],
2219
- "context_window": 256000,
2220
- "hf_id": "moonshotai/Kimi-K2.5",
2221
- "size_b": 1058.6
2222
  },
2223
  {
2224
  "name": "novita/meta-llama/llama-3-70b-instruct",
@@ -2255,7 +2264,8 @@
2255
  "reasoning"
2256
  ],
2257
  "context_window": 163840,
2258
- "hf_id": "deepseek-ai/DeepSeek-V3.2"
 
2259
  },
2260
  {
2261
  "name": "novita/moonshotai/kimi-k2-instruct",
@@ -2267,36 +2277,37 @@
2267
  "capabilities": [
2268
  "tools"
2269
  ],
2270
- "hf_id": "moonshotai/Kimi-K2-Instruct"
 
2271
  },
2272
  {
2273
- "name": "novita/zai-org/glm-4.6",
2274
  "type": "chat",
2275
  "input_price_per_1m": 0.6,
2276
  "output_price_per_1m": 2.2,
2277
  "currency": "USD",
2278
- "context_window": 204800,
2279
  "capabilities": [
2280
- "tools",
2281
  "reasoning"
2282
  ],
2283
- "hf_id": "zai-org/GLM-4.6"
 
 
2284
  },
2285
  {
2286
- "name": "novita/zai-org/glm-4.5",
2287
  "type": "chat",
2288
  "input_price_per_1m": 0.6,
2289
  "output_price_per_1m": 2.2,
2290
  "currency": "USD",
2291
- "context_window": 131072,
2292
  "capabilities": [
2293
- "tools",
2294
  "reasoning"
2295
  ],
2296
- "hf_id": "zai-org/GLM-4.5"
 
 
2297
  },
2298
  {
2299
- "name": "zai/GLM-4.5",
2300
  "type": "chat",
2301
  "input_price_per_1m": 0.6,
2302
  "output_price_per_1m": 2.2,
@@ -2304,32 +2315,37 @@
2304
  "capabilities": [
2305
  "reasoning"
2306
  ],
2307
- "context_window": 131072,
2308
- "hf_id": "zai-org/GLM-4.5"
 
2309
  },
2310
  {
2311
- "name": "zai/GLM-4.6",
2312
  "type": "chat",
2313
  "input_price_per_1m": 0.6,
2314
  "output_price_per_1m": 2.2,
2315
  "currency": "USD",
 
2316
  "capabilities": [
 
2317
  "reasoning"
2318
  ],
2319
- "context_window": 200000,
2320
- "hf_id": "zai-org/GLM-4.6"
2321
  },
2322
  {
2323
- "name": "zai/GLM-4.7",
2324
- "type": "chat",
2325
  "input_price_per_1m": 0.6,
2326
- "output_price_per_1m": 2.2,
2327
  "currency": "USD",
2328
  "capabilities": [
 
2329
  "reasoning"
2330
  ],
2331
- "context_window": 200000,
2332
- "hf_id": "zai-org/GLM-4.7"
 
2333
  },
2334
  {
2335
  "name": "moonshot/kimi-k2-0711-preview",
@@ -2341,7 +2357,8 @@
2341
  "capabilities": [
2342
  "tools"
2343
  ],
2344
- "hf_id": "moonshotai/Kimi-K2-Instruct"
 
2345
  },
2346
  {
2347
  "name": "moonshot/kimi-k2.5",
@@ -2368,7 +2385,8 @@
2368
  "tools",
2369
  "reasoning"
2370
  ],
2371
- "hf_id": "moonshotai/Kimi-K2-Thinking"
 
2372
  },
2373
  {
2374
  "name": "moonshot/kimi-k2-0905-preview",
@@ -2380,7 +2398,8 @@
2380
  "capabilities": [
2381
  "tools"
2382
  ],
2383
- "hf_id": "moonshotai/Kimi-K2-Instruct-0905"
 
2384
  },
2385
  {
2386
  "name": "moonshot/kimi-k2-thinking",
@@ -2392,10 +2411,11 @@
2392
  "capabilities": [
2393
  "tools"
2394
  ],
2395
- "hf_id": "moonshotai/Kimi-K2-Instruct"
 
2396
  },
2397
  {
2398
- "name": "deepinfra/zai-org/GLM-4.5",
2399
  "type": "chat",
2400
  "input_price_per_1m": 0.6,
2401
  "output_price_per_1m": 2.2,
@@ -2405,23 +2425,25 @@
2405
  "tools",
2406
  "reasoning"
2407
  ],
2408
- "hf_id": "zai-org/GLM-4.5"
 
2409
  },
2410
  {
2411
- "name": "nebius/zai-org/GLM-4.5",
2412
  "type": "chat",
2413
  "input_price_per_1m": 0.6,
2414
  "output_price_per_1m": 2.2,
2415
  "currency": "USD",
2416
- "context_window": 128000,
2417
  "capabilities": [
2418
  "tools",
2419
  "reasoning"
2420
  ],
2421
- "hf_id": "zai-org/GLM-4.5"
 
2422
  },
2423
  {
2424
- "name": "minimaxi/MiniMax-M2.7-highspeed",
2425
  "type": "vision",
2426
  "input_price_per_1m": 0.6,
2427
  "output_price_per_1m": 2.4,
@@ -2431,10 +2453,11 @@
2431
  "reasoning"
2432
  ],
2433
  "context_window": 200000,
2434
- "hf_id": "MiniMaxAI/MiniMax-M2.7"
 
2435
  },
2436
  {
2437
- "name": "minimaxi/MiniMax-M2.5-highspeed",
2438
  "type": "vision",
2439
  "input_price_per_1m": 0.6,
2440
  "output_price_per_1m": 2.4,
@@ -2444,21 +2467,21 @@
2444
  "reasoning"
2445
  ],
2446
  "context_window": 200000,
2447
- "hf_id": "MiniMaxAI/MiniMax-M2.5"
2448
  },
2449
  {
2450
- "name": "alibaba/qwen3.5",
2451
- "type": "vision",
2452
  "input_price_per_1m": 0.6,
2453
- "output_price_per_1m": 3.6,
2454
  "currency": "USD",
 
2455
  "capabilities": [
2456
- "vision",
2457
  "reasoning"
2458
  ],
2459
- "context_window": 256000,
2460
- "size_b": 9,
2461
- "hf_id": "Qwen/Qwen3.5-9B"
2462
  },
2463
  {
2464
  "name": "novita/microsoft/wizardlm-2-8x22b",
@@ -2482,13 +2505,16 @@
2482
  "context_window": 400000
2483
  },
2484
  {
2485
- "name": "novita/deepseek/deepseek-prover-v2-671b",
2486
- "type": "chat",
2487
  "input_price_per_1m": 0.7,
2488
- "output_price_per_1m": 2.5,
2489
  "currency": "USD",
2490
- "context_window": 160000,
2491
- "size_b": 671
 
 
 
2492
  },
2493
  {
2494
  "name": "novita/deepseek/deepseek-r1-turbo",
@@ -2501,19 +2527,17 @@
2501
  "tools",
2502
  "reasoning"
2503
  ],
2504
- "hf_id": "deepseek-ai/DeepSeek-R1"
 
2505
  },
2506
  {
2507
- "name": "parasail/parasail-qwen25-vl-72b-instruct",
2508
- "type": "vision",
2509
  "input_price_per_1m": 0.7,
2510
- "output_price_per_1m": 0.7,
2511
  "currency": "USD",
2512
- "capabilities": [
2513
- "vision"
2514
- ],
2515
- "context_window": 32768,
2516
- "size_b": 72
2517
  },
2518
  {
2519
  "name": "openai/gpt-5.4-mini",
@@ -2537,7 +2561,21 @@
2537
  "vision",
2538
  "reasoning"
2539
  ],
2540
- "context_window": 400000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2541
  },
2542
  {
2543
  "name": "novita/deepseek/deepseek-r1-distill-llama-70b",
@@ -2575,17 +2613,17 @@
2575
  "size_b": 405
2576
  },
2577
  {
2578
- "name": "nebius/deepseek-ai/DeepSeek-R1-0528",
2579
  "type": "chat",
2580
- "input_price_per_1m": 0.8,
2581
- "output_price_per_1m": 2.4,
2582
  "currency": "USD",
2583
- "context_window": 164000,
2584
  "capabilities": [
2585
  "tools",
2586
  "reasoning"
2587
  ],
2588
- "hf_id": "deepseek-ai/DeepSeek-R1-0528"
2589
  },
2590
  {
2591
  "name": "deepinfra/deepseek-ai/DeepSeek-R1",
@@ -2598,20 +2636,8 @@
2598
  "tools",
2599
  "reasoning"
2600
  ],
2601
- "hf_id": "deepseek-ai/DeepSeek-R1"
2602
- },
2603
- {
2604
- "name": "deepinfra/deepseek-ai/DeepSeek-V3",
2605
- "type": "chat",
2606
- "input_price_per_1m": 0.85,
2607
- "output_price_per_1m": 0.9,
2608
- "currency": "USD",
2609
- "context_window": 128000,
2610
- "capabilities": [
2611
- "tools",
2612
- "reasoning"
2613
- ],
2614
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus"
2615
  },
2616
  {
2617
  "name": "alibaba/qwen3-max",
@@ -2625,26 +2651,26 @@
2625
  "context_window": 262144
2626
  },
2627
  {
2628
- "name": "together/meta-llama/Llama-3.3-70B-Instruct-Turbo",
2629
  "type": "chat",
2630
  "input_price_per_1m": 0.88,
2631
  "output_price_per_1m": 0.88,
2632
  "currency": "USD",
2633
  "context_window": 131072,
2634
- "size_b": 70,
2635
- "capabilities": [
2636
- "tools"
2637
- ],
2638
- "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
2639
  },
2640
  {
2641
- "name": "together/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
2642
  "type": "chat",
2643
  "input_price_per_1m": 0.88,
2644
  "output_price_per_1m": 0.88,
2645
  "currency": "USD",
2646
  "context_window": 131072,
2647
- "size_b": 70
 
 
 
 
2648
  },
2649
  {
2650
  "name": "novita/deepseek/deepseek_v3",
@@ -2668,41 +2694,47 @@
2668
  "context_window": 131072
2669
  },
2670
  {
2671
- "name": "perplexity/sonar",
2672
  "type": "vision",
2673
  "input_price_per_1m": 1,
2674
- "output_price_per_1m": 1,
2675
  "currency": "USD",
2676
- "context_window": 131072,
2677
  "capabilities": [
2678
- "vision"
2679
- ]
 
 
 
 
2680
  },
2681
  {
2682
- "name": "bedrock/claude-haiku-4-5",
2683
- "type": "vision",
2684
  "input_price_per_1m": 1,
2685
- "output_price_per_1m": 5,
2686
  "currency": "USD",
 
2687
  "capabilities": [
2688
- "vision"
2689
  ],
2690
- "context_window": 200000
 
2691
  },
2692
  {
2693
- "name": "novita/GLM-5",
2694
  "type": "chat",
2695
  "input_price_per_1m": 1,
2696
- "output_price_per_1m": 3.2,
2697
  "currency": "USD",
 
2698
  "capabilities": [
2699
- "reasoning"
2700
  ],
2701
- "context_window": 202800,
2702
- "hf_id": "zai-org/GLM-5"
2703
  },
2704
  {
2705
- "name": "vertex/claude-haiku-4-5",
2706
  "type": "vision",
2707
  "input_price_per_1m": 1,
2708
  "output_price_per_1m": 5,
@@ -2725,20 +2757,18 @@
2725
  "context_window": 200000
2726
  },
2727
  {
2728
- "name": "zai/GLM-5",
2729
  "type": "vision",
2730
  "input_price_per_1m": 1,
2731
- "output_price_per_1m": 3.2,
2732
  "currency": "USD",
2733
  "capabilities": [
2734
- "vision",
2735
- "reasoning"
2736
  ],
2737
- "context_window": 200000,
2738
- "hf_id": "zai-org/GLM-5"
2739
  },
2740
  {
2741
- "name": "anthropic/claude-haiku-4-5",
2742
  "type": "vision",
2743
  "input_price_per_1m": 1,
2744
  "output_price_per_1m": 5,
@@ -2749,39 +2779,39 @@
2749
  "context_window": 200000
2750
  },
2751
  {
2752
- "name": "alibaba/qwen3-coder-plus",
2753
  "type": "vision",
2754
  "input_price_per_1m": 1,
2755
- "output_price_per_1m": 5,
2756
  "currency": "USD",
 
2757
  "capabilities": [
2758
  "vision"
2759
- ],
2760
- "context_window": 1048576
2761
  },
2762
  {
2763
- "name": "groq/moonshotai/Kimi-K2-Instruct-0905",
2764
- "type": "chat",
2765
  "input_price_per_1m": 1,
2766
- "output_price_per_1m": 3,
2767
  "currency": "USD",
2768
- "context_window": 256000,
2769
  "capabilities": [
2770
- "tools"
2771
  ],
2772
- "hf_id": "moonshotai/Kimi-K2-Instruct"
2773
  },
2774
  {
2775
- "name": "groq/moonshotai/kimi-k2-instruct",
2776
  "type": "chat",
2777
  "input_price_per_1m": 1,
2778
- "output_price_per_1m": 3,
2779
  "currency": "USD",
2780
- "context_window": 131072,
2781
  "capabilities": [
2782
- "tools"
2783
  ],
2784
- "hf_id": "moonshotai/Kimi-K2-Instruct"
 
 
2785
  },
2786
  {
2787
  "name": "openai/o3-mini",
@@ -2795,7 +2825,7 @@
2795
  "context_window": 200000
2796
  },
2797
  {
2798
- "name": "openai-responses/o4-mini",
2799
  "type": "vision",
2800
  "input_price_per_1m": 1.1,
2801
  "output_price_per_1m": 4.4,
@@ -2817,7 +2847,7 @@
2817
  "context_window": 200000
2818
  },
2819
  {
2820
- "name": "azure/o4-mini",
2821
  "type": "vision",
2822
  "input_price_per_1m": 1.1,
2823
  "output_price_per_1m": 4.4,
@@ -2837,7 +2867,8 @@
2837
  "capabilities": [
2838
  "tools"
2839
  ],
2840
- "hf_id": "moonshotai/Kimi-K2-Instruct"
 
2841
  },
2842
  {
2843
  "name": "together/Qwen/Qwen2.5-72B-Instruct-Turbo",
@@ -2849,7 +2880,7 @@
2849
  "size_b": 72
2850
  },
2851
  {
2852
- "name": "vertex/gemini-2.5-pro",
2853
  "type": "vision",
2854
  "input_price_per_1m": 1.25,
2855
  "output_price_per_1m": 10,
@@ -2858,10 +2889,10 @@
2858
  "vision",
2859
  "reasoning"
2860
  ],
2861
- "context_window": 1048576
2862
  },
2863
  {
2864
- "name": "openai/gpt-5-chat",
2865
  "type": "vision",
2866
  "input_price_per_1m": 1.25,
2867
  "output_price_per_1m": 10,
@@ -2873,7 +2904,7 @@
2873
  "context_window": 128000
2874
  },
2875
  {
2876
- "name": "openai/gpt-5.1",
2877
  "type": "vision",
2878
  "input_price_per_1m": 1.25,
2879
  "output_price_per_1m": 10,
@@ -2882,10 +2913,10 @@
2882
  "vision",
2883
  "reasoning"
2884
  ],
2885
- "context_window": 400000
2886
  },
2887
  {
2888
- "name": "openai/gpt-5.1-chat",
2889
  "type": "vision",
2890
  "input_price_per_1m": 1.25,
2891
  "output_price_per_1m": 10,
@@ -2894,10 +2925,10 @@
2894
  "vision",
2895
  "reasoning"
2896
  ],
2897
- "context_window": 128000
2898
  },
2899
  {
2900
- "name": "coding/gemini-2.5-pro",
2901
  "type": "vision",
2902
  "input_price_per_1m": 1.25,
2903
  "output_price_per_1m": 10,
@@ -2909,40 +2940,39 @@
2909
  "context_window": 1048576
2910
  },
2911
  {
2912
- "name": "openai-responses/gpt-5",
2913
  "type": "vision",
2914
  "input_price_per_1m": 1.25,
2915
  "output_price_per_1m": 10,
2916
  "currency": "USD",
2917
  "capabilities": [
2918
- "vision",
2919
  "reasoning"
2920
  ],
2921
- "context_window": 400000
2922
  },
2923
  {
2924
- "name": "openai-responses/gpt-5.1",
2925
  "type": "vision",
2926
  "input_price_per_1m": 1.25,
2927
  "output_price_per_1m": 10,
2928
  "currency": "USD",
2929
  "capabilities": [
2930
- "vision",
2931
  "reasoning"
2932
  ],
2933
- "context_window": 400000
2934
  },
2935
  {
2936
- "name": "openai-responses/gpt-5.1-codex",
2937
- "type": "vision",
2938
  "input_price_per_1m": 1.25,
2939
- "output_price_per_1m": 10,
2940
  "currency": "USD",
 
2941
  "capabilities": [
2942
- "vision",
2943
  "reasoning"
2944
  ],
2945
- "context_window": 400000
2946
  },
2947
  {
2948
  "name": "openai-responses/gpt-5-codex",
@@ -2957,20 +2987,19 @@
2957
  "context_window": 400000
2958
  },
2959
  {
2960
- "name": "together/deepseek-ai/DeepSeek-V3",
2961
- "type": "chat",
2962
  "input_price_per_1m": 1.25,
2963
- "output_price_per_1m": 1.25,
2964
  "currency": "USD",
2965
- "context_window": 131072,
2966
  "capabilities": [
2967
- "tools",
2968
  "reasoning"
2969
  ],
2970
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus"
2971
  },
2972
  {
2973
- "name": "google/gemini-2.5-pro",
2974
  "type": "vision",
2975
  "input_price_per_1m": 1.25,
2976
  "output_price_per_1m": 10,
@@ -2979,29 +3008,31 @@
2979
  "vision",
2980
  "reasoning"
2981
  ],
2982
- "context_window": 1048576
2983
  },
2984
  {
2985
- "name": "azure/gpt-5",
2986
  "type": "vision",
2987
  "input_price_per_1m": 1.25,
2988
  "output_price_per_1m": 10,
2989
  "currency": "USD",
2990
  "capabilities": [
 
2991
  "reasoning"
2992
  ],
2993
- "context_window": 200000
2994
  },
2995
  {
2996
- "name": "azure/gpt-5.1",
2997
  "type": "vision",
2998
  "input_price_per_1m": 1.25,
2999
  "output_price_per_1m": 10,
3000
  "currency": "USD",
3001
  "capabilities": [
 
3002
  "reasoning"
3003
  ],
3004
- "context_window": 200000
3005
  },
3006
  {
3007
  "name": "novita/sao10k/l31-70b-euryale-v2.2",
@@ -3033,7 +3064,7 @@
3033
  ]
3034
  },
3035
  {
3036
- "name": "openai/gpt-5.3-chat",
3037
  "type": "vision",
3038
  "input_price_per_1m": 1.75,
3039
  "output_price_per_1m": 14,
@@ -3042,10 +3073,10 @@
3042
  "vision",
3043
  "reasoning"
3044
  ],
3045
- "context_window": 128000
3046
  },
3047
  {
3048
- "name": "openai/gpt-5.2",
3049
  "type": "vision",
3050
  "input_price_per_1m": 1.75,
3051
  "output_price_per_1m": 14,
@@ -3054,10 +3085,10 @@
3054
  "vision",
3055
  "reasoning"
3056
  ],
3057
- "context_window": 400000
3058
  },
3059
  {
3060
- "name": "openai/gpt-5.2-chat",
3061
  "type": "vision",
3062
  "input_price_per_1m": 1.75,
3063
  "output_price_per_1m": 14,
@@ -3069,19 +3100,18 @@
3069
  "context_window": 128000
3070
  },
3071
  {
3072
- "name": "openai-responses/gpt-5.2-codex",
3073
  "type": "vision",
3074
  "input_price_per_1m": 1.75,
3075
  "output_price_per_1m": 14,
3076
  "currency": "USD",
3077
  "capabilities": [
3078
- "vision",
3079
  "reasoning"
3080
  ],
3081
- "context_window": 400000
3082
  },
3083
  {
3084
- "name": "openai-responses/gpt-5.3-codex",
3085
  "type": "vision",
3086
  "input_price_per_1m": 1.75,
3087
  "output_price_per_1m": 14,
@@ -3093,7 +3123,7 @@
3093
  "context_window": 400000
3094
  },
3095
  {
3096
- "name": "openai-responses/gpt-5.3-chat",
3097
  "type": "vision",
3098
  "input_price_per_1m": 1.75,
3099
  "output_price_per_1m": 14,
@@ -3102,10 +3132,10 @@
3102
  "vision",
3103
  "reasoning"
3104
  ],
3105
- "context_window": 128000
3106
  },
3107
  {
3108
- "name": "openai-responses/gpt-5.2",
3109
  "type": "vision",
3110
  "input_price_per_1m": 1.75,
3111
  "output_price_per_1m": 14,
@@ -3117,7 +3147,7 @@
3117
  "context_window": 400000
3118
  },
3119
  {
3120
- "name": "azure/gpt-5.3-codex",
3121
  "type": "vision",
3122
  "input_price_per_1m": 1.75,
3123
  "output_price_per_1m": 14,
@@ -3126,10 +3156,10 @@
3126
  "vision",
3127
  "reasoning"
3128
  ],
3129
- "context_window": 400000
3130
  },
3131
  {
3132
- "name": "azure/openai-responses/gpt-5.2-codex",
3133
  "type": "vision",
3134
  "input_price_per_1m": 1.75,
3135
  "output_price_per_1m": 14,
@@ -3141,86 +3171,71 @@
3141
  "context_window": 400000
3142
  },
3143
  {
3144
- "name": "azure/gpt-5.2",
3145
  "type": "vision",
3146
  "input_price_per_1m": 1.75,
3147
  "output_price_per_1m": 14,
3148
  "currency": "USD",
3149
  "capabilities": [
 
3150
  "reasoning"
3151
  ],
3152
- "context_window": 200000
3153
  },
3154
  {
3155
- "name": "perplexity/sonar-reasoning-pro",
3156
  "type": "vision",
3157
  "input_price_per_1m": 2,
3158
  "output_price_per_1m": 8,
3159
  "currency": "USD",
3160
- "context_window": 131072,
3161
- "capabilities": [
3162
- "vision",
3163
- "reasoning"
3164
- ]
3165
- },
3166
- {
3167
- "name": "vertex/gemini-3.1-pro-preview",
3168
- "type": "vision",
3169
- "input_price_per_1m": 2,
3170
- "output_price_per_1m": 12,
3171
- "currency": "USD",
3172
  "capabilities": [
3173
  "vision",
3174
  "reasoning"
3175
  ],
3176
- "context_window": 1048576
3177
  },
3178
  {
3179
- "name": "vertex/gemini-3-pro-preview",
3180
  "type": "vision",
3181
  "input_price_per_1m": 2,
3182
- "output_price_per_1m": 12,
3183
  "currency": "USD",
3184
  "capabilities": [
3185
- "vision",
3186
- "reasoning"
3187
  ],
3188
- "context_window": 1048576
3189
  },
3190
  {
3191
- "name": "vertex/gemini-3-pro-image-preview",
3192
- "type": "vision",
3193
  "input_price_per_1m": 2,
3194
- "output_price_per_1m": 12,
3195
  "currency": "USD",
3196
- "capabilities": [
3197
- "vision",
3198
- "reasoning"
3199
- ],
3200
- "context_window": 1048576
3201
  },
3202
  {
3203
- "name": "openai/gpt-4.1",
3204
  "type": "vision",
3205
  "input_price_per_1m": 2,
3206
- "output_price_per_1m": 8,
3207
  "currency": "USD",
3208
  "capabilities": [
3209
- "vision"
 
3210
  ],
3211
- "context_window": 1047576
3212
  },
3213
  {
3214
- "name": "openai/o4-mini-deep-research",
3215
  "type": "vision",
3216
  "input_price_per_1m": 2,
3217
- "output_price_per_1m": 8,
3218
  "currency": "USD",
3219
  "capabilities": [
3220
  "vision",
3221
  "reasoning"
3222
  ],
3223
- "context_window": 100000
3224
  },
3225
  {
3226
  "name": "mistral/pixtral-large-latest",
@@ -3231,38 +3246,31 @@
3231
  "context_window": 131072
3232
  },
3233
  {
3234
- "name": "openai-responses/gpt-4.1",
3235
  "type": "vision",
3236
  "input_price_per_1m": 2,
3237
  "output_price_per_1m": 8,
3238
  "currency": "USD",
 
3239
  "capabilities": [
3240
- "vision"
3241
- ],
3242
- "context_window": 1047576
3243
- },
3244
- {
3245
- "name": "xai/grok-2-1212",
3246
- "type": "chat",
3247
- "input_price_per_1m": 2,
3248
- "output_price_per_1m": 10,
3249
- "currency": "USD",
3250
- "context_window": 131072
3251
  },
3252
  {
3253
- "name": "xai/grok-4.2-beta",
3254
  "type": "vision",
3255
  "input_price_per_1m": 2,
3256
- "output_price_per_1m": 6,
3257
  "currency": "USD",
3258
  "capabilities": [
3259
  "vision",
3260
  "reasoning"
3261
  ],
3262
- "context_window": 2000000
3263
  },
3264
  {
3265
- "name": "google/gemini-3-pro-preview",
3266
  "type": "vision",
3267
  "input_price_per_1m": 2,
3268
  "output_price_per_1m": 12,
@@ -3274,7 +3282,7 @@
3274
  "context_window": 1048576
3275
  },
3276
  {
3277
- "name": "google/gemini-3.1-pro-preview",
3278
  "type": "vision",
3279
  "input_price_per_1m": 2,
3280
  "output_price_per_1m": 12,
@@ -3308,26 +3316,38 @@
3308
  "context_window": 1047576
3309
  },
3310
  {
3311
- "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3312
  "type": "chat",
3313
  "input_price_per_1m": 2,
 
 
 
 
 
 
 
 
3314
  "output_price_per_1m": 6,
3315
  "currency": "USD",
3316
- "context_window": 128000
 
 
 
 
3317
  },
3318
  {
3319
- "name": "openai/gpt-4o-2024-11-20",
3320
  "type": "vision",
3321
- "input_price_per_1m": 2.5,
3322
- "output_price_per_1m": 10,
3323
  "currency": "USD",
3324
  "capabilities": [
3325
  "vision"
3326
  ],
3327
- "context_window": 128000
3328
  },
3329
  {
3330
- "name": "openai/gpt-4o-2024-08-06",
3331
  "type": "vision",
3332
  "input_price_per_1m": 2.5,
3333
  "output_price_per_1m": 10,
@@ -3338,7 +3358,7 @@
3338
  "context_window": 128000
3339
  },
3340
  {
3341
- "name": "openai/gpt-4o-2024-05-13",
3342
  "type": "vision",
3343
  "input_price_per_1m": 2.5,
3344
  "output_price_per_1m": 10,
@@ -3349,19 +3369,18 @@
3349
  "context_window": 128000
3350
  },
3351
  {
3352
- "name": "openai/gpt-5.4",
3353
  "type": "vision",
3354
  "input_price_per_1m": 2.5,
3355
- "output_price_per_1m": 15,
3356
  "currency": "USD",
3357
  "capabilities": [
3358
- "vision",
3359
- "reasoning"
3360
  ],
3361
- "context_window": 1050000
3362
  },
3363
  {
3364
- "name": "openai/gpt-4o",
3365
  "type": "vision",
3366
  "input_price_per_1m": 2.5,
3367
  "output_price_per_1m": 10,
@@ -3372,7 +3391,7 @@
3372
  "context_window": 128000
3373
  },
3374
  {
3375
- "name": "openai-responses/gpt-5.4",
3376
  "type": "vision",
3377
  "input_price_per_1m": 2.5,
3378
  "output_price_per_1m": 15,
@@ -3396,18 +3415,19 @@
3396
  "context_window": 1050000
3397
  },
3398
  {
3399
- "name": "perplexity/sonar-pro",
3400
  "type": "vision",
3401
- "input_price_per_1m": 3,
3402
  "output_price_per_1m": 15,
3403
  "currency": "USD",
3404
- "context_window": 204800,
3405
  "capabilities": [
3406
- "vision"
3407
- ]
 
 
3408
  },
3409
  {
3410
- "name": "bedrock/claude-sonnet-4-5",
3411
  "type": "vision",
3412
  "input_price_per_1m": 3,
3413
  "output_price_per_1m": 15,
@@ -3416,10 +3436,10 @@
3416
  "vision",
3417
  "reasoning"
3418
  ],
3419
- "context_window": 200000
3420
  },
3421
  {
3422
- "name": "bedrock/claude-sonnet-4-6",
3423
  "type": "vision",
3424
  "input_price_per_1m": 3,
3425
  "output_price_per_1m": 15,
@@ -3431,7 +3451,7 @@
3431
  "context_window": 1000000
3432
  },
3433
  {
3434
- "name": "bedrock/claude-sonnet-4",
3435
  "type": "vision",
3436
  "input_price_per_1m": 3,
3437
  "output_price_per_1m": 15,
@@ -3440,10 +3460,10 @@
3440
  "vision",
3441
  "reasoning"
3442
  ],
3443
- "context_window": 200000
3444
  },
3445
  {
3446
- "name": "bedrock/claude-3-7-sonnet",
3447
  "type": "vision",
3448
  "input_price_per_1m": 3,
3449
  "output_price_per_1m": 15,
@@ -3452,10 +3472,10 @@
3452
  "vision",
3453
  "reasoning"
3454
  ],
3455
- "context_window": 200000
3456
  },
3457
  {
3458
- "name": "vertex/claude-sonnet-4-5",
3459
  "type": "vision",
3460
  "input_price_per_1m": 3,
3461
  "output_price_per_1m": 15,
@@ -3467,7 +3487,7 @@
3467
  "context_window": 200000
3468
  },
3469
  {
3470
- "name": "vertex/claude-sonnet-4",
3471
  "type": "vision",
3472
  "input_price_per_1m": 3,
3473
  "output_price_per_1m": 15,
@@ -3479,7 +3499,7 @@
3479
  "context_window": 200000
3480
  },
3481
  {
3482
- "name": "vertex/claude-3-7-sonnet",
3483
  "type": "vision",
3484
  "input_price_per_1m": 3,
3485
  "output_price_per_1m": 15,
@@ -3491,30 +3511,29 @@
3491
  "context_window": 200000
3492
  },
3493
  {
3494
- "name": "vertex/claude-3-5-sonnet",
3495
  "type": "vision",
3496
  "input_price_per_1m": 3,
3497
  "output_price_per_1m": 15,
3498
  "currency": "USD",
 
3499
  "capabilities": [
3500
  "vision"
3501
- ],
3502
- "context_window": 200000
3503
  },
3504
  {
3505
- "name": "coding/claude-sonnet-4-20250514",
3506
  "type": "vision",
3507
  "input_price_per_1m": 3,
3508
  "output_price_per_1m": 15,
3509
  "currency": "USD",
3510
  "capabilities": [
3511
- "vision",
3512
- "reasoning"
3513
  ],
3514
  "context_window": 200000
3515
  },
3516
  {
3517
- "name": "anthropic/claude-sonnet-4-5",
3518
  "type": "vision",
3519
  "input_price_per_1m": 3,
3520
  "output_price_per_1m": 15,
@@ -3523,10 +3542,10 @@
3523
  "vision",
3524
  "reasoning"
3525
  ],
3526
- "context_window": 1000000
3527
  },
3528
  {
3529
- "name": "anthropic/claude-sonnet-4-6",
3530
  "type": "vision",
3531
  "input_price_per_1m": 3,
3532
  "output_price_per_1m": 15,
@@ -3535,10 +3554,10 @@
3535
  "vision",
3536
  "reasoning"
3537
  ],
3538
- "context_window": 1000000
3539
  },
3540
  {
3541
- "name": "anthropic/claude-sonnet-4",
3542
  "type": "vision",
3543
  "input_price_per_1m": 3,
3544
  "output_price_per_1m": 15,
@@ -3547,7 +3566,7 @@
3547
  "vision",
3548
  "reasoning"
3549
  ],
3550
- "context_window": 1000000
3551
  },
3552
  {
3553
  "name": "xai/grok-4",
@@ -3571,7 +3590,20 @@
3571
  "tools",
3572
  "reasoning"
3573
  ],
3574
- "hf_id": "deepseek-ai/DeepSeek-R1"
 
 
 
 
 
 
 
 
 
 
 
 
 
3575
  },
3576
  {
3577
  "name": "novita/deepseek/deepseek-r1",
@@ -3584,10 +3616,11 @@
3584
  "tools",
3585
  "reasoning"
3586
  ],
3587
- "hf_id": "deepseek-ai/DeepSeek-R1"
 
3588
  },
3589
  {
3590
- "name": "bedrock/claude-opus-4-5",
3591
  "type": "vision",
3592
  "input_price_per_1m": 5,
3593
  "output_price_per_1m": 25,
@@ -3599,7 +3632,7 @@
3599
  "context_window": 200000
3600
  },
3601
  {
3602
- "name": "bedrock/claude-opus-4-6",
3603
  "type": "vision",
3604
  "input_price_per_1m": 5,
3605
  "output_price_per_1m": 25,
@@ -3611,19 +3644,18 @@
3611
  "context_window": 1000000
3612
  },
3613
  {
3614
- "name": "vertex/claude-opus-4-6",
3615
  "type": "vision",
3616
  "input_price_per_1m": 5,
3617
- "output_price_per_1m": 25,
3618
  "currency": "USD",
3619
  "capabilities": [
3620
- "vision",
3621
- "reasoning"
3622
  ],
3623
- "context_window": 1000000
3624
  },
3625
  {
3626
- "name": "vertex/claude-opus-4-5",
3627
  "type": "vision",
3628
  "input_price_per_1m": 5,
3629
  "output_price_per_1m": 25,
@@ -3635,18 +3667,19 @@
3635
  "context_window": 200000
3636
  },
3637
  {
3638
- "name": "openai/chatgpt-4o",
3639
  "type": "vision",
3640
  "input_price_per_1m": 5,
3641
- "output_price_per_1m": 15,
3642
  "currency": "USD",
3643
  "capabilities": [
3644
- "vision"
 
3645
  ],
3646
- "context_window": 128000
3647
  },
3648
  {
3649
- "name": "anthropic/claude-opus-4-6",
3650
  "type": "vision",
3651
  "input_price_per_1m": 5,
3652
  "output_price_per_1m": 25,
@@ -3658,7 +3691,7 @@
3658
  "context_window": 1000000
3659
  },
3660
  {
3661
- "name": "anthropic/claude-opus-4-5",
3662
  "type": "vision",
3663
  "input_price_per_1m": 5,
3664
  "output_price_per_1m": 25,
@@ -3693,7 +3726,7 @@
3693
  "context_window": 100000
3694
  },
3695
  {
3696
- "name": "bedrock/claude-opus-4",
3697
  "type": "vision",
3698
  "input_price_per_1m": 15,
3699
  "output_price_per_1m": 75,
@@ -3705,7 +3738,7 @@
3705
  "context_window": 200000
3706
  },
3707
  {
3708
- "name": "vertex/claude-opus-4",
3709
  "type": "vision",
3710
  "input_price_per_1m": 15,
3711
  "output_price_per_1m": 75,
@@ -3717,10 +3750,10 @@
3717
  "context_window": 200000
3718
  },
3719
  {
3720
- "name": "vertex/claude-opus-4-1",
3721
  "type": "vision",
3722
  "input_price_per_1m": 15,
3723
- "output_price_per_1m": 75,
3724
  "currency": "USD",
3725
  "capabilities": [
3726
  "vision",
@@ -3729,10 +3762,10 @@
3729
  "context_window": 200000
3730
  },
3731
  {
3732
- "name": "openai/o1",
3733
  "type": "vision",
3734
  "input_price_per_1m": 15,
3735
- "output_price_per_1m": 60,
3736
  "currency": "USD",
3737
  "capabilities": [
3738
  "vision",
@@ -3741,7 +3774,7 @@
3741
  "context_window": 200000
3742
  },
3743
  {
3744
- "name": "coding/claude-opus-4-20250514",
3745
  "type": "vision",
3746
  "input_price_per_1m": 15,
3747
  "output_price_per_1m": 75,
@@ -3753,7 +3786,7 @@
3753
  "context_window": 200000
3754
  },
3755
  {
3756
- "name": "anthropic/claude-opus-4-1",
3757
  "type": "vision",
3758
  "input_price_per_1m": 15,
3759
  "output_price_per_1m": 75,
@@ -3765,28 +3798,28 @@
3765
  "context_window": 200000
3766
  },
3767
  {
3768
- "name": "anthropic/claude-opus-4",
3769
  "type": "vision",
3770
  "input_price_per_1m": 15,
3771
- "output_price_per_1m": 75,
3772
  "currency": "USD",
3773
  "capabilities": [
3774
  "vision",
3775
  "reasoning"
3776
  ],
3777
- "context_window": 200000
3778
  },
3779
  {
3780
- "name": "openai-responses/gpt-5-pro",
3781
  "type": "vision",
3782
  "input_price_per_1m": 15,
3783
- "output_price_per_1m": 120,
3784
  "currency": "USD",
3785
  "capabilities": [
3786
  "vision",
3787
  "reasoning"
3788
  ],
3789
- "context_window": 400000
3790
  },
3791
  {
3792
  "name": "openai-responses/o3-pro",
@@ -3813,7 +3846,7 @@
3813
  "context_window": 1050000
3814
  },
3815
  {
3816
- "name": "openai-responses/gpt-5.4-pro",
3817
  "type": "vision",
3818
  "input_price_per_1m": 30,
3819
  "output_price_per_1m": 180,
@@ -3825,7 +3858,7 @@
3825
  "context_window": 1050000
3826
  },
3827
  {
3828
- "name": "azure/openai-responses/gpt-5.4-pro",
3829
  "type": "vision",
3830
  "input_price_per_1m": 30,
3831
  "output_price_per_1m": 180,
@@ -3897,7 +3930,8 @@
3897
  "capabilities": [
3898
  "tools"
3899
  ],
3900
- "hf_id": "moonshotai/Kimi-K2-Instruct"
 
3901
  },
3902
  {
3903
  "name": "Qwen3-Coder-480B-A35B-Instruct (base)",
@@ -4093,7 +4127,8 @@
4093
  "tools",
4094
  "reasoning"
4095
  ],
4096
- "hf_id": "zai-org/GLM-4.5"
 
4097
  },
4098
  {
4099
  "name": "GLM-4.5-Air (base)",
@@ -4120,7 +4155,8 @@
4120
  "tools",
4121
  "reasoning"
4122
  ],
4123
- "hf_id": "deepseek-ai/DeepSeek-R1-0528"
 
4124
  },
4125
  {
4126
  "name": "DeepSeek-R1-0528 (base)",
@@ -4133,7 +4169,8 @@
4133
  "tools",
4134
  "reasoning"
4135
  ],
4136
- "hf_id": "deepseek-ai/DeepSeek-R1-0528"
 
4137
  },
4138
  {
4139
  "name": "DeepSeek-V3-0324 (fast)",
@@ -4492,7 +4529,8 @@
4492
  "type": "audio",
4493
  "input_price_per_1m": 0.003,
4494
  "output_price_per_1m": 0,
4495
- "currency": "EUR"
 
4496
  },
4497
  {
4498
  "name": "holo2-30b-a3b",
@@ -4950,7 +4988,8 @@
4950
  "input_price_per_1m": 0.017,
4951
  "output_price_per_1m": 0.11,
4952
  "currency": "USD",
4953
- "hf_id": "ibm-granite/granite-4.0-h-micro"
 
4954
  },
4955
  {
4956
  "name": "google/gemma-3n-e4b-it",
@@ -5277,7 +5316,8 @@
5277
  "capabilities": [
5278
  "tools",
5279
  "reasoning"
5280
- ]
 
5281
  },
5282
  {
5283
  "name": "qwen/qwen3-14b",
@@ -5527,7 +5567,8 @@
5527
  "capabilities": [
5528
  "tools",
5529
  "reasoning"
5530
- ]
 
5531
  },
5532
  {
5533
  "name": "alibaba/tongyi-deepresearch-30b-a3b",
@@ -5617,7 +5658,8 @@
5617
  "capabilities": [
5618
  "tools",
5619
  "reasoning"
5620
- ]
 
5621
  },
5622
  {
5623
  "name": "mistralai/mistral-small-creative",
@@ -5841,7 +5883,8 @@
5841
  "hf_id": "Qwen/Qwen3-Coder-Next",
5842
  "capabilities": [
5843
  "tools"
5844
- ]
 
5845
  },
5846
  {
5847
  "name": "allenai/olmo-3-7b-think",
@@ -6229,7 +6272,8 @@
6229
  "capabilities": [
6230
  "tools",
6231
  "reasoning"
6232
- ]
 
6233
  },
6234
  {
6235
  "name": "allenai/molmo-2-8b",
@@ -6342,7 +6386,8 @@
6342
  "hf_id": "meituan-longcat/LongCat-Flash-Chat",
6343
  "capabilities": [
6344
  "tools"
6345
- ]
 
6346
  },
6347
  {
6348
  "name": "x-ai/grok-code-fast-1",
@@ -6584,7 +6629,8 @@
6584
  "tools",
6585
  "reasoning",
6586
  "eu-endpoint"
6587
- ]
 
6588
  },
6589
  {
6590
  "name": "qwen/qwen3.5-122b-a10b",
@@ -6625,7 +6671,8 @@
6625
  "tools",
6626
  "reasoning",
6627
  "eu-endpoint"
6628
- ]
 
6629
  },
6630
  {
6631
  "name": "qwen/qwen3-vl-235b-a22b-thinking",
@@ -6682,7 +6729,8 @@
6682
  "capabilities": [
6683
  "tools",
6684
  "reasoning"
6685
- ]
 
6686
  },
6687
  {
6688
  "name": "nex-agi/deepseek-v3.1-nex-n1",
@@ -6693,7 +6741,8 @@
6693
  "hf_id": "nex-agi/DeepSeek-V3.1-Nex-N1",
6694
  "capabilities": [
6695
  "tools"
6696
- ]
 
6697
  },
6698
  {
6699
  "name": "deepseek/deepseek-v3.2-exp",
@@ -6891,7 +6940,8 @@
6891
  "tools",
6892
  "reasoning",
6893
  "eu-endpoint"
6894
- ]
 
6895
  },
6896
  {
6897
  "name": "z-ai/glm-4.6",
@@ -6903,7 +6953,8 @@
6903
  "capabilities": [
6904
  "tools",
6905
  "reasoning"
6906
- ]
 
6907
  },
6908
  {
6909
  "name": "xiaomi/mimo-v2-omni",
@@ -6951,7 +7002,8 @@
6951
  "hf_id": "moonshotai/Kimi-K2-Instruct-0905",
6952
  "capabilities": [
6953
  "tools"
6954
- ]
 
6955
  },
6956
  {
6957
  "name": "mistralai/mistral-medium-3.1",
@@ -7070,7 +7122,8 @@
7070
  "capabilities": [
7071
  "tools",
7072
  "reasoning"
7073
- ]
 
7074
  },
7075
  {
7076
  "name": "undi95/remm-slerp-l2-13b",
@@ -7105,7 +7158,8 @@
7105
  "tools",
7106
  "reasoning",
7107
  "eu-endpoint"
7108
- ]
 
7109
  },
7110
  {
7111
  "name": "google/gemini-3.1-flash-image-preview",
@@ -7261,7 +7315,8 @@
7261
  "capabilities": [
7262
  "tools",
7263
  "reasoning"
7264
- ]
 
7265
  },
7266
  {
7267
  "name": "nvidia/llama-3.1-nemotron-ultra-253b-v1",
@@ -7355,7 +7410,8 @@
7355
  "tools",
7356
  "reasoning",
7357
  "eu-endpoint"
7358
- ]
 
7359
  },
7360
  {
7361
  "name": "z-ai/glm-5",
@@ -7367,7 +7423,8 @@
7367
  "capabilities": [
7368
  "tools",
7369
  "reasoning"
7370
- ]
 
7371
  },
7372
  {
7373
  "name": "openai/gpt-5.4-mini",
@@ -8733,7 +8790,8 @@
8733
  "capabilities": [
8734
  "tools",
8735
  "reasoning"
8736
- ]
 
8737
  },
8738
  {
8739
  "name": "arcee-ai/trinity-large-preview:free",
@@ -9034,7 +9092,8 @@
9034
  "capabilities": [
9035
  "tools"
9036
  ],
9037
- "hf_id": "moonshotai/Kimi-K2-Instruct-0905"
 
9038
  },
9039
  {
9040
  "name": "Llama 4 Scout (17Bx16E) 128k",
 
133
  "type": "embedding",
134
  "input_price_per_1m": 0.02,
135
  "output_price_per_1m": 0,
136
+ "currency": "USD",
137
+ "hf_id": "BAAI/bge-m3",
138
+ "size_b": 0.57
139
  }
140
  ],
141
  "lastUpdated": "2026-03-02T04:54:46.028Z"
 
1038
  "hf_id": "meta-llama/Meta-Llama-3-8B-Instruct"
1039
  },
1040
  {
1041
+ "name": "alibaba/qwen-turbo",
1042
  "type": "chat",
1043
  "input_price_per_1m": 0.05,
1044
+ "output_price_per_1m": 0.2,
1045
  "currency": "USD",
1046
+ "context_window": 1000000,
1047
+ "capabilities": [
1048
+ "tools"
1049
+ ]
1050
+ },
1051
+ {
1052
+ "name": "azure/gpt-5-nano",
1053
+ "type": "vision",
1054
+ "input_price_per_1m": 0.05,
1055
+ "output_price_per_1m": 0.4,
1056
+ "currency": "USD",
1057
+ "capabilities": [
1058
+ "reasoning"
1059
+ ],
1060
+ "context_window": 200000
1061
  },
1062
  {
1063
  "name": "novita/meta-llama/llama-3.1-8b-instruct",
 
1082
  "size_b": 8
1083
  },
1084
  {
1085
+ "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
1086
+ "type": "chat",
1087
  "input_price_per_1m": 0.05,
1088
+ "output_price_per_1m": 0.05,
1089
  "currency": "USD",
1090
+ "context_window": 8192,
1091
+ "size_b": 8
 
 
 
1092
  },
1093
  {
1094
+ "name": "openai-responses/gpt-5-nano",
1095
  "type": "vision",
1096
  "input_price_per_1m": 0.05,
1097
  "output_price_per_1m": 0.4,
1098
  "currency": "USD",
1099
  "capabilities": [
1100
+ "vision",
1101
  "reasoning"
1102
  ],
1103
+ "context_window": 400000
 
 
 
 
 
 
 
 
 
 
 
1104
  },
1105
  {
1106
  "name": "together/meta-llama/Llama-3.2-3B-Instruct-Turbo",
 
1112
  "size_b": 3
1113
  },
1114
  {
1115
+ "name": "deepinfra/Qwen/Qwen2.5-Coder-32B-Instruct",
1116
  "type": "chat",
1117
  "input_price_per_1m": 0.07,
1118
+ "output_price_per_1m": 0.16,
1119
  "currency": "USD",
1120
+ "context_window": 16384,
1121
+ "size_b": 32
1122
  },
1123
  {
1124
+ "name": "deepinfra/microsoft/phi-4",
1125
  "type": "chat",
1126
  "input_price_per_1m": 0.07,
1127
+ "output_price_per_1m": 0.14,
1128
  "currency": "USD",
1129
+ "context_window": 16384
 
1130
  },
1131
  {
1132
  "name": "novita/gryphe/mythomax-l2-13b",
 
1138
  "size_b": 13
1139
  },
1140
  {
1141
+ "name": "groq/openai/gpt-oss-20b",
1142
+ "type": "chat",
1143
  "input_price_per_1m": 0.1,
1144
+ "output_price_per_1m": 0.5,
1145
  "currency": "USD",
1146
+ "context_window": 131072,
1147
+ "size_b": 20,
1148
  "capabilities": [
1149
+ "tools",
1150
  "reasoning"
1151
  ],
1152
+ "hf_id": "openai/gpt-oss-20b"
1153
  },
1154
  {
1155
  "name": "openai/gpt-4.1-nano",
 
1163
  "context_window": 1047576
1164
  },
1165
  {
1166
+ "name": "google/gemini-2.0-flash-001",
1167
+ "type": "vision",
1168
  "input_price_per_1m": 0.1,
1169
+ "output_price_per_1m": 0.4,
1170
  "currency": "USD",
 
1171
  "capabilities": [
1172
+ "vision"
1173
  ],
1174
+ "context_window": 1048576
1175
  },
1176
  {
1177
+ "name": "google/gemini-2.5-flash-lite",
1178
+ "type": "vision",
1179
  "input_price_per_1m": 0.1,
1180
+ "output_price_per_1m": 0.4,
1181
  "currency": "USD",
1182
+ "capabilities": [
1183
+ "vision",
1184
+ "reasoning"
1185
+ ],
1186
+ "context_window": 1048576
1187
  },
1188
  {
1189
+ "name": "mistral/devstral-small-latest",
1190
  "type": "chat",
1191
  "input_price_per_1m": 0.1,
1192
  "output_price_per_1m": 0.3,
 
1198
  "hf_id": "mistralai/Devstral-Small-2507"
1199
  },
1200
  {
1201
+ "name": "mistral/mistral-small-2503",
 
 
 
 
 
 
 
 
 
 
 
1202
  "type": "chat",
1203
  "input_price_per_1m": 0.1,
1204
+ "output_price_per_1m": 0.3,
1205
  "currency": "USD",
1206
+ "context_window": 32768
 
1207
  },
1208
  {
1209
+ "name": "mistral/devstral-small-2507",
1210
  "type": "chat",
1211
  "input_price_per_1m": 0.1,
1212
  "output_price_per_1m": 0.3,
1213
  "currency": "USD",
1214
+ "context_window": 131072,
 
1215
  "capabilities": [
1216
+ "tools"
 
1217
  ],
1218
+ "hf_id": "mistralai/Devstral-Small-2507"
1219
  },
1220
  {
1221
+ "name": "vertex/gemini-2.5-flash-lite",
1222
  "type": "vision",
1223
  "input_price_per_1m": 0.1,
1224
  "output_price_per_1m": 0.4,
 
1230
  "context_window": 1048576
1231
  },
1232
  {
1233
+ "name": "azure/openai-responses/gpt-4.1-nano",
1234
  "type": "vision",
1235
  "input_price_per_1m": 0.1,
1236
  "output_price_per_1m": 0.4,
 
1238
  "capabilities": [
1239
  "vision"
1240
  ],
1241
+ "context_window": 1047576
1242
  },
1243
  {
1244
+ "name": "azure/gpt-4.1-nano",
1245
  "type": "vision",
1246
  "input_price_per_1m": 0.1,
1247
  "output_price_per_1m": 0.4,
 
1252
  "context_window": 1047576
1253
  },
1254
  {
1255
+ "name": "together/meta-llama/Meta-Llama-3-8B-Instruct-Lite",
1256
+ "type": "chat",
1257
+ "input_price_per_1m": 0.1,
1258
+ "output_price_per_1m": 0.1,
1259
+ "currency": "USD",
1260
+ "context_window": 8192,
1261
+ "size_b": 8
1262
+ },
1263
+ {
1264
+ "name": "openai-responses/gpt-4.1-nano",
1265
  "type": "vision",
1266
  "input_price_per_1m": 0.1,
1267
  "output_price_per_1m": 0.4,
 
1272
  "context_window": 1047576
1273
  },
1274
  {
1275
+ "name": "deepinfra/Qwen/Qwen3-32B",
1276
  "type": "chat",
1277
  "input_price_per_1m": 0.1,
1278
+ "output_price_per_1m": 0.3,
1279
  "currency": "USD",
1280
+ "context_window": 40000,
1281
+ "size_b": 32,
1282
  "capabilities": [
1283
  "tools",
1284
  "reasoning"
1285
  ],
1286
+ "hf_id": "Qwen/Qwen3-32B"
1287
  },
1288
  {
1289
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo",
 
1333
  "size_b": 8
1334
  },
1335
  {
1336
+ "name": "groq/openai/gpt-oss-120b",
1337
  "type": "chat",
1338
  "input_price_per_1m": 0.15,
1339
+ "output_price_per_1m": 0.75,
1340
  "currency": "USD",
1341
+ "context_window": 131072,
1342
+ "size_b": 120,
1343
  "capabilities": [
1344
  "tools",
1345
  "reasoning"
1346
  ],
1347
+ "hf_id": "openai/gpt-oss-120b"
1348
  },
1349
  {
1350
  "name": "openai/gpt-4o-mini",
 
1358
  "context_window": 128000
1359
  },
1360
  {
1361
+ "name": "nebius/openai/gpt-oss-120b",
1362
+ "type": "chat",
1363
  "input_price_per_1m": 0.15,
1364
  "output_price_per_1m": 0.6,
1365
  "currency": "USD",
1366
  "capabilities": [
 
1367
  "reasoning"
1368
  ],
1369
+ "context_window": 131000,
1370
+ "size_b": 120,
1371
+ "hf_id": "openai/gpt-oss-120b"
1372
+ },
1373
+ {
1374
+ "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1375
+ "type": "chat",
1376
+ "input_price_per_1m": 0.15,
1377
+ "output_price_per_1m": 0.85,
1378
+ "currency": "USD",
1379
+ "context_window": 262144,
1380
+ "size_b": 235
1381
  },
1382
  {
1383
  "name": "mistral/mistral-small-2603",
 
1394
  "hf_id": "mistralai/Mistral-Small-4-119B-2603"
1395
  },
1396
  {
1397
+ "name": "mistral/mistral-small-latest",
1398
+ "type": "vision",
 
 
 
 
 
 
 
 
 
1399
  "input_price_per_1m": 0.15,
1400
  "output_price_per_1m": 0.6,
1401
  "currency": "USD",
1402
  "capabilities": [
1403
+ "vision",
1404
  "reasoning"
1405
  ],
1406
+ "context_window": 256000
 
 
1407
  },
1408
  {
1409
+ "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
1410
  "type": "chat",
1411
  "input_price_per_1m": 0.15,
1412
+ "output_price_per_1m": 0.15,
1413
  "currency": "USD",
1414
+ "context_window": 128000,
1415
+ "size_b": 14,
1416
  "capabilities": [
1417
  "tools",
1418
  "reasoning"
1419
  ],
1420
+ "hf_id": "deepseek-ai/DeepSeek-R1"
1421
  },
1422
  {
1423
  "name": "novita/mistralai/mistral-nemo",
 
1441
  "size_b": 8
1442
  },
1443
  {
1444
+ "name": "openai/gpt-5.4-nano",
1445
  "type": "vision",
1446
  "input_price_per_1m": 0.2,
1447
+ "output_price_per_1m": 1.25,
1448
  "currency": "USD",
 
 
1449
  "capabilities": [
1450
  "vision",
1451
+ "reasoning"
1452
  ],
1453
+ "context_window": 400000
1454
+ },
1455
+ {
1456
+ "name": "alibaba/qwen3-30b-a3b-instruct-2507",
1457
+ "type": "vision",
1458
+ "input_price_per_1m": 0.2,
1459
+ "output_price_per_1m": 0.8,
1460
+ "currency": "USD",
1461
+ "capabilities": [
1462
+ "vision"
1463
+ ],
1464
+ "context_window": 131072,
1465
+ "size_b": 30,
1466
+ "hf_id": "Qwen/Qwen3-30B-A3B-Instruct-2507"
1467
  },
1468
  {
1469
  "name": "novita/qwen/qwen3-235b-a22b-fp8",
 
1480
  "hf_id": "Qwen/Qwen3-235B-A22B"
1481
  },
1482
  {
1483
+ "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1484
  "type": "vision",
1485
  "input_price_per_1m": 0.2,
1486
+ "output_price_per_1m": 0.85,
1487
  "currency": "USD",
1488
+ "context_window": 1048576,
1489
+ "size_b": 17,
1490
  "capabilities": [
1491
  "vision",
1492
+ "tools"
1493
  ],
1494
+ "hf_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct"
1495
  },
1496
  {
1497
+ "name": "xai/grok-4-fast-non-reasoning",
1498
  "type": "vision",
1499
  "input_price_per_1m": 0.2,
1500
+ "output_price_per_1m": 0.5,
1501
  "currency": "USD",
1502
+ "context_window": 2000000,
1503
  "capabilities": [
1504
  "vision",
1505
+ "tools",
 
 
 
 
 
 
 
 
 
 
 
 
 
1506
  "reasoning"
1507
  ]
1508
  },
1509
  {
1510
+ "name": "xai/grok-4-1-fast-reasoning",
1511
  "type": "vision",
1512
  "input_price_per_1m": 0.2,
1513
  "output_price_per_1m": 0.5,
 
1518
  "context_window": 2000000
1519
  },
1520
  {
1521
+ "name": "xai/grok-4-1-fast-non-reasoning",
1522
  "type": "vision",
1523
  "input_price_per_1m": 0.2,
1524
+ "output_price_per_1m": 0.5,
1525
  "currency": "USD",
1526
  "capabilities": [
1527
  "vision"
1528
  ],
1529
+ "context_window": 2000000
1530
  },
1531
  {
1532
  "name": "xai/grok-4-fast",
 
1542
  ]
1543
  },
1544
  {
1545
+ "name": "xai/grok-code-fast-1",
1546
  "type": "vision",
1547
  "input_price_per_1m": 0.2,
1548
+ "output_price_per_1m": 1.5,
1549
  "currency": "USD",
1550
  "capabilities": [
1551
  "vision"
1552
  ],
1553
+ "context_window": 256000
1554
  },
1555
  {
1556
  "name": "together/meta-llama/LlamaGuard-2-8b",
 
1562
  "size_b": 8
1563
  },
1564
  {
1565
+ "name": "openai-responses/gpt-5.4-nano",
1566
+ "type": "vision",
1567
  "input_price_per_1m": 0.2,
1568
+ "output_price_per_1m": 1.25,
1569
  "currency": "USD",
 
1570
  "capabilities": [
1571
+ "vision",
1572
  "reasoning"
1573
  ],
1574
+ "context_window": 400000
 
1575
  },
1576
  {
1577
  "name": "deepinfra/Qwen/Qwen3-235B-A22B",
 
1588
  "hf_id": "Qwen/Qwen3-235B-A22B"
1589
  },
1590
  {
1591
+ "name": "deepinfra/zai-org/GLM-4.5-Air",
1592
+ "type": "chat",
1593
  "input_price_per_1m": 0.2,
1594
+ "output_price_per_1m": 1.1,
1595
  "currency": "USD",
1596
+ "context_window": 131072,
1597
  "capabilities": [
1598
+ "tools",
1599
+ "reasoning"
1600
  ],
1601
+ "hf_id": "zai-org/GLM-4.5-Air",
1602
+ "size_b": 110.5
1603
+ },
1604
+ {
1605
+ "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct",
1606
+ "type": "chat",
1607
+ "input_price_per_1m": 0.23,
1608
+ "output_price_per_1m": 0.4,
1609
+ "currency": "USD",
1610
  "context_window": 131072,
1611
+ "size_b": 70,
1612
+ "capabilities": [
1613
+ "tools"
1614
+ ],
1615
+ "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
1616
  },
1617
  {
1618
  "name": "deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
 
1650
  "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct"
1651
  },
1652
  {
1653
+ "name": "google/gemini-3.1-flash-lite-preview",
 
 
 
 
 
 
 
 
 
 
 
 
 
1654
  "type": "vision",
1655
  "input_price_per_1m": 0.25,
1656
  "output_price_per_1m": 1.5,
 
1670
  "size_b": 7
1671
  },
1672
  {
1673
+ "name": "vertex/gemini-3.1-flash-lite-preview",
1674
  "type": "vision",
1675
  "input_price_per_1m": 0.25,
1676
+ "output_price_per_1m": 1.5,
1677
  "currency": "USD",
1678
  "capabilities": [
1679
+ "vision"
 
1680
  ],
1681
+ "context_window": 1048576
1682
  },
1683
  {
1684
+ "name": "azure/gpt-5-mini",
1685
  "type": "vision",
1686
  "input_price_per_1m": 0.25,
1687
+ "output_price_per_1m": 2,
1688
  "currency": "USD",
1689
  "capabilities": [
1690
+ "reasoning"
1691
  ],
1692
+ "context_window": 200000
1693
  },
1694
  {
1695
+ "name": "openai-responses/gpt-5-mini",
1696
  "type": "vision",
1697
  "input_price_per_1m": 0.25,
1698
  "output_price_per_1m": 2,
1699
  "currency": "USD",
1700
  "capabilities": [
1701
+ "vision",
1702
  "reasoning"
1703
  ],
1704
+ "context_window": 400000
1705
  },
1706
  {
1707
  "name": "novita/deepseek/deepseek-v3.2",
 
1713
  "reasoning"
1714
  ],
1715
  "context_window": 163840,
1716
+ "hf_id": "deepseek-ai/DeepSeek-V3.2",
1717
+ "size_b": 685.4
1718
  },
1719
  {
1720
  "name": "deepseek/deepseek-chat",
 
1737
  "context_window": 128000
1738
  },
1739
  {
1740
+ "name": "nebius/minimax/minimax-m2.1",
1741
+ "type": "chat",
1742
  "input_price_per_1m": 0.3,
1743
  "output_price_per_1m": 1.2,
1744
  "currency": "USD",
1745
  "capabilities": [
 
1746
  "reasoning"
1747
  ],
1748
  "context_window": 200000,
1749
+ "hf_id": "MiniMaxAI/MiniMax-M2.1",
1750
+ "size_b": 228.7
1751
  },
1752
  {
1753
+ "name": "nebius/deepseek-ai/DeepSeek-V3.2",
1754
  "type": "chat",
1755
  "input_price_per_1m": 0.3,
1756
+ "output_price_per_1m": 0.45,
1757
  "currency": "USD",
 
 
1758
  "capabilities": [
1759
  "reasoning"
1760
  ],
1761
+ "context_window": 164000,
1762
+ "hf_id": "deepseek-ai/DeepSeek-V3.2",
1763
+ "size_b": 685.4
1764
  },
1765
  {
1766
+ "name": "parasail/parasail-gemma3-27b-it",
1767
+ "type": "chat",
1768
+ "input_price_per_1m": 0.3,
1769
+ "output_price_per_1m": 0.5,
1770
+ "currency": "USD",
1771
+ "context_window": 128000,
1772
+ "size_b": 27
1773
+ },
1774
+ {
1775
+ "name": "alibaba/qwen3-coder-flash",
1776
  "type": "vision",
1777
  "input_price_per_1m": 0.3,
1778
+ "output_price_per_1m": 1.5,
1779
  "currency": "USD",
1780
  "capabilities": [
1781
+ "vision"
 
1782
  ],
1783
+ "context_window": 1048576
 
1784
  },
1785
  {
1786
+ "name": "google/gemini-2.5-flash",
1787
  "type": "vision",
1788
  "input_price_per_1m": 0.3,
1789
  "output_price_per_1m": 2.5,
 
1795
  "context_window": 1048576
1796
  },
1797
  {
1798
+ "name": "mistral/codestral-latest",
1799
+ "type": "chat",
1800
+ "input_price_per_1m": 0.3,
1801
+ "output_price_per_1m": 0.9,
1802
+ "currency": "USD",
1803
+ "context_window": 131072
1804
+ },
1805
+ {
1806
+ "name": "vertex/gemini-2.5-flash",
1807
  "type": "vision",
1808
  "input_price_per_1m": 0.3,
1809
  "output_price_per_1m": 2.5,
 
1815
  "context_window": 1048576
1816
  },
1817
  {
1818
+ "name": "vertex/gemini-2.5-flash-image",
1819
  "type": "vision",
1820
  "input_price_per_1m": 0.3,
1821
  "output_price_per_1m": 2.5,
 
1827
  "context_window": 1048576
1828
  },
1829
  {
1830
+ "name": "novita/minimax-m2.7",
1831
+ "type": "vision",
 
 
 
 
 
 
 
 
1832
  "input_price_per_1m": 0.3,
1833
+ "output_price_per_1m": 1.2,
1834
  "currency": "USD",
1835
  "capabilities": [
1836
+ "vision",
1837
  "reasoning"
1838
  ],
1839
+ "context_window": 200000,
1840
+ "hf_id": "MiniMaxAI/MiniMax-M2.7"
1841
  },
1842
  {
1843
+ "name": "novita/deepseek/deepseek-r1-distill-qwen-32b",
1844
  "type": "chat",
1845
  "input_price_per_1m": 0.3,
1846
  "output_price_per_1m": 0.3,
1847
  "currency": "USD",
1848
+ "context_window": 12800,
1849
+ "size_b": 32,
 
 
 
 
 
 
 
 
1850
  "capabilities": [
 
1851
  "reasoning"
1852
  ],
1853
+ "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
 
 
 
 
 
 
 
 
 
1854
  },
1855
  {
1856
+ "name": "novita/MiniMax-M2.7",
1857
  "type": "vision",
1858
  "input_price_per_1m": 0.3,
1859
+ "output_price_per_1m": 1.2,
1860
  "currency": "USD",
1861
  "capabilities": [
1862
  "vision",
1863
  "reasoning"
1864
  ],
1865
+ "context_window": 200000,
1866
+ "hf_id": "MiniMaxAI/MiniMax-M2.7"
1867
  },
1868
  {
1869
+ "name": "minimaxi/MiniMax-M2",
1870
  "type": "chat",
1871
  "input_price_per_1m": 0.3,
1872
+ "output_price_per_1m": 1.2,
1873
  "currency": "USD",
1874
+ "context_window": 200000,
1875
  "capabilities": [
1876
+ "tools",
1877
  "reasoning"
1878
  ],
1879
+ "hf_id": "MiniMaxAI/MiniMax-M2",
1880
+ "size_b": 228.7
1881
  },
1882
  {
1883
+ "name": "minimaxi/MiniMax-M2.5",
1884
+ "type": "vision",
1885
  "input_price_per_1m": 0.3,
1886
  "output_price_per_1m": 1.2,
1887
  "currency": "USD",
1888
  "capabilities": [
1889
+ "vision",
1890
  "reasoning"
1891
  ],
1892
  "context_window": 200000,
1893
+ "hf_id": "MiniMaxAI/MiniMax-M2.5",
1894
+ "size_b": 228.7
1895
  },
1896
  {
1897
  "name": "minimaxi/MiniMax-M2.7",
 
1907
  "hf_id": "MiniMaxAI/MiniMax-M2.7"
1908
  },
1909
  {
1910
+ "name": "xai/grok-3-mini",
1911
  "type": "chat",
1912
  "input_price_per_1m": 0.3,
1913
+ "output_price_per_1m": 0.5,
1914
  "currency": "USD",
 
1915
  "capabilities": [
 
1916
  "reasoning"
1917
  ],
1918
+ "context_window": 131072
1919
  },
1920
  {
1921
+ "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
1922
+ "type": "chat",
1923
+ "input_price_per_1m": 0.3,
1924
+ "output_price_per_1m": 0.3,
1925
+ "currency": "USD",
1926
+ "context_window": 32768,
1927
+ "size_b": 7
1928
+ },
1929
+ {
1930
+ "name": "coding/gemini-2.5-flash",
1931
  "type": "vision",
1932
  "input_price_per_1m": 0.3,
1933
+ "output_price_per_1m": 2.5,
1934
  "currency": "USD",
1935
  "capabilities": [
1936
  "vision",
1937
  "reasoning"
1938
  ],
1939
+ "context_window": 1048576
 
1940
  },
1941
  {
1942
+ "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
1943
+ "type": "chat",
1944
  "input_price_per_1m": 0.3,
1945
+ "output_price_per_1m": 1,
1946
  "currency": "USD",
1947
+ "context_window": 163840,
1948
  "capabilities": [
1949
+ "tools",
1950
+ "reasoning"
1951
  ],
1952
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus"
1953
  },
1954
  {
1955
  "name": "deepinfra/meta-llama/Llama-3.2-90B-Vision-Instruct",
 
1987
  "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
1988
  },
1989
  {
1990
+ "name": "openai/gpt-4.1-mini",
1991
+ "type": "vision",
1992
  "input_price_per_1m": 0.4,
1993
+ "output_price_per_1m": 1.6,
1994
  "currency": "USD",
 
1995
  "capabilities": [
1996
+ "vision"
 
1997
  ],
1998
+ "context_window": 1047576
 
 
 
 
 
 
 
 
 
1999
  },
2000
  {
2001
+ "name": "nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2002
+ "type": "chat",
2003
  "input_price_per_1m": 0.4,
2004
+ "output_price_per_1m": 1.8,
2005
  "currency": "USD",
2006
+ "context_window": 262000,
2007
+ "size_b": 480,
2008
  "capabilities": [
2009
+ "tools"
2010
  ],
2011
+ "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct"
2012
  },
2013
  {
2014
+ "name": "nebius/zai-org/GLM-4.7",
2015
  "type": "chat",
2016
  "input_price_per_1m": 0.4,
2017
  "output_price_per_1m": 2,
2018
  "currency": "USD",
2019
+ "capabilities": [
2020
+ "reasoning"
2021
+ ],
2022
+ "context_window": 200000,
2023
+ "hf_id": "zai-org/GLM-4.7",
2024
+ "size_b": 358.3
2025
  },
2026
  {
2027
+ "name": "alibaba/qwen-plus",
2028
  "type": "chat",
2029
  "input_price_per_1m": 0.4,
2030
+ "output_price_per_1m": 1.2,
2031
  "currency": "USD",
2032
  "context_window": 131072,
2033
  "capabilities": [
 
2043
  "context_window": 131072
2044
  },
2045
  {
2046
+ "name": "mistral/devstral-medium-2507",
2047
+ "type": "chat",
2048
  "input_price_per_1m": 0.4,
2049
+ "output_price_per_1m": 2,
2050
  "currency": "USD",
2051
+ "context_window": 131072,
2052
  "capabilities": [
2053
+ "tools"
2054
+ ]
 
2055
  },
2056
  {
2057
+ "name": "mistral/devstral-latest",
2058
  "type": "chat",
2059
  "input_price_per_1m": 0.4,
2060
+ "output_price_per_1m": 2,
2061
  "currency": "USD",
2062
+ "context_window": 256000
 
 
 
 
 
2063
  },
2064
  {
2065
  "name": "azure/gpt-4.1-mini",
 
2084
  "context_window": 1047576
2085
  },
2086
  {
2087
+ "name": "novita/deepseek/deepseek-v3-0324",
2088
  "type": "chat",
2089
  "input_price_per_1m": 0.4,
2090
+ "output_price_per_1m": 1.3,
2091
  "currency": "USD",
2092
+ "context_window": 128000,
2093
  "capabilities": [
2094
+ "tools",
2095
  "reasoning"
2096
  ],
2097
+ "size_b": 685,
2098
+ "hf_id": "deepseek-ai/DeepSeek-V3-0324"
2099
  },
2100
  {
2101
+ "name": "novita/deepseek/deepseek-v3-turbo",
2102
  "type": "chat",
2103
  "input_price_per_1m": 0.4,
2104
+ "output_price_per_1m": 1.3,
2105
+ "currency": "USD",
2106
+ "context_window": 128000
2107
+ },
2108
+ {
2109
+ "name": "openai-responses/gpt-4.1-mini",
2110
+ "type": "vision",
2111
+ "input_price_per_1m": 0.4,
2112
+ "output_price_per_1m": 1.6,
2113
  "currency": "USD",
 
 
2114
  "capabilities": [
2115
+ "vision"
2116
  ],
2117
+ "context_window": 1047576
2118
  },
2119
  {
2120
+ "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2121
  "type": "chat",
2122
  "input_price_per_1m": 0.4,
2123
+ "output_price_per_1m": 1.6,
2124
  "currency": "USD",
2125
+ "context_window": 262144,
2126
+ "size_b": 480,
2127
  "capabilities": [
2128
  "tools"
2129
+ ],
2130
+ "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct"
2131
  },
2132
  {
2133
+ "name": "nebius/deepseek-ai/DeepSeek-V3-0324",
2134
+ "type": "chat",
2135
  "input_price_per_1m": 0.5,
2136
+ "output_price_per_1m": 1.5,
2137
  "currency": "USD",
2138
+ "context_window": 128000,
2139
  "capabilities": [
2140
+ "tools",
2141
  "reasoning"
2142
  ],
2143
+ "size_b": 685,
2144
+ "hf_id": "deepseek-ai/DeepSeek-V3-0324"
2145
  },
2146
  {
2147
+ "name": "nebius/moonshotai/Kimi-K2-Instruct",
2148
+ "type": "chat",
2149
  "input_price_per_1m": 0.5,
2150
+ "output_price_per_1m": 2.4,
2151
  "currency": "USD",
2152
+ "context_window": 131000,
2153
  "capabilities": [
2154
+ "tools"
 
2155
  ],
2156
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2157
+ "size_b": 1026.5
2158
  },
2159
  {
2160
+ "name": "nebius/moonshotai/kimi-k2.5",
2161
+ "type": "vision",
2162
  "input_price_per_1m": 0.5,
2163
+ "output_price_per_1m": 2.5,
2164
  "currency": "USD",
 
2165
  "capabilities": [
2166
+ "vision",
2167
+ "reasoning"
2168
+ ],
2169
+ "context_window": 256000,
2170
+ "hf_id": "moonshotai/Kimi-K2.5",
2171
+ "size_b": 1058.6
2172
  },
2173
  {
2174
  "name": "google/gemini-3.1-flash-image-preview",
 
2195
  "context_window": 1048576
2196
  },
2197
  {
2198
+ "name": "mistral/mistral-large-latest",
2199
  "type": "chat",
2200
  "input_price_per_1m": 0.5,
2201
+ "output_price_per_1m": 1.5,
2202
  "currency": "USD",
2203
+ "context_window": 131072,
2204
  "capabilities": [
2205
  "tools"
2206
+ ]
 
2207
  },
2208
  {
2209
+ "name": "vertex/gemini-3-flash-preview",
2210
+ "type": "vision",
2211
  "input_price_per_1m": 0.5,
2212
+ "output_price_per_1m": 3,
2213
  "currency": "USD",
 
2214
  "capabilities": [
2215
+ "vision",
2216
  "reasoning"
2217
  ],
2218
+ "context_window": 1048576
 
2219
  },
2220
  {
2221
+ "name": "vertex/gemini-3.1-flash-image-preview",
2222
  "type": "vision",
2223
  "input_price_per_1m": 0.5,
2224
+ "output_price_per_1m": 2,
2225
  "currency": "USD",
2226
  "capabilities": [
2227
  "vision",
2228
  "reasoning"
2229
  ],
2230
+ "context_window": 131072
 
 
2231
  },
2232
  {
2233
  "name": "novita/meta-llama/llama-3-70b-instruct",
 
2264
  "reasoning"
2265
  ],
2266
  "context_window": 163840,
2267
+ "hf_id": "deepseek-ai/DeepSeek-V3.2",
2268
+ "size_b": 685.4
2269
  },
2270
  {
2271
  "name": "novita/moonshotai/kimi-k2-instruct",
 
2277
  "capabilities": [
2278
  "tools"
2279
  ],
2280
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2281
+ "size_b": 1026.5
2282
  },
2283
  {
2284
+ "name": "zai/GLM-4.7",
2285
  "type": "chat",
2286
  "input_price_per_1m": 0.6,
2287
  "output_price_per_1m": 2.2,
2288
  "currency": "USD",
 
2289
  "capabilities": [
 
2290
  "reasoning"
2291
  ],
2292
+ "context_window": 200000,
2293
+ "hf_id": "zai-org/GLM-4.7",
2294
+ "size_b": 358.3
2295
  },
2296
  {
2297
+ "name": "zai/GLM-4.5",
2298
  "type": "chat",
2299
  "input_price_per_1m": 0.6,
2300
  "output_price_per_1m": 2.2,
2301
  "currency": "USD",
 
2302
  "capabilities": [
 
2303
  "reasoning"
2304
  ],
2305
+ "context_window": 131072,
2306
+ "hf_id": "zai-org/GLM-4.5",
2307
+ "size_b": 358.3
2308
  },
2309
  {
2310
+ "name": "zai/GLM-4.6",
2311
  "type": "chat",
2312
  "input_price_per_1m": 0.6,
2313
  "output_price_per_1m": 2.2,
 
2315
  "capabilities": [
2316
  "reasoning"
2317
  ],
2318
+ "context_window": 200000,
2319
+ "hf_id": "zai-org/GLM-4.6",
2320
+ "size_b": 356.8
2321
  },
2322
  {
2323
+ "name": "nebius/zai-org/GLM-4.5",
2324
  "type": "chat",
2325
  "input_price_per_1m": 0.6,
2326
  "output_price_per_1m": 2.2,
2327
  "currency": "USD",
2328
+ "context_window": 128000,
2329
  "capabilities": [
2330
+ "tools",
2331
  "reasoning"
2332
  ],
2333
+ "hf_id": "zai-org/GLM-4.5",
2334
+ "size_b": 358.3
2335
  },
2336
  {
2337
+ "name": "alibaba/qwen3.5",
2338
+ "type": "vision",
2339
  "input_price_per_1m": 0.6,
2340
+ "output_price_per_1m": 3.6,
2341
  "currency": "USD",
2342
  "capabilities": [
2343
+ "vision",
2344
  "reasoning"
2345
  ],
2346
+ "context_window": 256000,
2347
+ "size_b": 9,
2348
+ "hf_id": "Qwen/Qwen3.5-9B"
2349
  },
2350
  {
2351
  "name": "moonshot/kimi-k2-0711-preview",
 
2357
  "capabilities": [
2358
  "tools"
2359
  ],
2360
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2361
+ "size_b": 1026.5
2362
  },
2363
  {
2364
  "name": "moonshot/kimi-k2.5",
 
2385
  "tools",
2386
  "reasoning"
2387
  ],
2388
+ "hf_id": "moonshotai/Kimi-K2-Thinking",
2389
+ "size_b": 1058.1
2390
  },
2391
  {
2392
  "name": "moonshot/kimi-k2-0905-preview",
 
2398
  "capabilities": [
2399
  "tools"
2400
  ],
2401
+ "hf_id": "moonshotai/Kimi-K2-Instruct-0905",
2402
+ "size_b": 1026.5
2403
  },
2404
  {
2405
  "name": "moonshot/kimi-k2-thinking",
 
2411
  "capabilities": [
2412
  "tools"
2413
  ],
2414
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2415
+ "size_b": 1026.5
2416
  },
2417
  {
2418
+ "name": "novita/zai-org/glm-4.5",
2419
  "type": "chat",
2420
  "input_price_per_1m": 0.6,
2421
  "output_price_per_1m": 2.2,
 
2425
  "tools",
2426
  "reasoning"
2427
  ],
2428
+ "hf_id": "zai-org/GLM-4.5",
2429
+ "size_b": 358.3
2430
  },
2431
  {
2432
+ "name": "novita/zai-org/glm-4.6",
2433
  "type": "chat",
2434
  "input_price_per_1m": 0.6,
2435
  "output_price_per_1m": 2.2,
2436
  "currency": "USD",
2437
+ "context_window": 204800,
2438
  "capabilities": [
2439
  "tools",
2440
  "reasoning"
2441
  ],
2442
+ "hf_id": "zai-org/GLM-4.6",
2443
+ "size_b": 356.8
2444
  },
2445
  {
2446
+ "name": "minimaxi/MiniMax-M2.5-highspeed",
2447
  "type": "vision",
2448
  "input_price_per_1m": 0.6,
2449
  "output_price_per_1m": 2.4,
 
2453
  "reasoning"
2454
  ],
2455
  "context_window": 200000,
2456
+ "hf_id": "MiniMaxAI/MiniMax-M2.5",
2457
+ "size_b": 228.7
2458
  },
2459
  {
2460
+ "name": "minimaxi/MiniMax-M2.7-highspeed",
2461
  "type": "vision",
2462
  "input_price_per_1m": 0.6,
2463
  "output_price_per_1m": 2.4,
 
2467
  "reasoning"
2468
  ],
2469
  "context_window": 200000,
2470
+ "hf_id": "MiniMaxAI/MiniMax-M2.7"
2471
  },
2472
  {
2473
+ "name": "deepinfra/zai-org/GLM-4.5",
2474
+ "type": "chat",
2475
  "input_price_per_1m": 0.6,
2476
+ "output_price_per_1m": 2.2,
2477
  "currency": "USD",
2478
+ "context_window": 131072,
2479
  "capabilities": [
2480
+ "tools",
2481
  "reasoning"
2482
  ],
2483
+ "hf_id": "zai-org/GLM-4.5",
2484
+ "size_b": 358.3
 
2485
  },
2486
  {
2487
  "name": "novita/microsoft/wizardlm-2-8x22b",
 
2505
  "context_window": 400000
2506
  },
2507
  {
2508
+ "name": "parasail/parasail-qwen25-vl-72b-instruct",
2509
+ "type": "vision",
2510
  "input_price_per_1m": 0.7,
2511
+ "output_price_per_1m": 0.7,
2512
  "currency": "USD",
2513
+ "capabilities": [
2514
+ "vision"
2515
+ ],
2516
+ "context_window": 32768,
2517
+ "size_b": 72
2518
  },
2519
  {
2520
  "name": "novita/deepseek/deepseek-r1-turbo",
 
2527
  "tools",
2528
  "reasoning"
2529
  ],
2530
+ "hf_id": "deepseek-ai/DeepSeek-R1",
2531
+ "size_b": 684.5
2532
  },
2533
  {
2534
+ "name": "novita/deepseek/deepseek-prover-v2-671b",
2535
+ "type": "chat",
2536
  "input_price_per_1m": 0.7,
2537
+ "output_price_per_1m": 2.5,
2538
  "currency": "USD",
2539
+ "context_window": 160000,
2540
+ "size_b": 671
 
 
 
2541
  },
2542
  {
2543
  "name": "openai/gpt-5.4-mini",
 
2561
  "vision",
2562
  "reasoning"
2563
  ],
2564
+ "context_window": 400000
2565
+ },
2566
+ {
2567
+ "name": "nebius/deepseek-ai/DeepSeek-R1-0528",
2568
+ "type": "chat",
2569
+ "input_price_per_1m": 0.8,
2570
+ "output_price_per_1m": 2.4,
2571
+ "currency": "USD",
2572
+ "context_window": 164000,
2573
+ "capabilities": [
2574
+ "tools",
2575
+ "reasoning"
2576
+ ],
2577
+ "hf_id": "deepseek-ai/DeepSeek-R1-0528",
2578
+ "size_b": 684.5
2579
  },
2580
  {
2581
  "name": "novita/deepseek/deepseek-r1-distill-llama-70b",
 
2613
  "size_b": 405
2614
  },
2615
  {
2616
+ "name": "deepinfra/deepseek-ai/DeepSeek-V3",
2617
  "type": "chat",
2618
+ "input_price_per_1m": 0.85,
2619
+ "output_price_per_1m": 0.9,
2620
  "currency": "USD",
2621
+ "context_window": 128000,
2622
  "capabilities": [
2623
  "tools",
2624
  "reasoning"
2625
  ],
2626
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus"
2627
  },
2628
  {
2629
  "name": "deepinfra/deepseek-ai/DeepSeek-R1",
 
2636
  "tools",
2637
  "reasoning"
2638
  ],
2639
+ "hf_id": "deepseek-ai/DeepSeek-R1",
2640
+ "size_b": 684.5
 
 
 
 
 
 
 
 
 
 
 
 
2641
  },
2642
  {
2643
  "name": "alibaba/qwen3-max",
 
2651
  "context_window": 262144
2652
  },
2653
  {
2654
+ "name": "together/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
2655
  "type": "chat",
2656
  "input_price_per_1m": 0.88,
2657
  "output_price_per_1m": 0.88,
2658
  "currency": "USD",
2659
  "context_window": 131072,
2660
+ "size_b": 70
 
 
 
 
2661
  },
2662
  {
2663
+ "name": "together/meta-llama/Llama-3.3-70B-Instruct-Turbo",
2664
  "type": "chat",
2665
  "input_price_per_1m": 0.88,
2666
  "output_price_per_1m": 0.88,
2667
  "currency": "USD",
2668
  "context_window": 131072,
2669
+ "size_b": 70,
2670
+ "capabilities": [
2671
+ "tools"
2672
+ ],
2673
+ "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
2674
  },
2675
  {
2676
  "name": "novita/deepseek/deepseek_v3",
 
2694
  "context_window": 131072
2695
  },
2696
  {
2697
+ "name": "zai/GLM-5",
2698
  "type": "vision",
2699
  "input_price_per_1m": 1,
2700
+ "output_price_per_1m": 3.2,
2701
  "currency": "USD",
 
2702
  "capabilities": [
2703
+ "vision",
2704
+ "reasoning"
2705
+ ],
2706
+ "context_window": 200000,
2707
+ "hf_id": "zai-org/GLM-5",
2708
+ "size_b": 753.9
2709
  },
2710
  {
2711
+ "name": "groq/moonshotai/kimi-k2-instruct",
2712
+ "type": "chat",
2713
  "input_price_per_1m": 1,
2714
+ "output_price_per_1m": 3,
2715
  "currency": "USD",
2716
+ "context_window": 131072,
2717
  "capabilities": [
2718
+ "tools"
2719
  ],
2720
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2721
+ "size_b": 1026.5
2722
  },
2723
  {
2724
+ "name": "groq/moonshotai/Kimi-K2-Instruct-0905",
2725
  "type": "chat",
2726
  "input_price_per_1m": 1,
2727
+ "output_price_per_1m": 3,
2728
  "currency": "USD",
2729
+ "context_window": 256000,
2730
  "capabilities": [
2731
+ "tools"
2732
  ],
2733
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2734
+ "size_b": 1026.5
2735
  },
2736
  {
2737
+ "name": "anthropic/claude-haiku-4-5",
2738
  "type": "vision",
2739
  "input_price_per_1m": 1,
2740
  "output_price_per_1m": 5,
 
2757
  "context_window": 200000
2758
  },
2759
  {
2760
+ "name": "alibaba/qwen3-coder-plus",
2761
  "type": "vision",
2762
  "input_price_per_1m": 1,
2763
+ "output_price_per_1m": 5,
2764
  "currency": "USD",
2765
  "capabilities": [
2766
+ "vision"
 
2767
  ],
2768
+ "context_window": 1048576
 
2769
  },
2770
  {
2771
+ "name": "bedrock/claude-haiku-4-5",
2772
  "type": "vision",
2773
  "input_price_per_1m": 1,
2774
  "output_price_per_1m": 5,
 
2779
  "context_window": 200000
2780
  },
2781
  {
2782
+ "name": "perplexity/sonar",
2783
  "type": "vision",
2784
  "input_price_per_1m": 1,
2785
+ "output_price_per_1m": 1,
2786
  "currency": "USD",
2787
+ "context_window": 131072,
2788
  "capabilities": [
2789
  "vision"
2790
+ ]
 
2791
  },
2792
  {
2793
+ "name": "vertex/claude-haiku-4-5",
2794
+ "type": "vision",
2795
  "input_price_per_1m": 1,
2796
+ "output_price_per_1m": 5,
2797
  "currency": "USD",
 
2798
  "capabilities": [
2799
+ "vision"
2800
  ],
2801
+ "context_window": 200000
2802
  },
2803
  {
2804
+ "name": "novita/GLM-5",
2805
  "type": "chat",
2806
  "input_price_per_1m": 1,
2807
+ "output_price_per_1m": 3.2,
2808
  "currency": "USD",
 
2809
  "capabilities": [
2810
+ "reasoning"
2811
  ],
2812
+ "context_window": 202800,
2813
+ "hf_id": "zai-org/GLM-5",
2814
+ "size_b": 753.9
2815
  },
2816
  {
2817
  "name": "openai/o3-mini",
 
2825
  "context_window": 200000
2826
  },
2827
  {
2828
+ "name": "azure/o4-mini",
2829
  "type": "vision",
2830
  "input_price_per_1m": 1.1,
2831
  "output_price_per_1m": 4.4,
 
2847
  "context_window": 200000
2848
  },
2849
  {
2850
+ "name": "openai-responses/o4-mini",
2851
  "type": "vision",
2852
  "input_price_per_1m": 1.1,
2853
  "output_price_per_1m": 4.4,
 
2867
  "capabilities": [
2868
  "tools"
2869
  ],
2870
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2871
+ "size_b": 1026.5
2872
  },
2873
  {
2874
  "name": "together/Qwen/Qwen2.5-72B-Instruct-Turbo",
 
2880
  "size_b": 72
2881
  },
2882
  {
2883
+ "name": "openai/gpt-5.1",
2884
  "type": "vision",
2885
  "input_price_per_1m": 1.25,
2886
  "output_price_per_1m": 10,
 
2889
  "vision",
2890
  "reasoning"
2891
  ],
2892
+ "context_window": 400000
2893
  },
2894
  {
2895
+ "name": "openai/gpt-5.1-chat",
2896
  "type": "vision",
2897
  "input_price_per_1m": 1.25,
2898
  "output_price_per_1m": 10,
 
2904
  "context_window": 128000
2905
  },
2906
  {
2907
+ "name": "openai/gpt-5-chat",
2908
  "type": "vision",
2909
  "input_price_per_1m": 1.25,
2910
  "output_price_per_1m": 10,
 
2913
  "vision",
2914
  "reasoning"
2915
  ],
2916
+ "context_window": 128000
2917
  },
2918
  {
2919
+ "name": "google/gemini-2.5-pro",
2920
  "type": "vision",
2921
  "input_price_per_1m": 1.25,
2922
  "output_price_per_1m": 10,
 
2925
  "vision",
2926
  "reasoning"
2927
  ],
2928
+ "context_window": 1048576
2929
  },
2930
  {
2931
+ "name": "vertex/gemini-2.5-pro",
2932
  "type": "vision",
2933
  "input_price_per_1m": 1.25,
2934
  "output_price_per_1m": 10,
 
2940
  "context_window": 1048576
2941
  },
2942
  {
2943
+ "name": "azure/gpt-5.1",
2944
  "type": "vision",
2945
  "input_price_per_1m": 1.25,
2946
  "output_price_per_1m": 10,
2947
  "currency": "USD",
2948
  "capabilities": [
 
2949
  "reasoning"
2950
  ],
2951
+ "context_window": 200000
2952
  },
2953
  {
2954
+ "name": "azure/gpt-5",
2955
  "type": "vision",
2956
  "input_price_per_1m": 1.25,
2957
  "output_price_per_1m": 10,
2958
  "currency": "USD",
2959
  "capabilities": [
 
2960
  "reasoning"
2961
  ],
2962
+ "context_window": 200000
2963
  },
2964
  {
2965
+ "name": "together/deepseek-ai/DeepSeek-V3",
2966
+ "type": "chat",
2967
  "input_price_per_1m": 1.25,
2968
+ "output_price_per_1m": 1.25,
2969
  "currency": "USD",
2970
+ "context_window": 131072,
2971
  "capabilities": [
2972
+ "tools",
2973
  "reasoning"
2974
  ],
2975
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus"
2976
  },
2977
  {
2978
  "name": "openai-responses/gpt-5-codex",
 
2987
  "context_window": 400000
2988
  },
2989
  {
2990
+ "name": "openai-responses/gpt-5.1",
2991
+ "type": "vision",
2992
  "input_price_per_1m": 1.25,
2993
+ "output_price_per_1m": 10,
2994
  "currency": "USD",
 
2995
  "capabilities": [
2996
+ "vision",
2997
  "reasoning"
2998
  ],
2999
+ "context_window": 400000
3000
  },
3001
  {
3002
+ "name": "openai-responses/gpt-5",
3003
  "type": "vision",
3004
  "input_price_per_1m": 1.25,
3005
  "output_price_per_1m": 10,
 
3008
  "vision",
3009
  "reasoning"
3010
  ],
3011
+ "context_window": 400000
3012
  },
3013
  {
3014
+ "name": "openai-responses/gpt-5.1-codex",
3015
  "type": "vision",
3016
  "input_price_per_1m": 1.25,
3017
  "output_price_per_1m": 10,
3018
  "currency": "USD",
3019
  "capabilities": [
3020
+ "vision",
3021
  "reasoning"
3022
  ],
3023
+ "context_window": 400000
3024
  },
3025
  {
3026
+ "name": "coding/gemini-2.5-pro",
3027
  "type": "vision",
3028
  "input_price_per_1m": 1.25,
3029
  "output_price_per_1m": 10,
3030
  "currency": "USD",
3031
  "capabilities": [
3032
+ "vision",
3033
  "reasoning"
3034
  ],
3035
+ "context_window": 1048576
3036
  },
3037
  {
3038
  "name": "novita/sao10k/l31-70b-euryale-v2.2",
 
3064
  ]
3065
  },
3066
  {
3067
+ "name": "openai/gpt-5.2",
3068
  "type": "vision",
3069
  "input_price_per_1m": 1.75,
3070
  "output_price_per_1m": 14,
 
3073
  "vision",
3074
  "reasoning"
3075
  ],
3076
+ "context_window": 400000
3077
  },
3078
  {
3079
+ "name": "openai/gpt-5.2-chat",
3080
  "type": "vision",
3081
  "input_price_per_1m": 1.75,
3082
  "output_price_per_1m": 14,
 
3085
  "vision",
3086
  "reasoning"
3087
  ],
3088
+ "context_window": 128000
3089
  },
3090
  {
3091
+ "name": "openai/gpt-5.3-chat",
3092
  "type": "vision",
3093
  "input_price_per_1m": 1.75,
3094
  "output_price_per_1m": 14,
 
3100
  "context_window": 128000
3101
  },
3102
  {
3103
+ "name": "azure/gpt-5.2",
3104
  "type": "vision",
3105
  "input_price_per_1m": 1.75,
3106
  "output_price_per_1m": 14,
3107
  "currency": "USD",
3108
  "capabilities": [
 
3109
  "reasoning"
3110
  ],
3111
+ "context_window": 200000
3112
  },
3113
  {
3114
+ "name": "azure/openai-responses/gpt-5.2-codex",
3115
  "type": "vision",
3116
  "input_price_per_1m": 1.75,
3117
  "output_price_per_1m": 14,
 
3123
  "context_window": 400000
3124
  },
3125
  {
3126
+ "name": "azure/gpt-5.3-codex",
3127
  "type": "vision",
3128
  "input_price_per_1m": 1.75,
3129
  "output_price_per_1m": 14,
 
3132
  "vision",
3133
  "reasoning"
3134
  ],
3135
+ "context_window": 400000
3136
  },
3137
  {
3138
+ "name": "openai-responses/gpt-5.3-codex",
3139
  "type": "vision",
3140
  "input_price_per_1m": 1.75,
3141
  "output_price_per_1m": 14,
 
3147
  "context_window": 400000
3148
  },
3149
  {
3150
+ "name": "openai-responses/gpt-5.3-chat",
3151
  "type": "vision",
3152
  "input_price_per_1m": 1.75,
3153
  "output_price_per_1m": 14,
 
3156
  "vision",
3157
  "reasoning"
3158
  ],
3159
+ "context_window": 128000
3160
  },
3161
  {
3162
+ "name": "openai-responses/gpt-5.2-codex",
3163
  "type": "vision",
3164
  "input_price_per_1m": 1.75,
3165
  "output_price_per_1m": 14,
 
3171
  "context_window": 400000
3172
  },
3173
  {
3174
+ "name": "openai-responses/gpt-5.2",
3175
  "type": "vision",
3176
  "input_price_per_1m": 1.75,
3177
  "output_price_per_1m": 14,
3178
  "currency": "USD",
3179
  "capabilities": [
3180
+ "vision",
3181
  "reasoning"
3182
  ],
3183
+ "context_window": 400000
3184
  },
3185
  {
3186
+ "name": "openai/o4-mini-deep-research",
3187
  "type": "vision",
3188
  "input_price_per_1m": 2,
3189
  "output_price_per_1m": 8,
3190
  "currency": "USD",
 
 
 
 
 
 
 
 
 
 
 
 
3191
  "capabilities": [
3192
  "vision",
3193
  "reasoning"
3194
  ],
3195
+ "context_window": 100000
3196
  },
3197
  {
3198
+ "name": "openai/gpt-4.1",
3199
  "type": "vision",
3200
  "input_price_per_1m": 2,
3201
+ "output_price_per_1m": 8,
3202
  "currency": "USD",
3203
  "capabilities": [
3204
+ "vision"
 
3205
  ],
3206
+ "context_window": 1047576
3207
  },
3208
  {
3209
+ "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3210
+ "type": "chat",
3211
  "input_price_per_1m": 2,
3212
+ "output_price_per_1m": 6,
3213
  "currency": "USD",
3214
+ "context_window": 128000
 
 
 
 
3215
  },
3216
  {
3217
+ "name": "google/gemini-3.1-pro-preview",
3218
  "type": "vision",
3219
  "input_price_per_1m": 2,
3220
+ "output_price_per_1m": 12,
3221
  "currency": "USD",
3222
  "capabilities": [
3223
+ "vision",
3224
+ "reasoning"
3225
  ],
3226
+ "context_window": 1048576
3227
  },
3228
  {
3229
+ "name": "google/gemini-3-pro-preview",
3230
  "type": "vision",
3231
  "input_price_per_1m": 2,
3232
+ "output_price_per_1m": 12,
3233
  "currency": "USD",
3234
  "capabilities": [
3235
  "vision",
3236
  "reasoning"
3237
  ],
3238
+ "context_window": 1048576
3239
  },
3240
  {
3241
  "name": "mistral/pixtral-large-latest",
 
3246
  "context_window": 131072
3247
  },
3248
  {
3249
+ "name": "perplexity/sonar-reasoning-pro",
3250
  "type": "vision",
3251
  "input_price_per_1m": 2,
3252
  "output_price_per_1m": 8,
3253
  "currency": "USD",
3254
+ "context_window": 131072,
3255
  "capabilities": [
3256
+ "vision",
3257
+ "reasoning"
3258
+ ]
 
 
 
 
 
 
 
 
3259
  },
3260
  {
3261
+ "name": "vertex/gemini-3.1-pro-preview",
3262
  "type": "vision",
3263
  "input_price_per_1m": 2,
3264
+ "output_price_per_1m": 12,
3265
  "currency": "USD",
3266
  "capabilities": [
3267
  "vision",
3268
  "reasoning"
3269
  ],
3270
+ "context_window": 1048576
3271
  },
3272
  {
3273
+ "name": "vertex/gemini-3-pro-preview",
3274
  "type": "vision",
3275
  "input_price_per_1m": 2,
3276
  "output_price_per_1m": 12,
 
3282
  "context_window": 1048576
3283
  },
3284
  {
3285
+ "name": "vertex/gemini-3-pro-image-preview",
3286
  "type": "vision",
3287
  "input_price_per_1m": 2,
3288
  "output_price_per_1m": 12,
 
3316
  "context_window": 1047576
3317
  },
3318
  {
3319
+ "name": "xai/grok-2-1212",
3320
  "type": "chat",
3321
  "input_price_per_1m": 2,
3322
+ "output_price_per_1m": 10,
3323
+ "currency": "USD",
3324
+ "context_window": 131072
3325
+ },
3326
+ {
3327
+ "name": "xai/grok-4.2-beta",
3328
+ "type": "vision",
3329
+ "input_price_per_1m": 2,
3330
  "output_price_per_1m": 6,
3331
  "currency": "USD",
3332
+ "capabilities": [
3333
+ "vision",
3334
+ "reasoning"
3335
+ ],
3336
+ "context_window": 2000000
3337
  },
3338
  {
3339
+ "name": "openai-responses/gpt-4.1",
3340
  "type": "vision",
3341
+ "input_price_per_1m": 2,
3342
+ "output_price_per_1m": 8,
3343
  "currency": "USD",
3344
  "capabilities": [
3345
  "vision"
3346
  ],
3347
+ "context_window": 1047576
3348
  },
3349
  {
3350
+ "name": "openai/gpt-4o",
3351
  "type": "vision",
3352
  "input_price_per_1m": 2.5,
3353
  "output_price_per_1m": 10,
 
3358
  "context_window": 128000
3359
  },
3360
  {
3361
+ "name": "openai/gpt-4o-2024-08-06",
3362
  "type": "vision",
3363
  "input_price_per_1m": 2.5,
3364
  "output_price_per_1m": 10,
 
3369
  "context_window": 128000
3370
  },
3371
  {
3372
+ "name": "openai/gpt-4o-2024-05-13",
3373
  "type": "vision",
3374
  "input_price_per_1m": 2.5,
3375
+ "output_price_per_1m": 10,
3376
  "currency": "USD",
3377
  "capabilities": [
3378
+ "vision"
 
3379
  ],
3380
+ "context_window": 128000
3381
  },
3382
  {
3383
+ "name": "openai/gpt-4o-2024-11-20",
3384
  "type": "vision",
3385
  "input_price_per_1m": 2.5,
3386
  "output_price_per_1m": 10,
 
3391
  "context_window": 128000
3392
  },
3393
  {
3394
+ "name": "openai/gpt-5.4",
3395
  "type": "vision",
3396
  "input_price_per_1m": 2.5,
3397
  "output_price_per_1m": 15,
 
3415
  "context_window": 1050000
3416
  },
3417
  {
3418
+ "name": "openai-responses/gpt-5.4",
3419
  "type": "vision",
3420
+ "input_price_per_1m": 2.5,
3421
  "output_price_per_1m": 15,
3422
  "currency": "USD",
 
3423
  "capabilities": [
3424
+ "vision",
3425
+ "reasoning"
3426
+ ],
3427
+ "context_window": 1050000
3428
  },
3429
  {
3430
+ "name": "anthropic/claude-sonnet-4-6",
3431
  "type": "vision",
3432
  "input_price_per_1m": 3,
3433
  "output_price_per_1m": 15,
 
3436
  "vision",
3437
  "reasoning"
3438
  ],
3439
+ "context_window": 1000000
3440
  },
3441
  {
3442
+ "name": "anthropic/claude-sonnet-4-5",
3443
  "type": "vision",
3444
  "input_price_per_1m": 3,
3445
  "output_price_per_1m": 15,
 
3451
  "context_window": 1000000
3452
  },
3453
  {
3454
+ "name": "anthropic/claude-sonnet-4",
3455
  "type": "vision",
3456
  "input_price_per_1m": 3,
3457
  "output_price_per_1m": 15,
 
3460
  "vision",
3461
  "reasoning"
3462
  ],
3463
+ "context_window": 1000000
3464
  },
3465
  {
3466
+ "name": "bedrock/claude-sonnet-4-6",
3467
  "type": "vision",
3468
  "input_price_per_1m": 3,
3469
  "output_price_per_1m": 15,
 
3472
  "vision",
3473
  "reasoning"
3474
  ],
3475
+ "context_window": 1000000
3476
  },
3477
  {
3478
+ "name": "bedrock/claude-sonnet-4-5",
3479
  "type": "vision",
3480
  "input_price_per_1m": 3,
3481
  "output_price_per_1m": 15,
 
3487
  "context_window": 200000
3488
  },
3489
  {
3490
+ "name": "bedrock/claude-3-7-sonnet",
3491
  "type": "vision",
3492
  "input_price_per_1m": 3,
3493
  "output_price_per_1m": 15,
 
3499
  "context_window": 200000
3500
  },
3501
  {
3502
+ "name": "bedrock/claude-sonnet-4",
3503
  "type": "vision",
3504
  "input_price_per_1m": 3,
3505
  "output_price_per_1m": 15,
 
3511
  "context_window": 200000
3512
  },
3513
  {
3514
+ "name": "perplexity/sonar-pro",
3515
  "type": "vision",
3516
  "input_price_per_1m": 3,
3517
  "output_price_per_1m": 15,
3518
  "currency": "USD",
3519
+ "context_window": 204800,
3520
  "capabilities": [
3521
  "vision"
3522
+ ]
 
3523
  },
3524
  {
3525
+ "name": "vertex/claude-3-5-sonnet",
3526
  "type": "vision",
3527
  "input_price_per_1m": 3,
3528
  "output_price_per_1m": 15,
3529
  "currency": "USD",
3530
  "capabilities": [
3531
+ "vision"
 
3532
  ],
3533
  "context_window": 200000
3534
  },
3535
  {
3536
+ "name": "vertex/claude-3-7-sonnet",
3537
  "type": "vision",
3538
  "input_price_per_1m": 3,
3539
  "output_price_per_1m": 15,
 
3542
  "vision",
3543
  "reasoning"
3544
  ],
3545
+ "context_window": 200000
3546
  },
3547
  {
3548
+ "name": "vertex/claude-sonnet-4-5",
3549
  "type": "vision",
3550
  "input_price_per_1m": 3,
3551
  "output_price_per_1m": 15,
 
3554
  "vision",
3555
  "reasoning"
3556
  ],
3557
+ "context_window": 200000
3558
  },
3559
  {
3560
+ "name": "vertex/claude-sonnet-4",
3561
  "type": "vision",
3562
  "input_price_per_1m": 3,
3563
  "output_price_per_1m": 15,
 
3566
  "vision",
3567
  "reasoning"
3568
  ],
3569
+ "context_window": 200000
3570
  },
3571
  {
3572
  "name": "xai/grok-4",
 
3590
  "tools",
3591
  "reasoning"
3592
  ],
3593
+ "hf_id": "deepseek-ai/DeepSeek-R1",
3594
+ "size_b": 684.5
3595
+ },
3596
+ {
3597
+ "name": "coding/claude-sonnet-4-20250514",
3598
+ "type": "vision",
3599
+ "input_price_per_1m": 3,
3600
+ "output_price_per_1m": 15,
3601
+ "currency": "USD",
3602
+ "capabilities": [
3603
+ "vision",
3604
+ "reasoning"
3605
+ ],
3606
+ "context_window": 200000
3607
  },
3608
  {
3609
  "name": "novita/deepseek/deepseek-r1",
 
3616
  "tools",
3617
  "reasoning"
3618
  ],
3619
+ "hf_id": "deepseek-ai/DeepSeek-R1",
3620
+ "size_b": 684.5
3621
  },
3622
  {
3623
+ "name": "anthropic/claude-opus-4-5",
3624
  "type": "vision",
3625
  "input_price_per_1m": 5,
3626
  "output_price_per_1m": 25,
 
3632
  "context_window": 200000
3633
  },
3634
  {
3635
+ "name": "anthropic/claude-opus-4-6",
3636
  "type": "vision",
3637
  "input_price_per_1m": 5,
3638
  "output_price_per_1m": 25,
 
3644
  "context_window": 1000000
3645
  },
3646
  {
3647
+ "name": "openai/chatgpt-4o",
3648
  "type": "vision",
3649
  "input_price_per_1m": 5,
3650
+ "output_price_per_1m": 15,
3651
  "currency": "USD",
3652
  "capabilities": [
3653
+ "vision"
 
3654
  ],
3655
+ "context_window": 128000
3656
  },
3657
  {
3658
+ "name": "bedrock/claude-opus-4-5",
3659
  "type": "vision",
3660
  "input_price_per_1m": 5,
3661
  "output_price_per_1m": 25,
 
3667
  "context_window": 200000
3668
  },
3669
  {
3670
+ "name": "bedrock/claude-opus-4-6",
3671
  "type": "vision",
3672
  "input_price_per_1m": 5,
3673
+ "output_price_per_1m": 25,
3674
  "currency": "USD",
3675
  "capabilities": [
3676
+ "vision",
3677
+ "reasoning"
3678
  ],
3679
+ "context_window": 1000000
3680
  },
3681
  {
3682
+ "name": "vertex/claude-opus-4-6",
3683
  "type": "vision",
3684
  "input_price_per_1m": 5,
3685
  "output_price_per_1m": 25,
 
3691
  "context_window": 1000000
3692
  },
3693
  {
3694
+ "name": "vertex/claude-opus-4-5",
3695
  "type": "vision",
3696
  "input_price_per_1m": 5,
3697
  "output_price_per_1m": 25,
 
3726
  "context_window": 100000
3727
  },
3728
  {
3729
+ "name": "anthropic/claude-opus-4-1",
3730
  "type": "vision",
3731
  "input_price_per_1m": 15,
3732
  "output_price_per_1m": 75,
 
3738
  "context_window": 200000
3739
  },
3740
  {
3741
+ "name": "anthropic/claude-opus-4",
3742
  "type": "vision",
3743
  "input_price_per_1m": 15,
3744
  "output_price_per_1m": 75,
 
3750
  "context_window": 200000
3751
  },
3752
  {
3753
+ "name": "openai/o1",
3754
  "type": "vision",
3755
  "input_price_per_1m": 15,
3756
+ "output_price_per_1m": 60,
3757
  "currency": "USD",
3758
  "capabilities": [
3759
  "vision",
 
3762
  "context_window": 200000
3763
  },
3764
  {
3765
+ "name": "bedrock/claude-opus-4",
3766
  "type": "vision",
3767
  "input_price_per_1m": 15,
3768
+ "output_price_per_1m": 75,
3769
  "currency": "USD",
3770
  "capabilities": [
3771
  "vision",
 
3774
  "context_window": 200000
3775
  },
3776
  {
3777
+ "name": "vertex/claude-opus-4-1",
3778
  "type": "vision",
3779
  "input_price_per_1m": 15,
3780
  "output_price_per_1m": 75,
 
3786
  "context_window": 200000
3787
  },
3788
  {
3789
+ "name": "vertex/claude-opus-4",
3790
  "type": "vision",
3791
  "input_price_per_1m": 15,
3792
  "output_price_per_1m": 75,
 
3798
  "context_window": 200000
3799
  },
3800
  {
3801
+ "name": "openai-responses/gpt-5-pro",
3802
  "type": "vision",
3803
  "input_price_per_1m": 15,
3804
+ "output_price_per_1m": 120,
3805
  "currency": "USD",
3806
  "capabilities": [
3807
  "vision",
3808
  "reasoning"
3809
  ],
3810
+ "context_window": 400000
3811
  },
3812
  {
3813
+ "name": "coding/claude-opus-4-20250514",
3814
  "type": "vision",
3815
  "input_price_per_1m": 15,
3816
+ "output_price_per_1m": 75,
3817
  "currency": "USD",
3818
  "capabilities": [
3819
  "vision",
3820
  "reasoning"
3821
  ],
3822
+ "context_window": 200000
3823
  },
3824
  {
3825
  "name": "openai-responses/o3-pro",
 
3846
  "context_window": 1050000
3847
  },
3848
  {
3849
+ "name": "azure/openai-responses/gpt-5.4-pro",
3850
  "type": "vision",
3851
  "input_price_per_1m": 30,
3852
  "output_price_per_1m": 180,
 
3858
  "context_window": 1050000
3859
  },
3860
  {
3861
+ "name": "openai-responses/gpt-5.4-pro",
3862
  "type": "vision",
3863
  "input_price_per_1m": 30,
3864
  "output_price_per_1m": 180,
 
3930
  "capabilities": [
3931
  "tools"
3932
  ],
3933
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
3934
+ "size_b": 1026.5
3935
  },
3936
  {
3937
  "name": "Qwen3-Coder-480B-A35B-Instruct (base)",
 
4127
  "tools",
4128
  "reasoning"
4129
  ],
4130
+ "hf_id": "zai-org/GLM-4.5",
4131
+ "size_b": 358.3
4132
  },
4133
  {
4134
  "name": "GLM-4.5-Air (base)",
 
4155
  "tools",
4156
  "reasoning"
4157
  ],
4158
+ "hf_id": "deepseek-ai/DeepSeek-R1-0528",
4159
+ "size_b": 684.5
4160
  },
4161
  {
4162
  "name": "DeepSeek-R1-0528 (base)",
 
4169
  "tools",
4170
  "reasoning"
4171
  ],
4172
+ "hf_id": "deepseek-ai/DeepSeek-R1-0528",
4173
+ "size_b": 684.5
4174
  },
4175
  {
4176
  "name": "DeepSeek-V3-0324 (fast)",
 
4529
  "type": "audio",
4530
  "input_price_per_1m": 0.003,
4531
  "output_price_per_1m": 0,
4532
+ "currency": "EUR",
4533
+ "hf_id": "openai/whisper-large-v3"
4534
  },
4535
  {
4536
  "name": "holo2-30b-a3b",
 
4988
  "input_price_per_1m": 0.017,
4989
  "output_price_per_1m": 0.11,
4990
  "currency": "USD",
4991
+ "hf_id": "ibm-granite/granite-4.0-h-micro",
4992
+ "size_b": 3.2
4993
  },
4994
  {
4995
  "name": "google/gemma-3n-e4b-it",
 
5316
  "capabilities": [
5317
  "tools",
5318
  "reasoning"
5319
+ ],
5320
+ "size_b": 31.2
5321
  },
5322
  {
5323
  "name": "qwen/qwen3-14b",
 
5567
  "capabilities": [
5568
  "tools",
5569
  "reasoning"
5570
+ ],
5571
+ "size_b": 309.8
5572
  },
5573
  {
5574
  "name": "alibaba/tongyi-deepresearch-30b-a3b",
 
5658
  "capabilities": [
5659
  "tools",
5660
  "reasoning"
5661
+ ],
5662
+ "size_b": 199.4
5663
  },
5664
  {
5665
  "name": "mistralai/mistral-small-creative",
 
5883
  "hf_id": "Qwen/Qwen3-Coder-Next",
5884
  "capabilities": [
5885
  "tools"
5886
+ ],
5887
+ "size_b": 79.7
5888
  },
5889
  {
5890
  "name": "allenai/olmo-3-7b-think",
 
6272
  "capabilities": [
6273
  "tools",
6274
  "reasoning"
6275
+ ],
6276
+ "size_b": 228.7
6277
  },
6278
  {
6279
  "name": "allenai/molmo-2-8b",
 
6386
  "hf_id": "meituan-longcat/LongCat-Flash-Chat",
6387
  "capabilities": [
6388
  "tools"
6389
+ ],
6390
+ "size_b": 561.9
6391
  },
6392
  {
6393
  "name": "x-ai/grok-code-fast-1",
 
6629
  "tools",
6630
  "reasoning",
6631
  "eu-endpoint"
6632
+ ],
6633
+ "size_b": 228.7
6634
  },
6635
  {
6636
  "name": "qwen/qwen3.5-122b-a10b",
 
6671
  "tools",
6672
  "reasoning",
6673
  "eu-endpoint"
6674
+ ],
6675
+ "size_b": 685.4
6676
  },
6677
  {
6678
  "name": "qwen/qwen3-vl-235b-a22b-thinking",
 
6729
  "capabilities": [
6730
  "tools",
6731
  "reasoning"
6732
+ ],
6733
+ "size_b": 228.7
6734
  },
6735
  {
6736
  "name": "nex-agi/deepseek-v3.1-nex-n1",
 
6741
  "hf_id": "nex-agi/DeepSeek-V3.1-Nex-N1",
6742
  "capabilities": [
6743
  "tools"
6744
+ ],
6745
+ "size_b": 671.1
6746
  },
6747
  {
6748
  "name": "deepseek/deepseek-v3.2-exp",
 
6940
  "tools",
6941
  "reasoning",
6942
  "eu-endpoint"
6943
+ ],
6944
+ "size_b": 358.3
6945
  },
6946
  {
6947
  "name": "z-ai/glm-4.6",
 
6953
  "capabilities": [
6954
  "tools",
6955
  "reasoning"
6956
+ ],
6957
+ "size_b": 356.8
6958
  },
6959
  {
6960
  "name": "xiaomi/mimo-v2-omni",
 
7002
  "hf_id": "moonshotai/Kimi-K2-Instruct-0905",
7003
  "capabilities": [
7004
  "tools"
7005
+ ],
7006
+ "size_b": 1026.5
7007
  },
7008
  {
7009
  "name": "mistralai/mistral-medium-3.1",
 
7122
  "capabilities": [
7123
  "tools",
7124
  "reasoning"
7125
+ ],
7126
+ "size_b": 684.5
7127
  },
7128
  {
7129
  "name": "undi95/remm-slerp-l2-13b",
 
7158
  "tools",
7159
  "reasoning",
7160
  "eu-endpoint"
7161
+ ],
7162
+ "size_b": 1058.1
7163
  },
7164
  {
7165
  "name": "google/gemini-3.1-flash-image-preview",
 
7315
  "capabilities": [
7316
  "tools",
7317
  "reasoning"
7318
+ ],
7319
+ "size_b": 358.3
7320
  },
7321
  {
7322
  "name": "nvidia/llama-3.1-nemotron-ultra-253b-v1",
 
7410
  "tools",
7411
  "reasoning",
7412
  "eu-endpoint"
7413
+ ],
7414
+ "size_b": 684.5
7415
  },
7416
  {
7417
  "name": "z-ai/glm-5",
 
7423
  "capabilities": [
7424
  "tools",
7425
  "reasoning"
7426
+ ],
7427
+ "size_b": 753.9
7428
  },
7429
  {
7430
  "name": "openai/gpt-5.4-mini",
 
8790
  "capabilities": [
8791
  "tools",
8792
  "reasoning"
8793
+ ],
8794
+ "size_b": 199.4
8795
  },
8796
  {
8797
  "name": "arcee-ai/trinity-large-preview:free",
 
9092
  "capabilities": [
9093
  "tools"
9094
  ],
9095
+ "hf_id": "moonshotai/Kimi-K2-Instruct-0905",
9096
+ "size_b": 1026.5
9097
  },
9098
  {
9099
  "name": "Llama 4 Scout (17Bx16E) 128k",
scripts/fetch-providers.js CHANGED
@@ -52,7 +52,26 @@ function updateProviderModels(providers, providerName, models) {
52
  console.warn(` ⚠ Provider "${providerName}" not found in providers.json – skipping.`);
53
  return false;
54
  }
55
- provider.models = models;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
56
  return true;
57
  }
58
 
@@ -142,7 +161,7 @@ async function fetchHFSize(hfId) {
142
  const token = process.env.HF_TOKEN;
143
  const headers = token ? { Authorization: `Bearer ${token}` } : {};
144
  try {
145
- const data = await getJson(`https://huggingface.co/api/models/${hfId}`, { headers });
146
  // Check various common metadata locations for total parameters
147
  let params = data.safetensors?.total || data.config?.total_parameters || data.config?.model_type_params;
148
  if (!params && data.cardData?.model_details?.parameters) {
@@ -164,7 +183,13 @@ const EMBEDDER_KEYWORDS = ['embed', 'bge', 'gte', 'e5', 'stella', 'minilm', 'mul
164
  const MANUAL_HF_ID_MAP = {
165
  'all minilm l12 v2': 'sentence-transformers/all-MiniLM-L12-v2',
166
  'whisper v3': 'openai/whisper-large-v3',
167
- 'whisper-large-v3': 'openai/whisper-large-v3',
 
 
 
 
 
 
168
  };
169
 
170
  // Propagate capabilities and size from benchmarks, OpenRouter, or HF Hub to all other providers' models.
@@ -210,13 +235,16 @@ async function propagateExtraData(data) {
210
 
211
  // 1. STRUCTURED LOOKUP: Match size by hf_id if available (Benchmark gold-standard)
212
  if (!model.size_b && model.hf_id) {
213
- const size = hfIdToSize.get(model.hf_id.toLowerCase());
214
- if (size) {
215
- model.size_b = size;
216
  propagatedSize++;
 
 
 
217
  }
218
  }
219
 
 
220
  // 2. AUTO-TAG image-gen and embedding models
221
  if (model.type === 'image' && (!model.capabilities || !model.capabilities.length)) {
222
  model.capabilities = ['image-gen'];
@@ -271,27 +299,40 @@ async function propagateExtraData(data) {
271
  }
272
  }
273
 
274
- // 7. HUB API: Inspect technical metadata (Limit 30 unique IDs to avoid long startup)
275
- const uniqueIds = [...new Set(hfLookupQueue.map(m => m.hf_id || m.name).filter(id => id.includes('/')))].slice(0, 30);
276
  if (uniqueIds.length > 0) {
277
- process.stdout.write(` HF Hub: technical metadata inspection for ${uniqueIds.length} models... `);
278
  const idToSize = new Map();
279
- await Promise.all(uniqueIds.map(async (id) => {
 
 
 
 
280
  const size = await fetchHFSize(id);
281
- if (size) idToSize.set(id, size);
282
- }));
 
 
 
 
 
 
 
283
  for (const model of hfLookupQueue) {
284
  if (!model.size_b) {
285
- const size = idToSize.get(model.hf_id || model.name);
 
286
  if (size) {
287
  model.size_b = size;
288
  hfSizeFetched++;
289
  }
290
  }
291
  }
292
- console.log(`βœ“ ${hfSizeFetched} sizes found`);
293
  }
294
 
 
295
  if (autoTagged > 0) console.log(`Auto-tagged ${autoTagged} image-gen/embedding models.`);
296
  if (propagatedCaps > 0) console.log(`Propagated capabilities to ${propagatedCaps} models.`);
297
  if (propagatedSize + hfSizeFetched > 0) console.log(`Enriched size data for ${propagatedSize + hfSizeFetched} models.`);
 
52
  console.warn(` ⚠ Provider "${providerName}" not found in providers.json – skipping.`);
53
  return false;
54
  }
55
+
56
+ // Smart merge: preserve existing metadata (size_b, hf_id, capabilities) if missing in new data
57
+ const existingMap = new Map((provider.models || []).map(m => [m.name, m]));
58
+
59
+ provider.models = models.map(newModel => {
60
+ const existing = existingMap.get(newModel.name);
61
+ if (!existing) return newModel;
62
+
63
+ return {
64
+ ...existing, // Start with existing metadata
65
+ ...newModel, // Overwrite with new prices/type
66
+ // But preserve these if newModel doesn't have them
67
+ size_b: newModel.size_b || existing.size_b,
68
+ hf_id: newModel.hf_id || existing.hf_id,
69
+ capabilities: (newModel.capabilities && newModel.capabilities.length > 0)
70
+ ? newModel.capabilities
71
+ : existing.capabilities,
72
+ };
73
+ });
74
+
75
  return true;
76
  }
77
 
 
161
  const token = process.env.HF_TOKEN;
162
  const headers = token ? { Authorization: `Bearer ${token}` } : {};
163
  try {
164
+ const data = await getJson(`https://huggingface.co/api/models/${hfId}`, { headers, retries: 1 });
165
  // Check various common metadata locations for total parameters
166
  let params = data.safetensors?.total || data.config?.total_parameters || data.config?.model_type_params;
167
  if (!params && data.cardData?.model_details?.parameters) {
 
183
  const MANUAL_HF_ID_MAP = {
184
  'all minilm l12 v2': 'sentence-transformers/all-MiniLM-L12-v2',
185
  'whisper v3': 'openai/whisper-large-v3',
186
+ 'whisper large v3': 'openai/whisper-large-v3',
187
+ 'step 3 5 flash': 'stepfun-ai/Step-3.5-Flash',
188
+ 'bge m3': 'BAAI/bge-m3',
189
+ };
190
+
191
+ const MANUAL_SIZE_MAP = {
192
+ 'BAAI/bge-m3': 0.57,
193
  };
194
 
195
  // Propagate capabilities and size from benchmarks, OpenRouter, or HF Hub to all other providers' models.
 
235
 
236
  // 1. STRUCTURED LOOKUP: Match size by hf_id if available (Benchmark gold-standard)
237
  if (!model.size_b && model.hf_id) {
238
+ if (MANUAL_SIZE_MAP[model.hf_id]) {
239
+ model.size_b = MANUAL_SIZE_MAP[model.hf_id];
 
240
  propagatedSize++;
241
+ } else {
242
+ const size = hfIdToSize.get(model.hf_id.toLowerCase());
243
+ if (size) { model.size_b = size; propagatedSize++; }
244
  }
245
  }
246
 
247
+
248
  // 2. AUTO-TAG image-gen and embedding models
249
  if (model.type === 'image' && (!model.capabilities || !model.capabilities.length)) {
250
  model.capabilities = ['image-gen'];
 
299
  }
300
  }
301
 
302
+ // 7. HUB API: Inspect technical metadata (Limit 200 unique IDs to ensure better coverage)
303
+ const uniqueIds = [...new Set(hfLookupQueue.map(m => m.hf_id || m.name).filter(id => id.includes('/')))].slice(0, 200);
304
  if (uniqueIds.length > 0) {
305
+ console.log(`\n HF Hub: technical metadata inspection for ${uniqueIds.length} models...`);
306
  const idToSize = new Map();
307
+
308
+ // Process sequentially with small delay to avoid 429 rate limits
309
+ for (let i = 0; i < uniqueIds.length; i++) {
310
+ const id = uniqueIds[i];
311
+ process.stdout.write(` [${i + 1}/${uniqueIds.length}] ${id.padEnd(50)} `);
312
  const size = await fetchHFSize(id);
313
+ if (size) {
314
+ idToSize.set(id, size);
315
+ process.stdout.write(`βœ“ ${size}B\n`);
316
+ } else {
317
+ process.stdout.write(`βœ—\n`);
318
+ }
319
+ await new Promise(r => setTimeout(r, 50)); // Tiny delay
320
+ }
321
+
322
  for (const model of hfLookupQueue) {
323
  if (!model.size_b) {
324
+ const id = model.hf_id || model.name;
325
+ const size = idToSize.get(id);
326
  if (size) {
327
  model.size_b = size;
328
  hfSizeFetched++;
329
  }
330
  }
331
  }
332
+ console.log(` βœ“ Total ${hfSizeFetched} new sizes from HF metadata`);
333
  }
334
 
335
+
336
  if (autoTagged > 0) console.log(`Auto-tagged ${autoTagged} image-gen/embedding models.`);
337
  if (propagatedCaps > 0) console.log(`Propagated capabilities to ${propagatedCaps} models.`);
338
  if (propagatedSize + hfSizeFetched > 0) console.log(`Enriched size data for ${propagatedSize + hfSizeFetched} models.`);