kristaller486 committed on
Commit
c934e25
·
verified ·
1 Parent(s): 0aadcf7

add kimi-k2.5

Browse files
Files changed (1) hide show
  1. index.html +96 -24
index.html CHANGED
@@ -1138,8 +1138,44 @@
1138
  <td class="num mono" data-label="Всего токенов">99,705</td>
1139
  </tr>
1140
 
1141
- <tr data-model="openai/t-tech/T-pro-it-2.0">
1142
  <td class="rank mono sticky-0" data-label="#">#30</td>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1143
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
1144
  <td class="num mono" data-label="Критичные/1000">
1145
 
@@ -1175,7 +1211,7 @@
1175
  </tr>
1176
 
1177
  <tr data-model="openrouter/openrouter/polaris-alpha">
1178
- <td class="rank mono sticky-0" data-label="#">#31</td>
1179
  <td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
1180
  <td class="num mono" data-label="Критичные/1000">
1181
 
@@ -1211,7 +1247,7 @@
1211
  </tr>
1212
 
1213
  <tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
1214
- <td class="rank mono sticky-0" data-label="#">#32</td>
1215
  <td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
1216
  <td class="num mono" data-label="Критичные/1000">
1217
 
@@ -1247,7 +1283,7 @@
1247
  </tr>
1248
 
1249
  <tr data-model="openrouter/z-ai/glm-4.7-flash">
1250
- <td class="rank mono sticky-0" data-label="#">#33</td>
1251
  <td class="model-name sticky-1" data-label="Модель">zai-org/GLM-4.7-Flash (z.ai API, reasoning, temp=0.6)</td>
1252
  <td class="num mono" data-label="Критичные/1000">
1253
 
@@ -1283,7 +1319,7 @@
1283
  </tr>
1284
 
1285
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
1286
- <td class="rank mono sticky-0" data-label="#">#34</td>
1287
  <td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
1288
  <td class="num mono" data-label="Критичные/1000">
1289
 
@@ -1319,7 +1355,7 @@
1319
  </tr>
1320
 
1321
  <tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
1322
- <td class="rank mono sticky-0" data-label="#">#35</td>
1323
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
1324
  <td class="num mono" data-label="Критичные/1000">
1325
 
@@ -1354,8 +1390,44 @@
1354
  <td class="num mono" data-label="Всего токенов">165,307</td>
1355
  </tr>
1356
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1357
  <tr data-model="openrouter/moonshotai/kimi-k2-0905">
1358
- <td class="rank mono sticky-0" data-label="#">#36</td>
1359
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
1360
  <td class="num mono" data-label="Критичные/1000">
1361
 
@@ -1391,7 +1463,7 @@
1391
  </tr>
1392
 
1393
  <tr data-model="openrouter/z-ai/glm-4.6">
1394
- <td class="rank mono sticky-0" data-label="#">#37</td>
1395
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
1396
  <td class="num mono" data-label="Критичные/1000">
1397
 
@@ -1427,7 +1499,7 @@
1427
  </tr>
1428
 
1429
  <tr data-model="openrouter/openai/gpt-5">
1430
- <td class="rank mono sticky-0" data-label="#">#38</td>
1431
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
1432
  <td class="num mono" data-label="Критичные/1000">
1433
 
@@ -1463,7 +1535,7 @@
1463
  </tr>
1464
 
1465
  <tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
1466
- <td class="rank mono sticky-0" data-label="#">#39</td>
1467
  <td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
1468
  <td class="num mono" data-label="Критичные/1000">
1469
 
@@ -1499,7 +1571,7 @@
1499
  </tr>
1500
 
1501
  <tr data-model="openrouter/openai/gpt-5">
1502
- <td class="rank mono sticky-0" data-label="#">#40</td>
1503
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
1504
  <td class="num mono" data-label="Критичные/1000">
1505
 
@@ -1535,7 +1607,7 @@
1535
  </tr>
1536
 
1537
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
1538
- <td class="rank mono sticky-0" data-label="#">#41</td>
1539
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
1540
  <td class="num mono" data-label="Критичные/1000">
1541
 
@@ -1571,7 +1643,7 @@
1571
  </tr>
1572
 
1573
  <tr data-model="openrouter/openai/gpt-oss-120b">
1574
- <td class="rank mono sticky-0" data-label="#">#42</td>
1575
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
1576
  <td class="num mono" data-label="Критичные/1000">
1577
 
@@ -1607,7 +1679,7 @@
1607
  </tr>
1608
 
1609
  <tr data-model="openai/gpt-4.1">
1610
- <td class="rank mono sticky-0" data-label="#">#43</td>
1611
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
1612
  <td class="num mono" data-label="Критичные/1000">
1613
 
@@ -1643,7 +1715,7 @@
1643
  </tr>
1644
 
1645
  <tr data-model="openrouter/nvidia/nemotron-3-nano-30b-a3b:free">
1646
- <td class="rank mono sticky-0" data-label="#">#44</td>
1647
  <td class="model-name sticky-1" data-label="Модель">Nemotron-3-Nano-30B-A3B (NVIDIA API, non-reasoning)</td>
1648
  <td class="num mono" data-label="Критичные/1000">
1649
 
@@ -1679,7 +1751,7 @@
1679
  </tr>
1680
 
1681
  <tr data-model="mistral/ministral-3b-2512">
1682
- <td class="rank mono sticky-0" data-label="#">#45</td>
1683
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-3B-Instruct-2512 (Mistral API)</td>
1684
  <td class="num mono" data-label="Критичные/1000">
1685
 
@@ -1715,7 +1787,7 @@
1715
  </tr>
1716
 
1717
  <tr data-model="openrouter/mistralai/mistral-nemo">
1718
- <td class="rank mono sticky-0" data-label="#">#46</td>
1719
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
1720
  <td class="num mono" data-label="Критичные/1000">
1721
 
@@ -1751,7 +1823,7 @@
1751
  </tr>
1752
 
1753
  <tr data-model="openai/gpt-4.1-mini">
1754
- <td class="rank mono sticky-0" data-label="#">#47</td>
1755
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
1756
  <td class="num mono" data-label="Критичные/1000">
1757
 
@@ -1787,7 +1859,7 @@
1787
  </tr>
1788
 
1789
  <tr data-model="openrouter/minimax/minimax-m2:free">
1790
- <td class="rank mono sticky-0" data-label="#">#48</td>
1791
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
1792
  <td class="num mono" data-label="Критичные/1000">
1793
 
@@ -1823,7 +1895,7 @@
1823
  </tr>
1824
 
1825
  <tr data-model="openrouter/minimax/minimax-m2:free">
1826
- <td class="rank mono sticky-0" data-label="#">#49</td>
1827
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
1828
  <td class="num mono" data-label="Критичные/1000">
1829
 
@@ -1859,7 +1931,7 @@
1859
  </tr>
1860
 
1861
  <tr data-model="openai/gpt-4.1-nano">
1862
- <td class="rank mono sticky-0" data-label="#">#50</td>
1863
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
1864
  <td class="num mono" data-label="Критичные/1000">
1865
 
@@ -1895,7 +1967,7 @@
1895
  </tr>
1896
 
1897
  <tr data-model="openai/ai-sage/GigaChat3-10B-A1.8B-bf16">
1898
- <td class="rank mono sticky-0" data-label="#">#51</td>
1899
  <td class="model-name sticky-1" data-label="Модель">ai-sage/GigaChat3-10B-A1.8B-bf16 (sglang)</td>
1900
  <td class="num mono" data-label="Критичные/1000">
1901
 
@@ -1931,7 +2003,7 @@
1931
  </tr>
1932
 
1933
  <tr data-model="openrouter/openai/gpt-oss-20b">
1934
- <td class="rank mono sticky-0" data-label="#">#52</td>
1935
  <td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
1936
  <td class="num mono" data-label="Критичные/1000">
1937
 
@@ -1989,7 +2061,7 @@
1989
  </div>
1990
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
1991
  <p class="info-text">
1992
- Обновлено: 2026-01-20 15:58:54 | Всего моделей: 52 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
1993
  </p>
1994
  </div>
1995
  <script>
 
1138
  <td class="num mono" data-label="Всего токенов">99,705</td>
1139
  </tr>
1140
 
1141
+ <tr data-model="openrouter/moonshotai/kimi-k2.5">
1142
  <td class="rank mono sticky-0" data-label="#">#30</td>
1143
+ <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (non-reasoning, Moonshot AI API)</td>
1144
+ <td class="num mono" data-label="Критичные/1000">
1145
+
1146
+ 0.22 ± 0.05
1147
+
1148
+ </td>
1149
+ <td class="num mono" data-label="Обычные/1000">
1150
+
1151
+ 0.71 ± 0.07
1152
+
1153
+ </td>
1154
+ <td class="num mono" data-label="Доп./1000">
1155
+
1156
+ 0.21 ± 0.03
1157
+
1158
+ </td>
1159
+ <td data-label="Нормировано ошибок">
1160
+ <div class="score-cell">
1161
+ <div class="progress-bar">
1162
+
1163
+
1164
+
1165
+ <div class="progress-fill" style="width: 68.5%"></div>
1166
+ </div>
1167
+ <span class="score-value">
1168
+
1169
+ 1.26 ± 0.11
1170
+
1171
+ </span>
1172
+ </div>
1173
+ </td>
1174
+ <td class="num mono" data-label="Всего токенов">142,514</td>
1175
+ </tr>
1176
+
1177
+ <tr data-model="openai/t-tech/T-pro-it-2.0">
1178
+ <td class="rank mono sticky-0" data-label="#">#31</td>
1179
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
1180
  <td class="num mono" data-label="Критичные/1000">
1181
 
 
1211
  </tr>
1212
 
1213
  <tr data-model="openrouter/openrouter/polaris-alpha">
1214
+ <td class="rank mono sticky-0" data-label="#">#32</td>
1215
  <td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
1216
  <td class="num mono" data-label="Критичные/1000">
1217
 
 
1247
  </tr>
1248
 
1249
  <tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
1250
+ <td class="rank mono sticky-0" data-label="#">#33</td>
1251
  <td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
1252
  <td class="num mono" data-label="Критичные/1000">
1253
 
 
1283
  </tr>
1284
 
1285
  <tr data-model="openrouter/z-ai/glm-4.7-flash">
1286
+ <td class="rank mono sticky-0" data-label="#">#34</td>
1287
  <td class="model-name sticky-1" data-label="Модель">zai-org/GLM-4.7-Flash (z.ai API, reasoning, temp=0.6)</td>
1288
  <td class="num mono" data-label="Критичные/1000">
1289
 
 
1319
  </tr>
1320
 
1321
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
1322
+ <td class="rank mono sticky-0" data-label="#">#35</td>
1323
  <td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
1324
  <td class="num mono" data-label="Критичные/1000">
1325
 
 
1355
  </tr>
1356
 
1357
  <tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
1358
+ <td class="rank mono sticky-0" data-label="#">#36</td>
1359
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
1360
  <td class="num mono" data-label="Критичные/1000">
1361
 
 
1390
  <td class="num mono" data-label="Всего токенов">165,307</td>
1391
  </tr>
1392
 
1393
+ <tr data-model="openrouter/moonshotai/kimi-k2.5">
1394
+ <td class="rank mono sticky-0" data-label="#">#37</td>
1395
+ <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (reasoning, temp=1, Moonshot AI API)</td>
1396
+ <td class="num mono" data-label="Критичные/1000">
1397
+
1398
+ 0.42 ± 0.05
1399
+
1400
+ </td>
1401
+ <td class="num mono" data-label="Обычные/1000">
1402
+
1403
+ 0.73 ± 0.04
1404
+
1405
+ </td>
1406
+ <td class="num mono" data-label="Доп./1000">
1407
+
1408
+ 0.21 ± 0.04
1409
+
1410
+ </td>
1411
+ <td data-label="Нормировано ошибок">
1412
+ <div class="score-cell">
1413
+ <div class="progress-bar">
1414
+
1415
+
1416
+
1417
+ <div class="progress-fill" style="width: 58.25%"></div>
1418
+ </div>
1419
+ <span class="score-value">
1420
+
1421
+ 1.67 ± 0.14
1422
+
1423
+ </span>
1424
+ </div>
1425
+ </td>
1426
+ <td class="num mono" data-label="Всего токенов">132,843</td>
1427
+ </tr>
1428
+
1429
  <tr data-model="openrouter/moonshotai/kimi-k2-0905">
1430
+ <td class="rank mono sticky-0" data-label="#">#38</td>
1431
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
1432
  <td class="num mono" data-label="Критичные/1000">
1433
 
 
1463
  </tr>
1464
 
1465
  <tr data-model="openrouter/z-ai/glm-4.6">
1466
+ <td class="rank mono sticky-0" data-label="#">#39</td>
1467
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
1468
  <td class="num mono" data-label="Критичные/1000">
1469
 
 
1499
  </tr>
1500
 
1501
  <tr data-model="openrouter/openai/gpt-5">
1502
+ <td class="rank mono sticky-0" data-label="#">#40</td>
1503
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
1504
  <td class="num mono" data-label="Критичные/1000">
1505
 
 
1535
  </tr>
1536
 
1537
  <tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
1538
+ <td class="rank mono sticky-0" data-label="#">#41</td>
1539
  <td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
1540
  <td class="num mono" data-label="Критичные/1000">
1541
 
 
1571
  </tr>
1572
 
1573
  <tr data-model="openrouter/openai/gpt-5">
1574
+ <td class="rank mono sticky-0" data-label="#">#42</td>
1575
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
1576
  <td class="num mono" data-label="Критичные/1000">
1577
 
 
1607
  </tr>
1608
 
1609
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
1610
+ <td class="rank mono sticky-0" data-label="#">#43</td>
1611
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
1612
  <td class="num mono" data-label="Критичные/1000">
1613
 
 
1643
  </tr>
1644
 
1645
  <tr data-model="openrouter/openai/gpt-oss-120b">
1646
+ <td class="rank mono sticky-0" data-label="#">#44</td>
1647
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
1648
  <td class="num mono" data-label="Критичные/1000">
1649
 
 
1679
  </tr>
1680
 
1681
  <tr data-model="openai/gpt-4.1">
1682
+ <td class="rank mono sticky-0" data-label="#">#45</td>
1683
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
1684
  <td class="num mono" data-label="Критичные/1000">
1685
 
 
1715
  </tr>
1716
 
1717
  <tr data-model="openrouter/nvidia/nemotron-3-nano-30b-a3b:free">
1718
+ <td class="rank mono sticky-0" data-label="#">#46</td>
1719
  <td class="model-name sticky-1" data-label="Модель">Nemotron-3-Nano-30B-A3B (NVIDIA API, non-reasoning)</td>
1720
  <td class="num mono" data-label="Критичные/1000">
1721
 
 
1751
  </tr>
1752
 
1753
  <tr data-model="mistral/ministral-3b-2512">
1754
+ <td class="rank mono sticky-0" data-label="#">#47</td>
1755
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-3B-Instruct-2512 (Mistral API)</td>
1756
  <td class="num mono" data-label="Критичные/1000">
1757
 
 
1787
  </tr>
1788
 
1789
  <tr data-model="openrouter/mistralai/mistral-nemo">
1790
+ <td class="rank mono sticky-0" data-label="#">#48</td>
1791
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
1792
  <td class="num mono" data-label="Критичные/1000">
1793
 
 
1823
  </tr>
1824
 
1825
  <tr data-model="openai/gpt-4.1-mini">
1826
+ <td class="rank mono sticky-0" data-label="#">#49</td>
1827
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
1828
  <td class="num mono" data-label="Критичные/1000">
1829
 
 
1859
  </tr>
1860
 
1861
  <tr data-model="openrouter/minimax/minimax-m2:free">
1862
+ <td class="rank mono sticky-0" data-label="#">#50</td>
1863
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
1864
  <td class="num mono" data-label="Критичные/1000">
1865
 
 
1895
  </tr>
1896
 
1897
  <tr data-model="openrouter/minimax/minimax-m2:free">
1898
+ <td class="rank mono sticky-0" data-label="#">#51</td>
1899
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
1900
  <td class="num mono" data-label="Критичные/1000">
1901
 
 
1931
  </tr>
1932
 
1933
  <tr data-model="openai/gpt-4.1-nano">
1934
+ <td class="rank mono sticky-0" data-label="#">#52</td>
1935
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
1936
  <td class="num mono" data-label="Критичные/1000">
1937
 
 
1967
  </tr>
1968
 
1969
  <tr data-model="openai/ai-sage/GigaChat3-10B-A1.8B-bf16">
1970
+ <td class="rank mono sticky-0" data-label="#">#53</td>
1971
  <td class="model-name sticky-1" data-label="Модель">ai-sage/GigaChat3-10B-A1.8B-bf16 (sglang)</td>
1972
  <td class="num mono" data-label="Критичные/1000">
1973
 
 
2003
  </tr>
2004
 
2005
  <tr data-model="openrouter/openai/gpt-oss-20b">
2006
+ <td class="rank mono sticky-0" data-label="#">#54</td>
2007
  <td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
2008
  <td class="num mono" data-label="Критичные/1000">
2009
 
 
2061
  </div>
2062
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
2063
  <p class="info-text">
2064
+ Обновлено: 2026-01-27 11:14:40 | Всего моделей: 54 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
2065
  </p>
2066
  </div>
2067
  <script>