kristaller486 committed on
Commit
fbf6ef6
·
verified ·
1 Parent(s): 32b05d5

add qwen3.5

Browse files
Files changed (1) hide show
  1. index.html +117 -45
index.html CHANGED
@@ -598,8 +598,44 @@
598
  <td class="num mono" data-label="Всего токенов">47,060</td>
599
  </tr>
600
 
601
- <tr data-model="deepseek/deepseek-chat">
602
  <td class="rank mono sticky-0" data-label="#">#15</td>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
603
  <td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-chat (Deepseek API)</td>
604
  <td class="num mono" data-label="Критичные/1000">
605
 
@@ -635,7 +671,7 @@
635
  </tr>
636
 
637
  <tr data-model="openrouter/anthropic/claude-haiku-4.5">
638
- <td class="rank mono sticky-0" data-label="#">#16</td>
639
  <td class="model-name sticky-1" data-label="Модель">Claude Haiku 4.5</td>
640
  <td class="num mono" data-label="Критичные/1000">
641
 
@@ -671,7 +707,7 @@
671
  </tr>
672
 
673
  <tr data-model="openai/t-tech/T-pro-it-2.1">
674
- <td class="rank mono sticky-0" data-label="#">#17</td>
675
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.1 (sglang)</td>
676
  <td class="num mono" data-label="Критичные/1000">
677
 
@@ -707,7 +743,7 @@
707
  </tr>
708
 
709
  <tr data-model="openai/Qwen/Qwen3-VL-32B-Instruct">
710
- <td class="rank mono sticky-0" data-label="#">#18</td>
711
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-32B-Instruct (SGLang)</td>
712
  <td class="num mono" data-label="Критичные/1000">
713
 
@@ -743,7 +779,7 @@
743
  </tr>
744
 
745
  <tr data-model="openai/AvitoTech/avibe">
746
- <td class="rank mono sticky-0" data-label="#">#19</td>
747
  <td class="model-name sticky-1" data-label="Модель">AvitoTech/avibe</td>
748
  <td class="num mono" data-label="Критичные/1000">
749
 
@@ -779,7 +815,7 @@
779
  </tr>
780
 
781
  <tr data-model="openrouter/openrouter/pony-alpha">
782
- <td class="rank mono sticky-0" data-label="#">#20</td>
783
  <td class="model-name sticky-1" data-label="Модель">Pony Alpha (temp=0.6)</td>
784
  <td class="num mono" data-label="Критичные/1000">
785
 
@@ -815,7 +851,7 @@
815
  </tr>
816
 
817
  <tr data-model="openai/ai-sage/GigaChat-20B-A3B-instruct-v1.5-bf16">
818
- <td class="rank mono sticky-0" data-label="#">#21</td>
819
  <td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
820
  <td class="num mono" data-label="Критичные/1000">
821
 
@@ -851,7 +887,7 @@
851
  </tr>
852
 
853
  <tr data-model="deepseek/deepseek-reasoner">
854
- <td class="rank mono sticky-0" data-label="#">#22</td>
855
  <td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-reasoner (Deepseek API)</td>
856
  <td class="num mono" data-label="Критичные/1000">
857
 
@@ -887,7 +923,7 @@
887
  </tr>
888
 
889
  <tr data-model="mistral/ministral-14b-2512">
890
- <td class="rank mono sticky-0" data-label="#">#23</td>
891
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-14B-Instruct-2512 (Mistral API)</td>
892
  <td class="num mono" data-label="Критичные/1000">
893
 
@@ -923,7 +959,7 @@
923
  </tr>
924
 
925
  <tr data-model="litellm_proxy/deepseek-v3">
926
- <td class="rank mono sticky-0" data-label="#">#24</td>
927
  <td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
928
  <td class="num mono" data-label="Критичные/1000">
929
 
@@ -959,7 +995,7 @@
959
  </tr>
960
 
961
  <tr data-model="litellm_proxy/tmp-gemma-3n-e4b-it">
962
- <td class="rank mono sticky-0" data-label="#">#25</td>
963
  <td class="model-name sticky-1" data-label="Модель">google/gemma-3n-E4B-it (AI Studio)</td>
964
  <td class="num mono" data-label="Критичные/1000">
965
 
@@ -995,7 +1031,7 @@
995
  </tr>
996
 
997
  <tr data-model="mistral/ministral-8b-2512">
998
- <td class="rank mono sticky-0" data-label="#">#26</td>
999
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-8B-Instruct-2512 (Mistral API)</td>
1000
  <td class="num mono" data-label="Критичные/1000">
1001
 
@@ -1031,7 +1067,7 @@
1031
  </tr>
1032
 
1033
  <tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
1034
- <td class="rank mono sticky-0" data-label="#">#27</td>
1035
  <td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
1036
  <td class="num mono" data-label="Критичные/1000">
1037
 
@@ -1067,7 +1103,7 @@
1067
  </tr>
1068
 
1069
  <tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
1070
- <td class="rank mono sticky-0" data-label="#">#28</td>
1071
  <td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
1072
  <td class="num mono" data-label="Критичные/1000">
1073
 
@@ -1103,7 +1139,7 @@
1103
  </tr>
1104
 
1105
  <tr data-model="openai/mimo-v2-flash">
1106
- <td class="rank mono sticky-0" data-label="#">#29</td>
1107
  <td class="model-name sticky-1" data-label="Модель">Xiaomi Mimo V2 Flash (Xiaomi API, non-reasoning)</td>
1108
  <td class="num mono" data-label="Критичные/1000">
1109
 
@@ -1139,7 +1175,7 @@
1139
  </tr>
1140
 
1141
  <tr data-model="openai/Qwen/Qwen3-32B">
1142
- <td class="rank mono sticky-0" data-label="#">#30</td>
1143
  <td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoning)</td>
1144
  <td class="num mono" data-label="Критичные/1000">
1145
 
@@ -1175,7 +1211,7 @@
1175
  </tr>
1176
 
1177
  <tr data-model="openrouter/moonshotai/kimi-k2.5">
1178
- <td class="rank mono sticky-0" data-label="#">#31</td>
1179
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (non-reasoning, Moonshot AI API)</td>
1180
  <td class="num mono" data-label="Критичные/1000">
1181
 
@@ -1211,7 +1247,7 @@
1211
  </tr>
1212
 
1213
  <tr data-model="openai/t-tech/T-pro-it-2.0">
1214
- <td class="rank mono sticky-0" data-label="#">#32</td>
1215
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
1216
  <td class="num mono" data-label="Критичные/1000">
1217
 
@@ -1247,7 +1283,7 @@
1247
  </tr>
1248
 
1249
  <tr data-model="openrouter/openrouter/polaris-alpha">
1250
- <td class="rank mono sticky-0" data-label="#">#33</td>
1251
  <td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
1252
  <td class="num mono" data-label="Критичные/1000">
1253
 
@@ -1283,7 +1319,7 @@
1283
  </tr>
1284
 
1285
  <tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
1286
- <td class="rank mono sticky-0" data-label="#">#34</td>
1287
  <td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview 0.6 (Arcee-AI API)</td>
1288
  <td class="num mono" data-label="Критичные/1000">
1289
 
@@ -1318,8 +1354,44 @@
1318
  <td class="num mono" data-label="Всего токенов">61,298</td>
1319
  </tr>
1320
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1321
  <tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
1322
- <td class="rank mono sticky-0" data-label="#">#35</td>
1323
  <td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
1324
  <td class="num mono" data-label="Критичные/1000">
1325
 
@@ -1355,7 +1427,7 @@
1355
  </tr>
1356
 
1357
  <tr data-model="openrouter/z-ai/glm-4.7-flash">
1358
- <td class="rank mono sticky-0" data-label="#">#36</td>
1359
  <td class="model-name sticky-1" data-label="Модель">zai-org/GLM-4.7-Flash (z.ai API, reasoning, temp=0.6)</td>
1360
  <td class="num mono" data-label="Критичные/1000">
1361
 
@@ -1391,7 +1463,7 @@
1391
  </tr>
1392
 
1393
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
1394
- <td class="rank mono sticky-0" data-label="#">#37</td>
1395
  <td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
1396
  <td class="num mono" data-label="Критичные/1000">
1397
 
@@ -1427,7 +1499,7 @@
1427
  </tr>
1428
 
1429
  <tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
1430
- <td class="rank mono sticky-0" data-label="#">#38</td>
1431
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
1432
  <td class="num mono" data-label="Критичные/1000">
1433
 
@@ -1463,7 +1535,7 @@
1463
  </tr>
1464
 
1465
  <tr data-model="openrouter/moonshotai/kimi-k2.5">
1466
- <td class="rank mono sticky-0" data-label="#">#39</td>
1467
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (reasoning, temp=1, Moonshot AI API)</td>
1468
  <td class="num mono" data-label="Критичные/1000">
1469
 
@@ -1499,7 +1571,7 @@
1499
  </tr>
1500
 
1501
  <tr data-model="openrouter/moonshotai/kimi-k2-0905">
1502
- <td class="rank mono sticky-0" data-label="#">#40</td>
1503
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
1504
  <td class="num mono" data-label="Критичные/1000">
1505
 
@@ -1535,7 +1607,7 @@
1535
  </tr>
1536
 
1537
  <tr data-model="openrouter/z-ai/glm-4.6">
1538
- <td class="rank mono sticky-0" data-label="#">#41</td>
1539
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
1540
  <td class="num mono" data-label="Критичные/1000">
1541
 
@@ -1571,7 +1643,7 @@
1571
  </tr>
1572
 
1573
  <tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
1574
- <td class="rank mono sticky-0" data-label="#">#42</td>
1575
  <td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview (Arcee-AI API)</td>
1576
  <td class="num mono" data-label="Критичные/1000">
1577
 
@@ -1607,7 +1679,7 @@
1607
  </tr>
1608
 
1609
  <tr data-model="openrouter/openai/gpt-5">
1610
- <td class="rank mono sticky-0" data-label="#">#43</td>
1611
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
1612
  <td class="num mono" data-label="Критичные/1000">
1613
 
@@ -1643,7 +1715,7 @@
1643
  </tr>
1644
 
1645
  <tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
1646
- <td class="rank mono sticky-0" data-label="#">#44</td>
1647
  <td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
1648
  <td class="num mono" data-label="Критичные/1000">
1649
 
@@ -1679,7 +1751,7 @@
1679
  </tr>
1680
 
1681
  <tr data-model="openrouter/openai/gpt-5">
1682
- <td class="rank mono sticky-0" data-label="#">#45</td>
1683
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
1684
  <td class="num mono" data-label="Критичные/1000">
1685
 
@@ -1715,7 +1787,7 @@
1715
  </tr>
1716
 
1717
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
1718
- <td class="rank mono sticky-0" data-label="#">#46</td>
1719
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
1720
  <td class="num mono" data-label="Критичные/1000">
1721
 
@@ -1751,7 +1823,7 @@
1751
  </tr>
1752
 
1753
  <tr data-model="openrouter/stepfun/step-3.5-flash:free">
1754
- <td class="rank mono sticky-0" data-label="#">#47</td>
1755
  <td class="model-name sticky-1" data-label="Модель">Step-3.5-flash (StepFun API, fp8, temp=0.6, reasoning)</td>
1756
  <td class="num mono" data-label="Критичные/1000">
1757
 
@@ -1787,7 +1859,7 @@
1787
  </tr>
1788
 
1789
  <tr data-model="openrouter/openai/gpt-oss-120b">
1790
- <td class="rank mono sticky-0" data-label="#">#48</td>
1791
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
1792
  <td class="num mono" data-label="Критичные/1000">
1793
 
@@ -1823,7 +1895,7 @@
1823
  </tr>
1824
 
1825
  <tr data-model="openai/gpt-4.1">
1826
- <td class="rank mono sticky-0" data-label="#">#49</td>
1827
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
1828
  <td class="num mono" data-label="Критичные/1000">
1829
 
@@ -1859,7 +1931,7 @@
1859
  </tr>
1860
 
1861
  <tr data-model="openrouter/nvidia/nemotron-3-nano-30b-a3b:free">
1862
- <td class="rank mono sticky-0" data-label="#">#50</td>
1863
  <td class="model-name sticky-1" data-label="Модель">Nemotron-3-Nano-30B-A3B (NVIDIA API, non-reasoning)</td>
1864
  <td class="num mono" data-label="Критичные/1000">
1865
 
@@ -1895,7 +1967,7 @@
1895
  </tr>
1896
 
1897
  <tr data-model="mistral/ministral-3b-2512">
1898
- <td class="rank mono sticky-0" data-label="#">#51</td>
1899
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-3B-Instruct-2512 (Mistral API)</td>
1900
  <td class="num mono" data-label="Критичные/1000">
1901
 
@@ -1931,7 +2003,7 @@
1931
  </tr>
1932
 
1933
  <tr data-model="openrouter/mistralai/mistral-nemo">
1934
- <td class="rank mono sticky-0" data-label="#">#52</td>
1935
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
1936
  <td class="num mono" data-label="Критичные/1000">
1937
 
@@ -1967,7 +2039,7 @@
1967
  </tr>
1968
 
1969
  <tr data-model="openai/gpt-4.1-mini">
1970
- <td class="rank mono sticky-0" data-label="#">#53</td>
1971
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
1972
  <td class="num mono" data-label="Критичные/1000">
1973
 
@@ -2003,7 +2075,7 @@
2003
  </tr>
2004
 
2005
  <tr data-model="openrouter/minimax/minimax-m2:free">
2006
- <td class="rank mono sticky-0" data-label="#">#54</td>
2007
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
2008
  <td class="num mono" data-label="Критичные/1000">
2009
 
@@ -2039,7 +2111,7 @@
2039
  </tr>
2040
 
2041
  <tr data-model="openrouter/minimax/minimax-m2:free">
2042
- <td class="rank mono sticky-0" data-label="#">#55</td>
2043
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
2044
  <td class="num mono" data-label="Критичные/1000">
2045
 
@@ -2075,7 +2147,7 @@
2075
  </tr>
2076
 
2077
  <tr data-model="openai/gpt-4.1-nano">
2078
- <td class="rank mono sticky-0" data-label="#">#56</td>
2079
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
2080
  <td class="num mono" data-label="Критичные/1000">
2081
 
@@ -2111,7 +2183,7 @@
2111
  </tr>
2112
 
2113
  <tr data-model="openai/ai-sage/GigaChat3-10B-A1.8B-bf16">
2114
- <td class="rank mono sticky-0" data-label="#">#57</td>
2115
  <td class="model-name sticky-1" data-label="Модель">ai-sage/GigaChat3-10B-A1.8B-bf16 (sglang)</td>
2116
  <td class="num mono" data-label="Критичные/1000">
2117
 
@@ -2147,7 +2219,7 @@
2147
  </tr>
2148
 
2149
  <tr data-model="openrouter/openai/gpt-oss-20b">
2150
- <td class="rank mono sticky-0" data-label="#">#58</td>
2151
  <td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
2152
  <td class="num mono" data-label="Критичные/1000">
2153
 
@@ -2205,7 +2277,7 @@
2205
  </div>
2206
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
2207
  <p class="info-text">
2208
- Обновлено: 2026-02-09 17:13:53 | Всего моделей: 58 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
2209
  </p>
2210
  </div>
2211
  <script>
 
598
  <td class="num mono" data-label="Всего токенов">47,060</td>
599
  </tr>
600
 
601
+ <tr data-model="openrouter/qwen/qwen3.5-397b-a17b">
602
  <td class="rank mono sticky-0" data-label="#">#15</td>
603
+ <td class="model-name sticky-1" data-label="Модель">qwen/qwen3.5-397b-a17b, non-reasoning, Alibaba API</td>
604
+ <td class="num mono" data-label="Критичные/1000">
605
+
606
+ 0.19 ± 0.02
607
+
608
+ </td>
609
+ <td class="num mono" data-label="Обычные/1000">
610
+
611
+ 0.34 ± 0.05
612
+
613
+ </td>
614
+ <td class="num mono" data-label="Доп./1000">
615
+
616
+ 0.13 ± 0.02
617
+
618
+ </td>
619
+ <td data-label="Нормировано ошибок">
620
+ <div class="score-cell">
621
+ <div class="progress-bar">
622
+
623
+
624
+
625
+ <div class="progress-fill" style="width: 80.5%"></div>
626
+ </div>
627
+ <span class="score-value">
628
+
629
+ 0.78 ± 0.08
630
+
631
+ </span>
632
+ </div>
633
+ </td>
634
+ <td class="num mono" data-label="Всего токенов">147,482</td>
635
+ </tr>
636
+
637
+ <tr data-model="deepseek/deepseek-chat">
638
+ <td class="rank mono sticky-0" data-label="#">#16</td>
639
  <td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-chat (Deepseek API)</td>
640
  <td class="num mono" data-label="Критичные/1000">
641
 
 
671
  </tr>
672
 
673
  <tr data-model="openrouter/anthropic/claude-haiku-4.5">
674
+ <td class="rank mono sticky-0" data-label="#">#17</td>
675
  <td class="model-name sticky-1" data-label="Модель">Claude Haiku 4.5</td>
676
  <td class="num mono" data-label="Критичные/1000">
677
 
 
707
  </tr>
708
 
709
  <tr data-model="openai/t-tech/T-pro-it-2.1">
710
+ <td class="rank mono sticky-0" data-label="#">#18</td>
711
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.1 (sglang)</td>
712
  <td class="num mono" data-label="Критичные/1000">
713
 
 
743
  </tr>
744
 
745
  <tr data-model="openai/Qwen/Qwen3-VL-32B-Instruct">
746
+ <td class="rank mono sticky-0" data-label="#">#19</td>
747
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-32B-Instruct (SGLang)</td>
748
  <td class="num mono" data-label="Критичные/1000">
749
 
 
779
  </tr>
780
 
781
  <tr data-model="openai/AvitoTech/avibe">
782
+ <td class="rank mono sticky-0" data-label="#">#20</td>
783
  <td class="model-name sticky-1" data-label="Модель">AvitoTech/avibe</td>
784
  <td class="num mono" data-label="Критичные/1000">
785
 
 
815
  </tr>
816
 
817
  <tr data-model="openrouter/openrouter/pony-alpha">
818
+ <td class="rank mono sticky-0" data-label="#">#21</td>
819
  <td class="model-name sticky-1" data-label="Модель">Pony Alpha (temp=0.6)</td>
820
  <td class="num mono" data-label="Критичные/1000">
821
 
 
851
  </tr>
852
 
853
  <tr data-model="openai/ai-sage/GigaChat-20B-A3B-instruct-v1.5-bf16">
854
+ <td class="rank mono sticky-0" data-label="#">#22</td>
855
  <td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
856
  <td class="num mono" data-label="Критичные/1000">
857
 
 
887
  </tr>
888
 
889
  <tr data-model="deepseek/deepseek-reasoner">
890
+ <td class="rank mono sticky-0" data-label="#">#23</td>
891
  <td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-reasoner (Deepseek API)</td>
892
  <td class="num mono" data-label="Критичные/1000">
893
 
 
923
  </tr>
924
 
925
  <tr data-model="mistral/ministral-14b-2512">
926
+ <td class="rank mono sticky-0" data-label="#">#24</td>
927
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-14B-Instruct-2512 (Mistral API)</td>
928
  <td class="num mono" data-label="Критичные/1000">
929
 
 
959
  </tr>
960
 
961
  <tr data-model="litellm_proxy/deepseek-v3">
962
+ <td class="rank mono sticky-0" data-label="#">#25</td>
963
  <td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
964
  <td class="num mono" data-label="Критичные/1000">
965
 
 
995
  </tr>
996
 
997
  <tr data-model="litellm_proxy/tmp-gemma-3n-e4b-it">
998
+ <td class="rank mono sticky-0" data-label="#">#26</td>
999
  <td class="model-name sticky-1" data-label="Модель">google/gemma-3n-E4B-it (AI Studio)</td>
1000
  <td class="num mono" data-label="Критичные/1000">
1001
 
 
1031
  </tr>
1032
 
1033
  <tr data-model="mistral/ministral-8b-2512">
1034
+ <td class="rank mono sticky-0" data-label="#">#27</td>
1035
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-8B-Instruct-2512 (Mistral API)</td>
1036
  <td class="num mono" data-label="Критичные/1000">
1037
 
 
1067
  </tr>
1068
 
1069
  <tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
1070
+ <td class="rank mono sticky-0" data-label="#">#28</td>
1071
  <td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
1072
  <td class="num mono" data-label="Критичные/1000">
1073
 
 
1103
  </tr>
1104
 
1105
  <tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
1106
+ <td class="rank mono sticky-0" data-label="#">#29</td>
1107
  <td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
1108
  <td class="num mono" data-label="Критичные/1000">
1109
 
 
1139
  </tr>
1140
 
1141
  <tr data-model="openai/mimo-v2-flash">
1142
+ <td class="rank mono sticky-0" data-label="#">#30</td>
1143
  <td class="model-name sticky-1" data-label="Модель">Xiaomi Mimo V2 Flash (Xiaomi API, non-reasoning)</td>
1144
  <td class="num mono" data-label="Критичные/1000">
1145
 
 
1175
  </tr>
1176
 
1177
  <tr data-model="openai/Qwen/Qwen3-32B">
1178
+ <td class="rank mono sticky-0" data-label="#">#31</td>
1179
  <td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoning)</td>
1180
  <td class="num mono" data-label="Критичные/1000">
1181
 
 
1211
  </tr>
1212
 
1213
  <tr data-model="openrouter/moonshotai/kimi-k2.5">
1214
+ <td class="rank mono sticky-0" data-label="#">#32</td>
1215
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (non-reasoning, Moonshot AI API)</td>
1216
  <td class="num mono" data-label="Критичные/1000">
1217
 
 
1247
  </tr>
1248
 
1249
  <tr data-model="openai/t-tech/T-pro-it-2.0">
1250
+ <td class="rank mono sticky-0" data-label="#">#33</td>
1251
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
1252
  <td class="num mono" data-label="Критичные/1000">
1253
 
 
1283
  </tr>
1284
 
1285
  <tr data-model="openrouter/openrouter/polaris-alpha">
1286
+ <td class="rank mono sticky-0" data-label="#">#34</td>
1287
  <td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
1288
  <td class="num mono" data-label="Критичные/1000">
1289
 
 
1319
  </tr>
1320
 
1321
  <tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
1322
+ <td class="rank mono sticky-0" data-label="#">#35</td>
1323
  <td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview 0.6 (Arcee-AI API)</td>
1324
  <td class="num mono" data-label="Критичные/1000">
1325
 
 
1354
  <td class="num mono" data-label="Всего токенов">61,298</td>
1355
  </tr>
1356
 
1357
+ <tr data-model="openrouter/minimax/minimax-m2.5">
1358
+ <td class="rank mono sticky-0" data-label="#">#36</td>
1359
+ <td class="model-name sticky-1" data-label="Модель">minimax/minimax-m2.5, reasoning, Minimax API</td>
1360
+ <td class="num mono" data-label="Критичные/1000">
1361
+
1362
+ 0.48 ± 0.10
1363
+
1364
+ </td>
1365
+ <td class="num mono" data-label="Обычные/1000">
1366
+
1367
+ 0.36 ± 0.03
1368
+
1369
+ </td>
1370
+ <td class="num mono" data-label="Доп./1000">
1371
+
1372
+ 0.16 ± 0.02
1373
+
1374
+ </td>
1375
+ <td data-label="Нормировано ошибок">
1376
+ <div class="score-cell">
1377
+ <div class="progress-bar">
1378
+
1379
+
1380
+
1381
+ <div class="progress-fill" style="width: 65.25000000000001%"></div>
1382
+ </div>
1383
+ <span class="score-value">
1384
+
1385
+ 1.39 ± 0.23
1386
+
1387
+ </span>
1388
+ </div>
1389
+ </td>
1390
+ <td class="num mono" data-label="Всего токенов">159,619</td>
1391
+ </tr>
1392
+
1393
  <tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
1394
+ <td class="rank mono sticky-0" data-label="#">#37</td>
1395
  <td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
1396
  <td class="num mono" data-label="Критичные/1000">
1397
 
 
1427
  </tr>
1428
 
1429
  <tr data-model="openrouter/z-ai/glm-4.7-flash">
1430
+ <td class="rank mono sticky-0" data-label="#">#38</td>
1431
  <td class="model-name sticky-1" data-label="Модель">zai-org/GLM-4.7-Flash (z.ai API, reasoning, temp=0.6)</td>
1432
  <td class="num mono" data-label="Критичные/1000">
1433
 
 
1463
  </tr>
1464
 
1465
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
1466
+ <td class="rank mono sticky-0" data-label="#">#39</td>
1467
  <td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
1468
  <td class="num mono" data-label="Критичные/1000">
1469
 
 
1499
  </tr>
1500
 
1501
  <tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
1502
+ <td class="rank mono sticky-0" data-label="#">#40</td>
1503
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
1504
  <td class="num mono" data-label="Критичные/1000">
1505
 
 
1535
  </tr>
1536
 
1537
  <tr data-model="openrouter/moonshotai/kimi-k2.5">
1538
+ <td class="rank mono sticky-0" data-label="#">#41</td>
1539
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (reasoning, temp=1, Moonshot AI API)</td>
1540
  <td class="num mono" data-label="Критичные/1000">
1541
 
 
1571
  </tr>
1572
 
1573
  <tr data-model="openrouter/moonshotai/kimi-k2-0905">
1574
+ <td class="rank mono sticky-0" data-label="#">#42</td>
1575
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
1576
  <td class="num mono" data-label="Критичные/1000">
1577
 
 
1607
  </tr>
1608
 
1609
  <tr data-model="openrouter/z-ai/glm-4.6">
1610
+ <td class="rank mono sticky-0" data-label="#">#43</td>
1611
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
1612
  <td class="num mono" data-label="Критичные/1000">
1613
 
 
1643
  </tr>
1644
 
1645
  <tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
1646
+ <td class="rank mono sticky-0" data-label="#">#44</td>
1647
  <td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview (Arcee-AI API)</td>
1648
  <td class="num mono" data-label="Критичные/1000">
1649
 
 
1679
  </tr>
1680
 
1681
  <tr data-model="openrouter/openai/gpt-5">
1682
+ <td class="rank mono sticky-0" data-label="#">#45</td>
1683
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
1684
  <td class="num mono" data-label="Критичные/1000">
1685
 
 
1715
  </tr>
1716
 
1717
  <tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
1718
+ <td class="rank mono sticky-0" data-label="#">#46</td>
1719
  <td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
1720
  <td class="num mono" data-label="Критичные/1000">
1721
 
 
1751
  </tr>
1752
 
1753
  <tr data-model="openrouter/openai/gpt-5">
1754
+ <td class="rank mono sticky-0" data-label="#">#47</td>
1755
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
1756
  <td class="num mono" data-label="Критичные/1000">
1757
 
 
1787
  </tr>
1788
 
1789
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
1790
+ <td class="rank mono sticky-0" data-label="#">#48</td>
1791
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
1792
  <td class="num mono" data-label="Критичные/1000">
1793
 
 
1823
  </tr>
1824
 
1825
  <tr data-model="openrouter/stepfun/step-3.5-flash:free">
1826
+ <td class="rank mono sticky-0" data-label="#">#49</td>
1827
  <td class="model-name sticky-1" data-label="Модель">Step-3.5-flash (StepFun API, fp8, temp=0.6, reasoning)</td>
1828
  <td class="num mono" data-label="Критичные/1000">
1829
 
 
1859
  </tr>
1860
 
1861
  <tr data-model="openrouter/openai/gpt-oss-120b">
1862
+ <td class="rank mono sticky-0" data-label="#">#50</td>
1863
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
1864
  <td class="num mono" data-label="Критичные/1000">
1865
 
 
1895
  </tr>
1896
 
1897
  <tr data-model="openai/gpt-4.1">
1898
+ <td class="rank mono sticky-0" data-label="#">#51</td>
1899
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
1900
  <td class="num mono" data-label="Критичные/1000">
1901
 
 
1931
  </tr>
1932
 
1933
  <tr data-model="openrouter/nvidia/nemotron-3-nano-30b-a3b:free">
1934
+ <td class="rank mono sticky-0" data-label="#">#52</td>
1935
  <td class="model-name sticky-1" data-label="Модель">Nemotron-3-Nano-30B-A3B (NVIDIA API, non-reasoning)</td>
1936
  <td class="num mono" data-label="Критичные/1000">
1937
 
 
1967
  </tr>
1968
 
1969
  <tr data-model="mistral/ministral-3b-2512">
1970
+ <td class="rank mono sticky-0" data-label="#">#53</td>
1971
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-3B-Instruct-2512 (Mistral API)</td>
1972
  <td class="num mono" data-label="Критичные/1000">
1973
 
 
2003
  </tr>
2004
 
2005
  <tr data-model="openrouter/mistralai/mistral-nemo">
2006
+ <td class="rank mono sticky-0" data-label="#">#54</td>
2007
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
2008
  <td class="num mono" data-label="Критичные/1000">
2009
 
 
2039
  </tr>
2040
 
2041
  <tr data-model="openai/gpt-4.1-mini">
2042
+ <td class="rank mono sticky-0" data-label="#">#55</td>
2043
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
2044
  <td class="num mono" data-label="Критичные/1000">
2045
 
 
2075
  </tr>
2076
 
2077
  <tr data-model="openrouter/minimax/minimax-m2:free">
2078
+ <td class="rank mono sticky-0" data-label="#">#56</td>
2079
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
2080
  <td class="num mono" data-label="Критичные/1000">
2081
 
 
2111
  </tr>
2112
 
2113
  <tr data-model="openrouter/minimax/minimax-m2:free">
2114
+ <td class="rank mono sticky-0" data-label="#">#57</td>
2115
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
2116
  <td class="num mono" data-label="Критичные/1000">
2117
 
 
2147
  </tr>
2148
 
2149
  <tr data-model="openai/gpt-4.1-nano">
2150
+ <td class="rank mono sticky-0" data-label="#">#58</td>
2151
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
2152
  <td class="num mono" data-label="Критичные/1000">
2153
 
 
2183
  </tr>
2184
 
2185
  <tr data-model="openai/ai-sage/GigaChat3-10B-A1.8B-bf16">
2186
+ <td class="rank mono sticky-0" data-label="#">#59</td>
2187
  <td class="model-name sticky-1" data-label="Модель">ai-sage/GigaChat3-10B-A1.8B-bf16 (sglang)</td>
2188
  <td class="num mono" data-label="Критичные/1000">
2189
 
 
2219
  </tr>
2220
 
2221
  <tr data-model="openrouter/openai/gpt-oss-20b">
2222
+ <td class="rank mono sticky-0" data-label="#">#60</td>
2223
  <td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
2224
  <td class="num mono" data-label="Критичные/1000">
2225
 
 
2277
  </div>
2278
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
2279
  <p class="info-text">
2280
+ Обновлено: 2026-02-16 14:02:03 | Всего моделей: 60 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
2281
  </p>
2282
  </div>
2283
  <script>