kristaller486 committed on
Commit
a5e5691
·
verified ·
1 Parent(s): 2f72a3d

add Mistral 3

Browse files
Files changed (1) hide show
  1. index.html +187 -43
index.html CHANGED
@@ -130,8 +130,44 @@
130
  <td class="num mono" data-label="Всего токенов">125,802</td>
131
  </tr>
132
 
133
- <tr data-model="litellm_proxy/gemini/gemini-3-pro-preview">
134
  <td class="rank mono sticky-0" data-label="#">#2</td>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
135
  <td class="model-name sticky-1" data-label="Модель">Gemini 3 Pro Preview</td>
136
  <td class="num mono" data-label="Критичные/1000">
137
 
@@ -167,7 +203,7 @@
167
  </tr>
168
 
169
  <tr data-model="openrouter/anthropic/claude-sonnet-4.5">
170
- <td class="rank mono sticky-0" data-label="#">#3</td>
171
  <td class="model-name sticky-1" data-label="Модель">Claude Sonnet 4.5</td>
172
  <td class="num mono" data-label="Критичные/1000">
173
 
@@ -203,7 +239,7 @@
203
  </tr>
204
 
205
  <tr data-model="openrouter/openai/gpt-4o">
206
- <td class="rank mono sticky-0" data-label="#">#4</td>
207
  <td class="model-name sticky-1" data-label="Модель">GPT-4o</td>
208
  <td class="num mono" data-label="Критичные/1000">
209
 
@@ -239,7 +275,7 @@
239
  </tr>
240
 
241
  <tr data-model="litellm_proxy/gemini-2.5-flash">
242
- <td class="rank mono sticky-0" data-label="#">#5</td>
243
  <td class="model-name sticky-1" data-label="Модель">Gemini 2.5 Flash (GA)</td>
244
  <td class="num mono" data-label="Критичные/1000">
245
 
@@ -275,7 +311,7 @@
275
  </tr>
276
 
277
  <tr data-model="openrouter/minimax/minimax-01">
278
- <td class="rank mono sticky-0" data-label="#">#6</td>
279
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-Text-01 (Minimax API)</td>
280
  <td class="num mono" data-label="Критичные/1000">
281
 
@@ -311,7 +347,7 @@
311
  </tr>
312
 
313
  <tr data-model="openai/Vikhrmodels/Vistral-24B-Instruct">
314
- <td class="rank mono sticky-0" data-label="#">#7</td>
315
  <td class="model-name sticky-1" data-label="Модель">Vikhrmodels/Vistral-24B-Instruct (SGLang)</td>
316
  <td class="num mono" data-label="Критичные/1000">
317
 
@@ -347,7 +383,7 @@
347
  </tr>
348
 
349
  <tr data-model="openai/unsloth/gemma-3-27b-it">
350
- <td class="rank mono sticky-0" data-label="#">#8</td>
351
  <td class="model-name sticky-1" data-label="Модель">Gemma-3-27b-it (SGLang)</td>
352
  <td class="num mono" data-label="Критичные/1000">
353
 
@@ -383,7 +419,7 @@
383
  </tr>
384
 
385
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
386
- <td class="rank mono sticky-0" data-label="#">#9</td>
387
  <td class="model-name sticky-1" data-label="Модель">Qwen/Qwen3-235B-A22B-Instruct-2507 (Vertex AI API)</td>
388
  <td class="num mono" data-label="Критичные/1000">
389
 
@@ -419,7 +455,7 @@
419
  </tr>
420
 
421
  <tr data-model="openai/mistralai/Mistral-Small-3.2-24B-Instruct-2506">
422
- <td class="rank mono sticky-0" data-label="#">#10</td>
423
  <td class="model-name sticky-1" data-label="Модель">Mistral-Small-3.2-24B-Instruct-2506 (vllm)</td>
424
  <td class="num mono" data-label="Критичные/1000">
425
 
@@ -455,7 +491,7 @@
455
  </tr>
456
 
457
  <tr data-model="openrouter/deepseek/deepseek-chat">
458
- <td class="rank mono sticky-0" data-label="#">#11</td>
459
  <td class="model-name sticky-1" data-label="Модель">DeepSeek V3 (Novita API)</td>
460
  <td class="num mono" data-label="Критичные/1000">
461
 
@@ -491,7 +527,7 @@
491
  </tr>
492
 
493
  <tr data-model="openai/RefalMachine/RuadaptQwen3-32B-Instruct">
494
- <td class="rank mono sticky-0" data-label="#">#12</td>
495
  <td class="model-name sticky-1" data-label="Модель">RefalMachine/RuadaptQwen3-32B-Instruct (SGLang)</td>
496
  <td class="num mono" data-label="Критичные/1000">
497
 
@@ -527,7 +563,7 @@
527
  </tr>
528
 
529
  <tr data-model="openai/yandex/YandexGPT-5-Lite-8B-instruct">
530
- <td class="rank mono sticky-0" data-label="#">#13</td>
531
  <td class="model-name sticky-1" data-label="Модель">yandex/YandexGPT-5-Lite-8B-instruct (SGLang)</td>
532
  <td class="num mono" data-label="Критичные/1000">
533
 
@@ -563,7 +599,7 @@
563
  </tr>
564
 
565
  <tr data-model="deepseek/deepseek-chat">
566
- <td class="rank mono sticky-0" data-label="#">#14</td>
567
  <td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-chat (Deepseek API)</td>
568
  <td class="num mono" data-label="Критичные/1000">
569
 
@@ -599,7 +635,7 @@
599
  </tr>
600
 
601
  <tr data-model="openrouter/anthropic/claude-haiku-4.5">
602
- <td class="rank mono sticky-0" data-label="#">#15</td>
603
  <td class="model-name sticky-1" data-label="Модель">Claude Haiku 4.5</td>
604
  <td class="num mono" data-label="Критичные/1000">
605
 
@@ -635,7 +671,7 @@
635
  </tr>
636
 
637
  <tr data-model="openai/Qwen/Qwen3-VL-32B-Instruct">
638
- <td class="rank mono sticky-0" data-label="#">#16</td>
639
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-32B-Instruct (SGLang)</td>
640
  <td class="num mono" data-label="Критичные/1000">
641
 
@@ -671,7 +707,7 @@
671
  </tr>
672
 
673
  <tr data-model="openai/AvitoTech/avibe">
674
- <td class="rank mono sticky-0" data-label="#">#17</td>
675
  <td class="model-name sticky-1" data-label="Модель">AvitoTech/avibe</td>
676
  <td class="num mono" data-label="Критичные/1000">
677
 
@@ -707,7 +743,7 @@
707
  </tr>
708
 
709
  <tr data-model="openai/ai-sage/GigaChat-20B-A3B-instruct-v1.5-bf16">
710
- <td class="rank mono sticky-0" data-label="#">#18</td>
711
  <td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
712
  <td class="num mono" data-label="Критичные/1000">
713
 
@@ -743,7 +779,7 @@
743
  </tr>
744
 
745
  <tr data-model="deepseek/deepseek-reasoner">
746
- <td class="rank mono sticky-0" data-label="#">#19</td>
747
  <td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-reasoner (Deepseek API)</td>
748
  <td class="num mono" data-label="Критичные/1000">
749
 
@@ -778,8 +814,44 @@
778
  <td class="num mono" data-label="Всего токенов">118,309</td>
779
  </tr>
780
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
781
  <tr data-model="litellm_proxy/deepseek-v3">
782
- <td class="rank mono sticky-0" data-label="#">#20</td>
783
  <td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
784
  <td class="num mono" data-label="Критичные/1000">
785
 
@@ -815,7 +887,7 @@
815
  </tr>
816
 
817
  <tr data-model="litellm_proxy/tmp-gemma-3n-e4b-it">
818
- <td class="rank mono sticky-0" data-label="#">#21</td>
819
  <td class="model-name sticky-1" data-label="Модель">google/gemma-3n-E4B-it (AI Studio)</td>
820
  <td class="num mono" data-label="Критичные/1000">
821
 
@@ -850,8 +922,44 @@
850
  <td class="num mono" data-label="Всего токенов">99,646</td>
851
  </tr>
852
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
853
  <tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
854
- <td class="rank mono sticky-0" data-label="#">#22</td>
855
  <td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
856
  <td class="num mono" data-label="Критичные/1000">
857
 
@@ -887,7 +995,7 @@
887
  </tr>
888
 
889
  <tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
890
- <td class="rank mono sticky-0" data-label="#">#23</td>
891
  <td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
892
  <td class="num mono" data-label="Критичные/1000">
893
 
@@ -923,7 +1031,7 @@
923
  </tr>
924
 
925
  <tr data-model="openai/Qwen/Qwen3-32B">
926
- <td class="rank mono sticky-0" data-label="#">#24</td>
927
  <td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoining)</td>
928
  <td class="num mono" data-label="Критичные/1000">
929
 
@@ -959,7 +1067,7 @@
959
  </tr>
960
 
961
  <tr data-model="openai/t-tech/T-pro-it-2.0">
962
- <td class="rank mono sticky-0" data-label="#">#25</td>
963
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
964
  <td class="num mono" data-label="Критичные/1000">
965
 
@@ -995,7 +1103,7 @@
995
  </tr>
996
 
997
  <tr data-model="openrouter/openrouter/polaris-alpha">
998
- <td class="rank mono sticky-0" data-label="#">#26</td>
999
  <td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
1000
  <td class="num mono" data-label="Критичные/1000">
1001
 
@@ -1031,7 +1139,7 @@
1031
  </tr>
1032
 
1033
  <tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
1034
- <td class="rank mono sticky-0" data-label="#">#27</td>
1035
  <td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
1036
  <td class="num mono" data-label="Критичные/1000">
1037
 
@@ -1067,7 +1175,7 @@
1067
  </tr>
1068
 
1069
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
1070
- <td class="rank mono sticky-0" data-label="#">#28</td>
1071
  <td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
1072
  <td class="num mono" data-label="Критичные/1000">
1073
 
@@ -1103,7 +1211,7 @@
1103
  </tr>
1104
 
1105
  <tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
1106
- <td class="rank mono sticky-0" data-label="#">#29</td>
1107
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
1108
  <td class="num mono" data-label="Критичные/1000">
1109
 
@@ -1139,7 +1247,7 @@
1139
  </tr>
1140
 
1141
  <tr data-model="openrouter/moonshotai/kimi-k2-0905">
1142
- <td class="rank mono sticky-0" data-label="#">#30</td>
1143
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
1144
  <td class="num mono" data-label="Критичные/1000">
1145
 
@@ -1175,7 +1283,7 @@
1175
  </tr>
1176
 
1177
  <tr data-model="openrouter/z-ai/glm-4.6">
1178
- <td class="rank mono sticky-0" data-label="#">#31</td>
1179
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
1180
  <td class="num mono" data-label="Критичные/1000">
1181
 
@@ -1211,7 +1319,7 @@
1211
  </tr>
1212
 
1213
  <tr data-model="openrouter/openai/gpt-5">
1214
- <td class="rank mono sticky-0" data-label="#">#32</td>
1215
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
1216
  <td class="num mono" data-label="Критичные/1000">
1217
 
@@ -1247,7 +1355,7 @@
1247
  </tr>
1248
 
1249
  <tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
1250
- <td class="rank mono sticky-0" data-label="#">#33</td>
1251
  <td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
1252
  <td class="num mono" data-label="Критичные/1000">
1253
 
@@ -1283,7 +1391,7 @@
1283
  </tr>
1284
 
1285
  <tr data-model="openrouter/openai/gpt-5">
1286
- <td class="rank mono sticky-0" data-label="#">#34</td>
1287
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
1288
  <td class="num mono" data-label="Критичные/1000">
1289
 
@@ -1319,7 +1427,7 @@
1319
  </tr>
1320
 
1321
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
1322
- <td class="rank mono sticky-0" data-label="#">#35</td>
1323
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
1324
  <td class="num mono" data-label="Критичные/1000">
1325
 
@@ -1355,7 +1463,7 @@
1355
  </tr>
1356
 
1357
  <tr data-model="openrouter/openai/gpt-oss-120b">
1358
- <td class="rank mono sticky-0" data-label="#">#36</td>
1359
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
1360
  <td class="num mono" data-label="Критичные/1000">
1361
 
@@ -1391,7 +1499,7 @@
1391
  </tr>
1392
 
1393
  <tr data-model="openai/gpt-4.1">
1394
- <td class="rank mono sticky-0" data-label="#">#37</td>
1395
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
1396
  <td class="num mono" data-label="Критичные/1000">
1397
 
@@ -1426,8 +1534,44 @@
1426
  <td class="num mono" data-label="Всего токенов">85,822</td>
1427
  </tr>
1428
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1429
  <tr data-model="openrouter/mistralai/mistral-nemo">
1430
- <td class="rank mono sticky-0" data-label="#">#38</td>
1431
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
1432
  <td class="num mono" data-label="Критичные/1000">
1433
 
@@ -1463,7 +1607,7 @@
1463
  </tr>
1464
 
1465
  <tr data-model="openai/gpt-4.1-mini">
1466
- <td class="rank mono sticky-0" data-label="#">#39</td>
1467
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
1468
  <td class="num mono" data-label="Критичные/1000">
1469
 
@@ -1499,7 +1643,7 @@
1499
  </tr>
1500
 
1501
  <tr data-model="openrouter/minimax/minimax-m2:free">
1502
- <td class="rank mono sticky-0" data-label="#">#40</td>
1503
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
1504
  <td class="num mono" data-label="Критичные/1000">
1505
 
@@ -1535,7 +1679,7 @@
1535
  </tr>
1536
 
1537
  <tr data-model="openrouter/minimax/minimax-m2:free">
1538
- <td class="rank mono sticky-0" data-label="#">#41</td>
1539
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
1540
  <td class="num mono" data-label="Критичные/1000">
1541
 
@@ -1571,7 +1715,7 @@
1571
  </tr>
1572
 
1573
  <tr data-model="openai/gpt-4.1-nano">
1574
- <td class="rank mono sticky-0" data-label="#">#42</td>
1575
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
1576
  <td class="num mono" data-label="Критичные/1000">
1577
 
@@ -1607,7 +1751,7 @@
1607
  </tr>
1608
 
1609
  <tr data-model="openrouter/openai/gpt-oss-20b">
1610
- <td class="rank mono sticky-0" data-label="#">#43</td>
1611
  <td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
1612
  <td class="num mono" data-label="Критичные/1000">
1613
 
@@ -1665,7 +1809,7 @@
1665
  </div>
1666
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
1667
  <p class="info-text">
1668
- Обновлено: 2025-12-01 20:43:49 | Всего моделей: 43 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
1669
  </p>
1670
  </div>
1671
  <script>
 
130
  <td class="num mono" data-label="Всего токенов">125,802</td>
131
  </tr>
132
 
133
+ <tr data-model="openrouter/mistralai/mistral-large-2512">
134
  <td class="rank mono sticky-0" data-label="#">#2</td>
135
+ <td class="model-name sticky-1" data-label="Модель">Mistral Large 3 2512 (Mistral API)</td>
136
+ <td class="num mono" data-label="Критичные/1000">
137
+
138
+ 0.04 ± 0.01
139
+
140
+ </td>
141
+ <td class="num mono" data-label="Обычные/1000">
142
+
143
+ 0.16 ± 0.02
144
+
145
+ </td>
146
+ <td class="num mono" data-label="Доп./1000">
147
+
148
+ 0.12 ± 0.01
149
+
150
+ </td>
151
+ <td data-label="Нормировано ошибок">
152
+ <div class="score-cell">
153
+ <div class="progress-bar">
154
+
155
+
156
+
157
+ <div class="progress-fill" style="width: 92.5%"></div>
158
+ </div>
159
+ <span class="score-value">
160
+
161
+ 0.30 ± 0.04
162
+
163
+ </span>
164
+ </div>
165
+ </td>
166
+ <td class="num mono" data-label="Всего токенов">136,383</td>
167
+ </tr>
168
+
169
+ <tr data-model="litellm_proxy/gemini/gemini-3-pro-preview">
170
+ <td class="rank mono sticky-0" data-label="#">#3</td>
171
  <td class="model-name sticky-1" data-label="Модель">Gemini 3 Pro Preview</td>
172
  <td class="num mono" data-label="Критичные/1000">
173
 
 
203
  </tr>
204
 
205
  <tr data-model="openrouter/anthropic/claude-sonnet-4.5">
206
+ <td class="rank mono sticky-0" data-label="#">#4</td>
207
  <td class="model-name sticky-1" data-label="Модель">Claude Sonnet 4.5</td>
208
  <td class="num mono" data-label="Критичные/1000">
209
 
 
239
  </tr>
240
 
241
  <tr data-model="openrouter/openai/gpt-4o">
242
+ <td class="rank mono sticky-0" data-label="#">#5</td>
243
  <td class="model-name sticky-1" data-label="Модель">GPT-4o</td>
244
  <td class="num mono" data-label="Критичные/1000">
245
 
 
275
  </tr>
276
 
277
  <tr data-model="litellm_proxy/gemini-2.5-flash">
278
+ <td class="rank mono sticky-0" data-label="#">#6</td>
279
  <td class="model-name sticky-1" data-label="Модель">Gemini 2.5 Flash (GA)</td>
280
  <td class="num mono" data-label="Критичные/1000">
281
 
 
311
  </tr>
312
 
313
  <tr data-model="openrouter/minimax/minimax-01">
314
+ <td class="rank mono sticky-0" data-label="#">#7</td>
315
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-Text-01 (Minimax API)</td>
316
  <td class="num mono" data-label="Критичные/1000">
317
 
 
347
  </tr>
348
 
349
  <tr data-model="openai/Vikhrmodels/Vistral-24B-Instruct">
350
+ <td class="rank mono sticky-0" data-label="#">#8</td>
351
  <td class="model-name sticky-1" data-label="Модель">Vikhrmodels/Vistral-24B-Instruct (SGLang)</td>
352
  <td class="num mono" data-label="Критичные/1000">
353
 
 
383
  </tr>
384
 
385
  <tr data-model="openai/unsloth/gemma-3-27b-it">
386
+ <td class="rank mono sticky-0" data-label="#">#9</td>
387
  <td class="model-name sticky-1" data-label="Модель">Gemma-3-27b-it (SGLang)</td>
388
  <td class="num mono" data-label="Критичные/1000">
389
 
 
419
  </tr>
420
 
421
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
422
+ <td class="rank mono sticky-0" data-label="#">#10</td>
423
  <td class="model-name sticky-1" data-label="Модель">Qwen/Qwen3-235B-A22B-Instruct-2507 (Vertex AI API)</td>
424
  <td class="num mono" data-label="Критичные/1000">
425
 
 
455
  </tr>
456
 
457
  <tr data-model="openai/mistralai/Mistral-Small-3.2-24B-Instruct-2506">
458
+ <td class="rank mono sticky-0" data-label="#">#11</td>
459
  <td class="model-name sticky-1" data-label="Модель">Mistral-Small-3.2-24B-Instruct-2506 (vllm)</td>
460
  <td class="num mono" data-label="Критичные/1000">
461
 
 
491
  </tr>
492
 
493
  <tr data-model="openrouter/deepseek/deepseek-chat">
494
+ <td class="rank mono sticky-0" data-label="#">#12</td>
495
  <td class="model-name sticky-1" data-label="Модель">DeepSeek V3 (Novita API)</td>
496
  <td class="num mono" data-label="Критичные/1000">
497
 
 
527
  </tr>
528
 
529
  <tr data-model="openai/RefalMachine/RuadaptQwen3-32B-Instruct">
530
+ <td class="rank mono sticky-0" data-label="#">#13</td>
531
  <td class="model-name sticky-1" data-label="Модель">RefalMachine/RuadaptQwen3-32B-Instruct (SGLang)</td>
532
  <td class="num mono" data-label="Критичные/1000">
533
 
 
563
  </tr>
564
 
565
  <tr data-model="openai/yandex/YandexGPT-5-Lite-8B-instruct">
566
+ <td class="rank mono sticky-0" data-label="#">#14</td>
567
  <td class="model-name sticky-1" data-label="Модель">yandex/YandexGPT-5-Lite-8B-instruct (SGLang)</td>
568
  <td class="num mono" data-label="Критичные/1000">
569
 
 
599
  </tr>
600
 
601
  <tr data-model="deepseek/deepseek-chat">
602
+ <td class="rank mono sticky-0" data-label="#">#15</td>
603
  <td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-chat (Deepseek API)</td>
604
  <td class="num mono" data-label="Критичные/1000">
605
 
 
635
  </tr>
636
 
637
  <tr data-model="openrouter/anthropic/claude-haiku-4.5">
638
+ <td class="rank mono sticky-0" data-label="#">#16</td>
639
  <td class="model-name sticky-1" data-label="Модель">Claude Haiku 4.5</td>
640
  <td class="num mono" data-label="Критичные/1000">
641
 
 
671
  </tr>
672
 
673
  <tr data-model="openai/Qwen/Qwen3-VL-32B-Instruct">
674
+ <td class="rank mono sticky-0" data-label="#">#17</td>
675
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-32B-Instruct (SGLang)</td>
676
  <td class="num mono" data-label="Критичные/1000">
677
 
 
707
  </tr>
708
 
709
  <tr data-model="openai/AvitoTech/avibe">
710
+ <td class="rank mono sticky-0" data-label="#">#18</td>
711
  <td class="model-name sticky-1" data-label="Модель">AvitoTech/avibe</td>
712
  <td class="num mono" data-label="Критичные/1000">
713
 
 
743
  </tr>
744
 
745
  <tr data-model="openai/ai-sage/GigaChat-20B-A3B-instruct-v1.5-bf16">
746
+ <td class="rank mono sticky-0" data-label="#">#19</td>
747
  <td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
748
  <td class="num mono" data-label="Критичные/1000">
749
 
 
779
  </tr>
780
 
781
  <tr data-model="deepseek/deepseek-reasoner">
782
+ <td class="rank mono sticky-0" data-label="#">#20</td>
783
  <td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-reasoner (Deepseek API)</td>
784
  <td class="num mono" data-label="Критичные/1000">
785
 
 
814
  <td class="num mono" data-label="Всего токенов">118,309</td>
815
  </tr>
816
 
817
+ <tr data-model="mistral/ministral-14b-2512">
818
+ <td class="rank mono sticky-0" data-label="#">#21</td>
819
+ <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-14B-Instruct-2512 (Mistral API)</td>
820
+ <td class="num mono" data-label="Критичные/1000">
821
+
822
+ 0.15 ± 0.01
823
+
824
+ </td>
825
+ <td class="num mono" data-label="Обычные/1000">
826
+
827
+ 0.67 ± 0.02
828
+
829
+ </td>
830
+ <td class="num mono" data-label="Доп./1000">
831
+
832
+ 0.22 ± 0.04
833
+
834
+ </td>
835
+ <td data-label="Нормировано ошибок">
836
+ <div class="score-cell">
837
+ <div class="progress-bar">
838
+
839
+
840
+
841
+ <div class="progress-fill" style="width: 72.75%"></div>
842
+ </div>
843
+ <span class="score-value">
844
+
845
+ 1.09 ± 0.03
846
+
847
+ </span>
848
+ </div>
849
+ </td>
850
+ <td class="num mono" data-label="Всего токенов">126,574</td>
851
+ </tr>
852
+
853
  <tr data-model="litellm_proxy/deepseek-v3">
854
+ <td class="rank mono sticky-0" data-label="#">#22</td>
855
  <td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
856
  <td class="num mono" data-label="Критичные/1000">
857
 
 
887
  </tr>
888
 
889
  <tr data-model="litellm_proxy/tmp-gemma-3n-e4b-it">
890
+ <td class="rank mono sticky-0" data-label="#">#23</td>
891
  <td class="model-name sticky-1" data-label="Модель">google/gemma-3n-E4B-it (AI Studio)</td>
892
  <td class="num mono" data-label="Критичные/1000">
893
 
 
922
  <td class="num mono" data-label="Всего токенов">99,646</td>
923
  </tr>
924
 
925
+ <tr data-model="mistral/ministral-8b-2512">
926
+ <td class="rank mono sticky-0" data-label="#">#24</td>
927
+ <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-8B-Instruct-2512 (Mistral API)</td>
928
+ <td class="num mono" data-label="Критичные/1000">
929
+
930
+ 0.13 ± 0.02
931
+
932
+ </td>
933
+ <td class="num mono" data-label="Обычные/1000">
934
+
935
+ 0.79 ± 0.02
936
+
937
+ </td>
938
+ <td class="num mono" data-label="Доп./1000">
939
+
940
+ 0.25 ± 0.01
941
+
942
+ </td>
943
+ <td data-label="Нормировано ошибок">
944
+ <div class="score-cell">
945
+ <div class="progress-bar">
946
+
947
+
948
+
949
+ <div class="progress-fill" style="width: 70.75%"></div>
950
+ </div>
951
+ <span class="score-value">
952
+
953
+ 1.17 ± 0.03
954
+
955
+ </span>
956
+ </div>
957
+ </td>
958
+ <td class="num mono" data-label="Всего токенов">133,214</td>
959
+ </tr>
960
+
961
  <tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
962
+ <td class="rank mono sticky-0" data-label="#">#25</td>
963
  <td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
964
  <td class="num mono" data-label="Критичные/1000">
965
 
 
995
  </tr>
996
 
997
  <tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
998
+ <td class="rank mono sticky-0" data-label="#">#26</td>
999
  <td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
1000
  <td class="num mono" data-label="Критичные/1000">
1001
 
 
1031
  </tr>
1032
 
1033
  <tr data-model="openai/Qwen/Qwen3-32B">
1034
+ <td class="rank mono sticky-0" data-label="#">#27</td>
1035
  <td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoining)</td>
1036
  <td class="num mono" data-label="Критичные/1000">
1037
 
 
1067
  </tr>
1068
 
1069
  <tr data-model="openai/t-tech/T-pro-it-2.0">
1070
+ <td class="rank mono sticky-0" data-label="#">#28</td>
1071
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
1072
  <td class="num mono" data-label="Критичные/1000">
1073
 
 
1103
  </tr>
1104
 
1105
  <tr data-model="openrouter/openrouter/polaris-alpha">
1106
+ <td class="rank mono sticky-0" data-label="#">#29</td>
1107
  <td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
1108
  <td class="num mono" data-label="Критичные/1000">
1109
 
 
1139
  </tr>
1140
 
1141
  <tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
1142
+ <td class="rank mono sticky-0" data-label="#">#30</td>
1143
  <td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
1144
  <td class="num mono" data-label="Критичные/1000">
1145
 
 
1175
  </tr>
1176
 
1177
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
1178
+ <td class="rank mono sticky-0" data-label="#">#31</td>
1179
  <td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
1180
  <td class="num mono" data-label="Критичные/1000">
1181
 
 
1211
  </tr>
1212
 
1213
  <tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
1214
+ <td class="rank mono sticky-0" data-label="#">#32</td>
1215
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
1216
  <td class="num mono" data-label="Критичные/1000">
1217
 
 
1247
  </tr>
1248
 
1249
  <tr data-model="openrouter/moonshotai/kimi-k2-0905">
1250
+ <td class="rank mono sticky-0" data-label="#">#33</td>
1251
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
1252
  <td class="num mono" data-label="Критичные/1000">
1253
 
 
1283
  </tr>
1284
 
1285
  <tr data-model="openrouter/z-ai/glm-4.6">
1286
+ <td class="rank mono sticky-0" data-label="#">#34</td>
1287
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
1288
  <td class="num mono" data-label="Критичные/1000">
1289
 
 
1319
  </tr>
1320
 
1321
  <tr data-model="openrouter/openai/gpt-5">
1322
+ <td class="rank mono sticky-0" data-label="#">#35</td>
1323
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
1324
  <td class="num mono" data-label="Критичные/1000">
1325
 
 
1355
  </tr>
1356
 
1357
  <tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
1358
+ <td class="rank mono sticky-0" data-label="#">#36</td>
1359
  <td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
1360
  <td class="num mono" data-label="Критичные/1000">
1361
 
 
1391
  </tr>
1392
 
1393
  <tr data-model="openrouter/openai/gpt-5">
1394
+ <td class="rank mono sticky-0" data-label="#">#37</td>
1395
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
1396
  <td class="num mono" data-label="Критичные/1000">
1397
 
 
1427
  </tr>
1428
 
1429
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
1430
+ <td class="rank mono sticky-0" data-label="#">#38</td>
1431
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
1432
  <td class="num mono" data-label="Критичные/1000">
1433
 
 
1463
  </tr>
1464
 
1465
  <tr data-model="openrouter/openai/gpt-oss-120b">
1466
+ <td class="rank mono sticky-0" data-label="#">#39</td>
1467
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
1468
  <td class="num mono" data-label="Критичные/1000">
1469
 
 
1499
  </tr>
1500
 
1501
  <tr data-model="openai/gpt-4.1">
1502
+ <td class="rank mono sticky-0" data-label="#">#40</td>
1503
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
1504
  <td class="num mono" data-label="Критичные/1000">
1505
 
 
1534
  <td class="num mono" data-label="Всего токенов">85,822</td>
1535
  </tr>
1536
 
1537
+ <tr data-model="mistral/ministral-3b-2512">
1538
+ <td class="rank mono sticky-0" data-label="#">#41</td>
1539
+ <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-3B-Instruct-2512 (Mistral API)</td>
1540
+ <td class="num mono" data-label="Критичные/1000">
1541
+
1542
+ 0.38 ± 0.03
1543
+
1544
+ </td>
1545
+ <td class="num mono" data-label="Обычные/1000">
1546
+
1547
+ 1.44 ± 0.01
1548
+
1549
+ </td>
1550
+ <td class="num mono" data-label="Доп./1000">
1551
+
1552
+ 0.64 ± 0.03
1553
+
1554
+ </td>
1555
+ <td data-label="Нормировано ошибок">
1556
+ <div class="score-cell">
1557
+ <div class="progress-bar">
1558
+
1559
+
1560
+
1561
+ <div class="progress-fill" style="width: 37.0%"></div>
1562
+ </div>
1563
+ <span class="score-value">
1564
+
1565
+ 2.52 ± 0.08
1566
+
1567
+ </span>
1568
+ </div>
1569
+ </td>
1570
+ <td class="num mono" data-label="Всего токенов">123,147</td>
1571
+ </tr>
1572
+
1573
  <tr data-model="openrouter/mistralai/mistral-nemo">
1574
+ <td class="rank mono sticky-0" data-label="#">#42</td>
1575
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
1576
  <td class="num mono" data-label="Критичные/1000">
1577
 
 
1607
  </tr>
1608
 
1609
  <tr data-model="openai/gpt-4.1-mini">
1610
+ <td class="rank mono sticky-0" data-label="#">#43</td>
1611
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
1612
  <td class="num mono" data-label="Критичные/1000">
1613
 
 
1643
  </tr>
1644
 
1645
  <tr data-model="openrouter/minimax/minimax-m2:free">
1646
+ <td class="rank mono sticky-0" data-label="#">#44</td>
1647
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
1648
  <td class="num mono" data-label="Критичные/1000">
1649
 
 
1679
  </tr>
1680
 
1681
  <tr data-model="openrouter/minimax/minimax-m2:free">
1682
+ <td class="rank mono sticky-0" data-label="#">#45</td>
1683
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
1684
  <td class="num mono" data-label="Критичные/1000">
1685
 
 
1715
  </tr>
1716
 
1717
  <tr data-model="openai/gpt-4.1-nano">
1718
+ <td class="rank mono sticky-0" data-label="#">#46</td>
1719
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
1720
  <td class="num mono" data-label="Критичные/1000">
1721
 
 
1751
  </tr>
1752
 
1753
  <tr data-model="openrouter/openai/gpt-oss-20b">
1754
+ <td class="rank mono sticky-0" data-label="#">#47</td>
1755
  <td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
1756
  <td class="num mono" data-label="Критичные/1000">
1757
 
 
1809
  </div>
1810
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
1811
  <p class="info-text">
1812
+ Обновлено: 2025-12-02 22:09:04 | Всего моделей: 47 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
1813
  </p>
1814
  </div>
1815
  <script>