Spaces:
Running
Running
add AvitoTech/avibe
Browse files- index.html +55 -19
index.html
CHANGED
|
@@ -526,8 +526,44 @@
|
|
| 526 |
<td class="num mono" data-label="Всего токенов">147,626</td>
|
| 527 |
</tr>
|
| 528 |
|
| 529 |
-
<tr data-model="openai/
|
| 530 |
<td class="rank mono sticky-0" data-label="#">#13</td>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 531 |
<td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
|
| 532 |
<td class="num mono" data-label="Критичные/1000">
|
| 533 |
|
|
@@ -563,7 +599,7 @@
|
|
| 563 |
</tr>
|
| 564 |
|
| 565 |
<tr data-model="litellm_proxy/deepseek-v3">
|
| 566 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 567 |
<td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
|
| 568 |
<td class="num mono" data-label="Критичные/1000">
|
| 569 |
|
|
@@ -599,7 +635,7 @@
|
|
| 599 |
</tr>
|
| 600 |
|
| 601 |
<tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
|
| 602 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 603 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
|
| 604 |
<td class="num mono" data-label="Критичные/1000">
|
| 605 |
|
|
@@ -635,7 +671,7 @@
|
|
| 635 |
</tr>
|
| 636 |
|
| 637 |
<tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
|
| 638 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 639 |
<td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
|
| 640 |
<td class="num mono" data-label="Критичные/1000">
|
| 641 |
|
|
@@ -671,7 +707,7 @@
|
|
| 671 |
</tr>
|
| 672 |
|
| 673 |
<tr data-model="openai/Qwen/Qwen3-32B">
|
| 674 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 675 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoining)</td>
|
| 676 |
<td class="num mono" data-label="Критичные/1000">
|
| 677 |
|
|
@@ -707,7 +743,7 @@
|
|
| 707 |
</tr>
|
| 708 |
|
| 709 |
<tr data-model="openai/t-tech/T-pro-it-2.0">
|
| 710 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 711 |
<td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
|
| 712 |
<td class="num mono" data-label="Критичные/1000">
|
| 713 |
|
|
@@ -743,7 +779,7 @@
|
|
| 743 |
</tr>
|
| 744 |
|
| 745 |
<tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
|
| 746 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 747 |
<td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
|
| 748 |
<td class="num mono" data-label="Критичные/1000">
|
| 749 |
|
|
@@ -779,7 +815,7 @@
|
|
| 779 |
</tr>
|
| 780 |
|
| 781 |
<tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
|
| 782 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 783 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
|
| 784 |
<td class="num mono" data-label="Критичные/1000">
|
| 785 |
|
|
@@ -815,7 +851,7 @@
|
|
| 815 |
</tr>
|
| 816 |
|
| 817 |
<tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
|
| 818 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 819 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
|
| 820 |
<td class="num mono" data-label="Критичные/1000">
|
| 821 |
|
|
@@ -851,7 +887,7 @@
|
|
| 851 |
</tr>
|
| 852 |
|
| 853 |
<tr data-model="openrouter/moonshotai/kimi-k2-0905">
|
| 854 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 855 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
|
| 856 |
<td class="num mono" data-label="Критичные/1000">
|
| 857 |
|
|
@@ -887,7 +923,7 @@
|
|
| 887 |
</tr>
|
| 888 |
|
| 889 |
<tr data-model="openrouter/z-ai/glm-4.6">
|
| 890 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 891 |
<td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
|
| 892 |
<td class="num mono" data-label="Критичные/1000">
|
| 893 |
|
|
@@ -923,7 +959,7 @@
|
|
| 923 |
</tr>
|
| 924 |
|
| 925 |
<tr data-model="openrouter/openai/gpt-5">
|
| 926 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 927 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
|
| 928 |
<td class="num mono" data-label="Критичные/1000">
|
| 929 |
|
|
@@ -959,7 +995,7 @@
|
|
| 959 |
</tr>
|
| 960 |
|
| 961 |
<tr data-model="openrouter/openai/gpt-5">
|
| 962 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 963 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
|
| 964 |
<td class="num mono" data-label="Критичные/1000">
|
| 965 |
|
|
@@ -995,7 +1031,7 @@
|
|
| 995 |
</tr>
|
| 996 |
|
| 997 |
<tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
|
| 998 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 999 |
<td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
|
| 1000 |
<td class="num mono" data-label="Критичные/1000">
|
| 1001 |
|
|
@@ -1031,7 +1067,7 @@
|
|
| 1031 |
</tr>
|
| 1032 |
|
| 1033 |
<tr data-model="openrouter/openai/gpt-oss-120b">
|
| 1034 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1035 |
<td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
|
| 1036 |
<td class="num mono" data-label="Критичные/1000">
|
| 1037 |
|
|
@@ -1067,7 +1103,7 @@
|
|
| 1067 |
</tr>
|
| 1068 |
|
| 1069 |
<tr data-model="openrouter/mistralai/mistral-nemo">
|
| 1070 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1071 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
|
| 1072 |
<td class="num mono" data-label="Критичные/1000">
|
| 1073 |
|
|
@@ -1103,7 +1139,7 @@
|
|
| 1103 |
</tr>
|
| 1104 |
|
| 1105 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1106 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1107 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
|
| 1108 |
<td class="num mono" data-label="Критичные/1000">
|
| 1109 |
|
|
@@ -1139,7 +1175,7 @@
|
|
| 1139 |
</tr>
|
| 1140 |
|
| 1141 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1142 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1143 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
|
| 1144 |
<td class="num mono" data-label="Критичные/1000">
|
| 1145 |
|
|
@@ -1197,7 +1233,7 @@
|
|
| 1197 |
</div>
|
| 1198 |
<p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
|
| 1199 |
<p class="info-text">
|
| 1200 |
-
Обновлено: 2025-10-
|
| 1201 |
</p>
|
| 1202 |
</div>
|
| 1203 |
<script>
|
|
|
|
| 526 |
<td class="num mono" data-label="Всего токенов">147,626</td>
|
| 527 |
</tr>
|
| 528 |
|
| 529 |
+
<tr data-model="openai/AvitoTech/avibe">
|
| 530 |
<td class="rank mono sticky-0" data-label="#">#13</td>
|
| 531 |
+
<td class="model-name sticky-1" data-label="Модель">AvitoTech/avibe</td>
|
| 532 |
+
<td class="num mono" data-label="Критичные/1000">
|
| 533 |
+
|
| 534 |
+
0.06
|
| 535 |
+
|
| 536 |
+
</td>
|
| 537 |
+
<td class="num mono" data-label="Обычные/1000">
|
| 538 |
+
|
| 539 |
+
0.65 ± 0.04
|
| 540 |
+
|
| 541 |
+
</td>
|
| 542 |
+
<td class="num mono" data-label="Доп./1000">
|
| 543 |
+
|
| 544 |
+
0.44 ± 0.05
|
| 545 |
+
|
| 546 |
+
</td>
|
| 547 |
+
<td data-label="Нормировано ошибок">
|
| 548 |
+
<div class="score-cell">
|
| 549 |
+
<div class="progress-bar">
|
| 550 |
+
|
| 551 |
+
|
| 552 |
+
|
| 553 |
+
<div class="progress-fill" style="width: 77.08333333333334%"></div>
|
| 554 |
+
</div>
|
| 555 |
+
<span class="score-value">
|
| 556 |
+
|
| 557 |
+
0.99 ± 0.06
|
| 558 |
+
|
| 559 |
+
</span>
|
| 560 |
+
</div>
|
| 561 |
+
</td>
|
| 562 |
+
<td class="num mono" data-label="Всего токенов">88,360</td>
|
| 563 |
+
</tr>
|
| 564 |
+
|
| 565 |
+
<tr data-model="openai/ai-sage/GigaChat-20B-A3B-instruct-v1.5-bf16">
|
| 566 |
+
<td class="rank mono sticky-0" data-label="#">#14</td>
|
| 567 |
<td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
|
| 568 |
<td class="num mono" data-label="Критичные/1000">
|
| 569 |
|
|
|
|
| 599 |
</tr>
|
| 600 |
|
| 601 |
<tr data-model="litellm_proxy/deepseek-v3">
|
| 602 |
+
<td class="rank mono sticky-0" data-label="#">#15</td>
|
| 603 |
<td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
|
| 604 |
<td class="num mono" data-label="Критичные/1000">
|
| 605 |
|
|
|
|
| 635 |
</tr>
|
| 636 |
|
| 637 |
<tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
|
| 638 |
+
<td class="rank mono sticky-0" data-label="#">#16</td>
|
| 639 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
|
| 640 |
<td class="num mono" data-label="Критичные/1000">
|
| 641 |
|
|
|
|
| 671 |
</tr>
|
| 672 |
|
| 673 |
<tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
|
| 674 |
+
<td class="rank mono sticky-0" data-label="#">#17</td>
|
| 675 |
<td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
|
| 676 |
<td class="num mono" data-label="Критичные/1000">
|
| 677 |
|
|
|
|
| 707 |
</tr>
|
| 708 |
|
| 709 |
<tr data-model="openai/Qwen/Qwen3-32B">
|
| 710 |
+
<td class="rank mono sticky-0" data-label="#">#18</td>
|
| 711 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoining)</td>
|
| 712 |
<td class="num mono" data-label="Критичные/1000">
|
| 713 |
|
|
|
|
| 743 |
</tr>
|
| 744 |
|
| 745 |
<tr data-model="openai/t-tech/T-pro-it-2.0">
|
| 746 |
+
<td class="rank mono sticky-0" data-label="#">#19</td>
|
| 747 |
<td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
|
| 748 |
<td class="num mono" data-label="Критичные/1000">
|
| 749 |
|
|
|
|
| 779 |
</tr>
|
| 780 |
|
| 781 |
<tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
|
| 782 |
+
<td class="rank mono sticky-0" data-label="#">#20</td>
|
| 783 |
<td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
|
| 784 |
<td class="num mono" data-label="Критичные/1000">
|
| 785 |
|
|
|
|
| 815 |
</tr>
|
| 816 |
|
| 817 |
<tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
|
| 818 |
+
<td class="rank mono sticky-0" data-label="#">#21</td>
|
| 819 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
|
| 820 |
<td class="num mono" data-label="Критичные/1000">
|
| 821 |
|
|
|
|
| 851 |
</tr>
|
| 852 |
|
| 853 |
<tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
|
| 854 |
+
<td class="rank mono sticky-0" data-label="#">#22</td>
|
| 855 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
|
| 856 |
<td class="num mono" data-label="Критичные/1000">
|
| 857 |
|
|
|
|
| 887 |
</tr>
|
| 888 |
|
| 889 |
<tr data-model="openrouter/moonshotai/kimi-k2-0905">
|
| 890 |
+
<td class="rank mono sticky-0" data-label="#">#23</td>
|
| 891 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
|
| 892 |
<td class="num mono" data-label="Критичные/1000">
|
| 893 |
|
|
|
|
| 923 |
</tr>
|
| 924 |
|
| 925 |
<tr data-model="openrouter/z-ai/glm-4.6">
|
| 926 |
+
<td class="rank mono sticky-0" data-label="#">#24</td>
|
| 927 |
<td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
|
| 928 |
<td class="num mono" data-label="Критичные/1000">
|
| 929 |
|
|
|
|
| 959 |
</tr>
|
| 960 |
|
| 961 |
<tr data-model="openrouter/openai/gpt-5">
|
| 962 |
+
<td class="rank mono sticky-0" data-label="#">#25</td>
|
| 963 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
|
| 964 |
<td class="num mono" data-label="Критичные/1000">
|
| 965 |
|
|
|
|
| 995 |
</tr>
|
| 996 |
|
| 997 |
<tr data-model="openrouter/openai/gpt-5">
|
| 998 |
+
<td class="rank mono sticky-0" data-label="#">#26</td>
|
| 999 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
|
| 1000 |
<td class="num mono" data-label="Критичные/1000">
|
| 1001 |
|
|
|
|
| 1031 |
</tr>
|
| 1032 |
|
| 1033 |
<tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
|
| 1034 |
+
<td class="rank mono sticky-0" data-label="#">#27</td>
|
| 1035 |
<td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
|
| 1036 |
<td class="num mono" data-label="Критичные/1000">
|
| 1037 |
|
|
|
|
| 1067 |
</tr>
|
| 1068 |
|
| 1069 |
<tr data-model="openrouter/openai/gpt-oss-120b">
|
| 1070 |
+
<td class="rank mono sticky-0" data-label="#">#28</td>
|
| 1071 |
<td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
|
| 1072 |
<td class="num mono" data-label="Критичные/1000">
|
| 1073 |
|
|
|
|
| 1103 |
</tr>
|
| 1104 |
|
| 1105 |
<tr data-model="openrouter/mistralai/mistral-nemo">
|
| 1106 |
+
<td class="rank mono sticky-0" data-label="#">#29</td>
|
| 1107 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
|
| 1108 |
<td class="num mono" data-label="Критичные/1000">
|
| 1109 |
|
|
|
|
| 1139 |
</tr>
|
| 1140 |
|
| 1141 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1142 |
+
<td class="rank mono sticky-0" data-label="#">#30</td>
|
| 1143 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
|
| 1144 |
<td class="num mono" data-label="Критичные/1000">
|
| 1145 |
|
|
|
|
| 1175 |
</tr>
|
| 1176 |
|
| 1177 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1178 |
+
<td class="rank mono sticky-0" data-label="#">#31</td>
|
| 1179 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
|
| 1180 |
<td class="num mono" data-label="Критичные/1000">
|
| 1181 |
|
|
|
|
| 1233 |
</div>
|
| 1234 |
<p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
|
| 1235 |
<p class="info-text">
|
| 1236 |
+
Обновлено: 2025-10-28 09:19:30 | Всего моделей: 31 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
|
| 1237 |
</p>
|
| 1238 |
</div>
|
| 1239 |
<script>
|