Spaces:
Running
Running
add google/gemma-3n-E4B-it (AI Studio)
Browse files- index.html +53 -17
index.html
CHANGED
|
@@ -670,8 +670,44 @@
|
|
| 670 |
<td class="num mono" data-label="Всего токенов">135,889</td>
|
| 671 |
</tr>
|
| 672 |
|
| 673 |
-
<tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
|
| 674 |
<td class="rank mono sticky-0" data-label="#">#17</td>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 675 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
|
| 676 |
<td class="num mono" data-label="Критичные/1000">
|
| 677 |
|
|
@@ -707,7 +743,7 @@
|
|
| 707 |
</tr>
|
| 708 |
|
| 709 |
<tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
|
| 710 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 711 |
<td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
|
| 712 |
<td class="num mono" data-label="Критичные/1000">
|
| 713 |
|
|
@@ -743,7 +779,7 @@
|
|
| 743 |
</tr>
|
| 744 |
|
| 745 |
<tr data-model="openai/Qwen/Qwen3-32B">
|
| 746 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 747 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoning)</td>
|
| 748 |
<td class="num mono" data-label="Критичные/1000">
|
| 749 |
|
|
@@ -779,7 +815,7 @@
|
|
| 779 |
</tr>
|
| 780 |
|
| 781 |
<tr data-model="openai/t-tech/T-pro-it-2.0">
|
| 782 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 783 |
<td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
|
| 784 |
<td class="num mono" data-label="Критичные/1000">
|
| 785 |
|
|
@@ -815,7 +851,7 @@
|
|
| 815 |
</tr>
|
| 816 |
|
| 817 |
<tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
|
| 818 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 819 |
<td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
|
| 820 |
<td class="num mono" data-label="Критичные/1000">
|
| 821 |
|
|
@@ -851,7 +887,7 @@
|
|
| 851 |
</tr>
|
| 852 |
|
| 853 |
<tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
|
| 854 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 855 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
|
| 856 |
<td class="num mono" data-label="Критичные/1000">
|
| 857 |
|
|
@@ -887,7 +923,7 @@
|
|
| 887 |
</tr>
|
| 888 |
|
| 889 |
<tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
|
| 890 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 891 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
|
| 892 |
<td class="num mono" data-label="Критичные/1000">
|
| 893 |
|
|
@@ -923,7 +959,7 @@
|
|
| 923 |
</tr>
|
| 924 |
|
| 925 |
<tr data-model="openrouter/moonshotai/kimi-k2-0905">
|
| 926 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 927 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
|
| 928 |
<td class="num mono" data-label="Критичные/1000">
|
| 929 |
|
|
@@ -959,7 +995,7 @@
|
|
| 959 |
</tr>
|
| 960 |
|
| 961 |
<tr data-model="openrouter/z-ai/glm-4.6">
|
| 962 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 963 |
<td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
|
| 964 |
<td class="num mono" data-label="Критичные/1000">
|
| 965 |
|
|
@@ -995,7 +1031,7 @@
|
|
| 995 |
</tr>
|
| 996 |
|
| 997 |
<tr data-model="openrouter/openai/gpt-5">
|
| 998 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 999 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
|
| 1000 |
<td class="num mono" data-label="Критичные/1000">
|
| 1001 |
|
|
@@ -1031,7 +1067,7 @@
|
|
| 1031 |
</tr>
|
| 1032 |
|
| 1033 |
<tr data-model="openrouter/openai/gpt-5">
|
| 1034 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1035 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
|
| 1036 |
<td class="num mono" data-label="Критичные/1000">
|
| 1037 |
|
|
@@ -1067,7 +1103,7 @@
|
|
| 1067 |
</tr>
|
| 1068 |
|
| 1069 |
<tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
|
| 1070 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1071 |
<td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
|
| 1072 |
<td class="num mono" data-label="Критичные/1000">
|
| 1073 |
|
|
@@ -1103,7 +1139,7 @@
|
|
| 1103 |
</tr>
|
| 1104 |
|
| 1105 |
<tr data-model="openrouter/openai/gpt-oss-120b">
|
| 1106 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1107 |
<td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
|
| 1108 |
<td class="num mono" data-label="Критичные/1000">
|
| 1109 |
|
|
@@ -1139,7 +1175,7 @@
|
|
| 1139 |
</tr>
|
| 1140 |
|
| 1141 |
<tr data-model="openrouter/mistralai/mistral-nemo">
|
| 1142 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1143 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
|
| 1144 |
<td class="num mono" data-label="Критичные/1000">
|
| 1145 |
|
|
@@ -1175,7 +1211,7 @@
|
|
| 1175 |
</tr>
|
| 1176 |
|
| 1177 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1178 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1179 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
|
| 1180 |
<td class="num mono" data-label="Критичные/1000">
|
| 1181 |
|
|
@@ -1211,7 +1247,7 @@
|
|
| 1211 |
</tr>
|
| 1212 |
|
| 1213 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1214 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1215 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommended params)</td>
|
| 1216 |
<td class="num mono" data-label="Критичные/1000">
|
| 1217 |
|
|
@@ -1269,7 +1305,7 @@
|
|
| 1269 |
</div>
|
| 1270 |
<p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
|
| 1271 |
<p class="info-text">
|
| 1272 |
-
Обновлено: 2025-10-
|
| 1273 |
</p>
|
| 1274 |
</div>
|
| 1275 |
<script>
|
|
|
|
| 670 |
<td class="num mono" data-label="Всего токенов">135,889</td>
|
| 671 |
</tr>
|
| 672 |
|
| 673 |
+
<tr data-model="litellm_proxy/tmp-gemma-3n-e4b-it">
|
| 674 |
<td class="rank mono sticky-0" data-label="#">#17</td>
|
| 675 |
+
<td class="model-name sticky-1" data-label="Модель">google/gemma-3n-E4B-it (AI Studio)</td>
|
| 676 |
+
<td class="num mono" data-label="Критичные/1000">
|
| 677 |
+
|
| 678 |
+
0.18 ± 0.01
|
| 679 |
+
|
| 680 |
+
</td>
|
| 681 |
+
<td class="num mono" data-label="Обычные/1000">
|
| 682 |
+
|
| 683 |
+
0.50 ± 0.02
|
| 684 |
+
|
| 685 |
+
</td>
|
| 686 |
+
<td class="num mono" data-label="Доп./1000">
|
| 687 |
+
|
| 688 |
+
0.48 ± 0.07
|
| 689 |
+
|
| 690 |
+
</td>
|
| 691 |
+
<td data-label="Нормировано ошибок">
|
| 692 |
+
<div class="score-cell">
|
| 693 |
+
<div class="progress-bar">
|
| 694 |
+
|
| 695 |
+
|
| 696 |
+
|
| 697 |
+
<div class="progress-fill" style="width: 74.30555555555556%"></div>
|
| 698 |
+
</div>
|
| 699 |
+
<span class="score-value">
|
| 700 |
+
|
| 701 |
+
1.11
|
| 702 |
+
|
| 703 |
+
</span>
|
| 704 |
+
</div>
|
| 705 |
+
</td>
|
| 706 |
+
<td class="num mono" data-label="Всего токенов">99,646</td>
|
| 707 |
+
</tr>
|
| 708 |
+
|
| 709 |
+
<tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
|
| 710 |
+
<td class="rank mono sticky-0" data-label="#">#18</td>
|
| 711 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
|
| 712 |
<td class="num mono" data-label="Критичные/1000">
|
| 713 |
|
|
|
|
| 743 |
</tr>
|
| 744 |
|
| 745 |
<tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
|
| 746 |
+
<td class="rank mono sticky-0" data-label="#">#19</td>
|
| 747 |
<td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
|
| 748 |
<td class="num mono" data-label="Критичные/1000">
|
| 749 |
|
|
|
|
| 779 |
</tr>
|
| 780 |
|
| 781 |
<tr data-model="openai/Qwen/Qwen3-32B">
|
| 782 |
+
<td class="rank mono sticky-0" data-label="#">#20</td>
|
| 783 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoning)</td>
|
| 784 |
<td class="num mono" data-label="Критичные/1000">
|
| 785 |
|
|
|
|
| 815 |
</tr>
|
| 816 |
|
| 817 |
<tr data-model="openai/t-tech/T-pro-it-2.0">
|
| 818 |
+
<td class="rank mono sticky-0" data-label="#">#21</td>
|
| 819 |
<td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
|
| 820 |
<td class="num mono" data-label="Критичные/1000">
|
| 821 |
|
|
|
|
| 851 |
</tr>
|
| 852 |
|
| 853 |
<tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
|
| 854 |
+
<td class="rank mono sticky-0" data-label="#">#22</td>
|
| 855 |
<td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
|
| 856 |
<td class="num mono" data-label="Критичные/1000">
|
| 857 |
|
|
|
|
| 887 |
</tr>
|
| 888 |
|
| 889 |
<tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
|
| 890 |
+
<td class="rank mono sticky-0" data-label="#">#23</td>
|
| 891 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
|
| 892 |
<td class="num mono" data-label="Критичные/1000">
|
| 893 |
|
|
|
|
| 923 |
</tr>
|
| 924 |
|
| 925 |
<tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
|
| 926 |
+
<td class="rank mono sticky-0" data-label="#">#24</td>
|
| 927 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
|
| 928 |
<td class="num mono" data-label="Критичные/1000">
|
| 929 |
|
|
|
|
| 959 |
</tr>
|
| 960 |
|
| 961 |
<tr data-model="openrouter/moonshotai/kimi-k2-0905">
|
| 962 |
+
<td class="rank mono sticky-0" data-label="#">#25</td>
|
| 963 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
|
| 964 |
<td class="num mono" data-label="Критичные/1000">
|
| 965 |
|
|
|
|
| 995 |
</tr>
|
| 996 |
|
| 997 |
<tr data-model="openrouter/z-ai/glm-4.6">
|
| 998 |
+
<td class="rank mono sticky-0" data-label="#">#26</td>
|
| 999 |
<td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
|
| 1000 |
<td class="num mono" data-label="Критичные/1000">
|
| 1001 |
|
|
|
|
| 1031 |
</tr>
|
| 1032 |
|
| 1033 |
<tr data-model="openrouter/openai/gpt-5">
|
| 1034 |
+
<td class="rank mono sticky-0" data-label="#">#27</td>
|
| 1035 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
|
| 1036 |
<td class="num mono" data-label="Критичные/1000">
|
| 1037 |
|
|
|
|
| 1067 |
</tr>
|
| 1068 |
|
| 1069 |
<tr data-model="openrouter/openai/gpt-5">
|
| 1070 |
+
<td class="rank mono sticky-0" data-label="#">#28</td>
|
| 1071 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
|
| 1072 |
<td class="num mono" data-label="Критичные/1000">
|
| 1073 |
|
|
|
|
| 1103 |
</tr>
|
| 1104 |
|
| 1105 |
<tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
|
| 1106 |
+
<td class="rank mono sticky-0" data-label="#">#29</td>
|
| 1107 |
<td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
|
| 1108 |
<td class="num mono" data-label="Критичные/1000">
|
| 1109 |
|
|
|
|
| 1139 |
</tr>
|
| 1140 |
|
| 1141 |
<tr data-model="openrouter/openai/gpt-oss-120b">
|
| 1142 |
+
<td class="rank mono sticky-0" data-label="#">#30</td>
|
| 1143 |
<td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
|
| 1144 |
<td class="num mono" data-label="Критичные/1000">
|
| 1145 |
|
|
|
|
| 1175 |
</tr>
|
| 1176 |
|
| 1177 |
<tr data-model="openrouter/mistralai/mistral-nemo">
|
| 1178 |
+
<td class="rank mono sticky-0" data-label="#">#31</td>
|
| 1179 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
|
| 1180 |
<td class="num mono" data-label="Критичные/1000">
|
| 1181 |
|
|
|
|
| 1211 |
</tr>
|
| 1212 |
|
| 1213 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1214 |
+
<td class="rank mono sticky-0" data-label="#">#32</td>
|
| 1215 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
|
| 1216 |
<td class="num mono" data-label="Критичные/1000">
|
| 1217 |
|
|
|
|
| 1247 |
</tr>
|
| 1248 |
|
| 1249 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1250 |
+
<td class="rank mono sticky-0" data-label="#">#33</td>
|
| 1251 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommended params)</td>
|
| 1252 |
<td class="num mono" data-label="Критичные/1000">
|
| 1253 |
|
|
|
|
| 1305 |
</div>
|
| 1306 |
<p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
|
| 1307 |
<p class="info-text">
|
| 1308 |
+
Обновлено: 2025-10-30 11:50:26 | Всего моделей: 33 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
|
| 1309 |
</p>
|
| 1310 |
</div>
|
| 1311 |
<script>
|