Spaces:
Running
Running
add Qwen3-VL-8B-Instruct
Browse files- index.html +44 -8
index.html
CHANGED
|
@@ -706,8 +706,44 @@
|
|
| 706 |
<td class="num mono" data-label="Всего токенов">137,855</td>
|
| 707 |
</tr>
|
| 708 |
|
| 709 |
-
<tr data-model="openrouter/moonshotai/kimi-k2-0905">
|
| 710 |
<td class="rank mono sticky-0" data-label="#">#18</td>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 711 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
|
| 712 |
<td class="num mono" data-label="Критичные/1000">
|
| 713 |
|
|
@@ -743,7 +779,7 @@
|
|
| 743 |
</tr>
|
| 744 |
|
| 745 |
<tr data-model="openrouter/z-ai/glm-4.6">
|
| 746 |
-
<td class="rank mono sticky-0" data-label="#">#19</td>
|
| 747 |
<td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
|
| 748 |
<td class="num mono" data-label="Критичные/1000">
|
| 749 |
|
|
@@ -779,7 +815,7 @@
|
|
| 779 |
</tr>
|
| 780 |
|
| 781 |
<tr data-model="openrouter/openai/gpt-5">
|
| 782 |
-
<td class="rank mono sticky-0" data-label="#">#20</td>
|
| 783 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
|
| 784 |
<td class="num mono" data-label="Критичные/1000">
|
| 785 |
|
|
@@ -815,7 +851,7 @@
|
|
| 815 |
</tr>
|
| 816 |
|
| 817 |
<tr data-model="openrouter/openai/gpt-5">
|
| 818 |
-
<td class="rank mono sticky-0" data-label="#">#21</td>
|
| 819 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
|
| 820 |
<td class="num mono" data-label="Критичные/1000">
|
| 821 |
|
|
@@ -851,7 +887,7 @@
|
|
| 851 |
</tr>
|
| 852 |
|
| 853 |
<tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
|
| 854 |
-
<td class="rank mono sticky-0" data-label="#">#22</td>
|
| 855 |
<td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
|
| 856 |
<td class="num mono" data-label="Критичные/1000">
|
| 857 |
|
|
@@ -887,7 +923,7 @@
|
|
| 887 |
</tr>
|
| 888 |
|
| 889 |
<tr data-model="openrouter/openai/gpt-oss-120b">
|
| 890 |
-
<td class="rank mono sticky-0" data-label="#">#23</td>
|
| 891 |
<td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
|
| 892 |
<td class="num mono" data-label="Критичные/1000">
|
| 893 |
|
|
@@ -923,7 +959,7 @@
|
|
| 923 |
</tr>
|
| 924 |
|
| 925 |
<tr data-model="openrouter/mistralai/mistral-nemo">
|
| 926 |
-
<td class="rank mono sticky-0" data-label="#">#24</td>
|
| 927 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
|
| 928 |
<td class="num mono" data-label="Критичные/1000">
|
| 929 |
|
|
@@ -981,7 +1017,7 @@
|
|
| 981 |
</div>
|
| 982 |
<p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
|
| 983 |
<p class="info-text">
|
| 984 |
-
Обновлено: 2025-10-
|
| 985 |
</p>
|
| 986 |
</div>
|
| 987 |
<script>
|
|
|
|
| 706 |
<td class="num mono" data-label="Всего токенов">137,855</td>
|
| 707 |
</tr>
|
| 708 |
|
| 709 |
+
<tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
|
| 710 |
<td class="rank mono sticky-0" data-label="#">#18</td>
|
| 711 |
+
<td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
|
| 712 |
+
<td class="num mono" data-label="Критичные/1000">
|
| 713 |
+
|
| 714 |
+
0.24 ± 0.03
|
| 715 |
+
|
| 716 |
+
</td>
|
| 717 |
+
<td class="num mono" data-label="Обычные/1000">
|
| 718 |
+
|
| 719 |
+
1.02 ± 0.05
|
| 720 |
+
|
| 721 |
+
</td>
|
| 722 |
+
<td class="num mono" data-label="Доп./1000">
|
| 723 |
+
|
| 724 |
+
0.32 ± 0.01
|
| 725 |
+
|
| 726 |
+
</td>
|
| 727 |
+
<td data-label="Нормировано ошибок">
|
| 728 |
+
<div class="score-cell">
|
| 729 |
+
<div class="progress-bar">
|
| 730 |
+
|
| 731 |
+
|
| 732 |
+
|
| 733 |
+
<div class="progress-fill" style="width: 40.07220216606498%"></div>
|
| 734 |
+
</div>
|
| 735 |
+
<span class="score-value">
|
| 736 |
+
|
| 737 |
+
1.66 ± 0.11
|
| 738 |
+
|
| 739 |
+
</span>
|
| 740 |
+
</div>
|
| 741 |
+
</td>
|
| 742 |
+
<td class="num mono" data-label="Всего токенов">165,307</td>
|
| 743 |
+
</tr>
|
| 744 |
+
|
| 745 |
+
<tr data-model="openrouter/moonshotai/kimi-k2-0905">
|
| 746 |
+
<td class="rank mono sticky-0" data-label="#">#19</td>
|
| 747 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
|
| 748 |
<td class="num mono" data-label="Критичные/1000">
|
| 749 |
|
|
|
|
| 779 |
</tr>
|
| 780 |
|
| 781 |
<tr data-model="openrouter/z-ai/glm-4.6">
|
| 782 |
+
<td class="rank mono sticky-0" data-label="#">#20</td>
|
| 783 |
<td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
|
| 784 |
<td class="num mono" data-label="Критичные/1000">
|
| 785 |
|
|
|
|
| 815 |
</tr>
|
| 816 |
|
| 817 |
<tr data-model="openrouter/openai/gpt-5">
|
| 818 |
+
<td class="rank mono sticky-0" data-label="#">#21</td>
|
| 819 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
|
| 820 |
<td class="num mono" data-label="Критичные/1000">
|
| 821 |
|
|
|
|
| 851 |
</tr>
|
| 852 |
|
| 853 |
<tr data-model="openrouter/openai/gpt-5">
|
| 854 |
+
<td class="rank mono sticky-0" data-label="#">#22</td>
|
| 855 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
|
| 856 |
<td class="num mono" data-label="Критичные/1000">
|
| 857 |
|
|
|
|
| 887 |
</tr>
|
| 888 |
|
| 889 |
<tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
|
| 890 |
+
<td class="rank mono sticky-0" data-label="#">#23</td>
|
| 891 |
<td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
|
| 892 |
<td class="num mono" data-label="Критичные/1000">
|
| 893 |
|
|
|
|
| 923 |
</tr>
|
| 924 |
|
| 925 |
<tr data-model="openrouter/openai/gpt-oss-120b">
|
| 926 |
+
<td class="rank mono sticky-0" data-label="#">#24</td>
|
| 927 |
<td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
|
| 928 |
<td class="num mono" data-label="Критичные/1000">
|
| 929 |
|
|
|
|
| 959 |
</tr>
|
| 960 |
|
| 961 |
<tr data-model="openrouter/mistralai/mistral-nemo">
|
| 962 |
+
<td class="rank mono sticky-0" data-label="#">#25</td>
|
| 963 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
|
| 964 |
<td class="num mono" data-label="Критичные/1000">
|
| 965 |
|
|
|
|
| 1017 |
</div>
|
| 1018 |
<p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
|
| 1019 |
<p class="info-text">
|
| 1020 |
+
Обновлено: 2025-10-24 14:31:35 | Всего моделей: 25 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
|
| 1021 |
</p>
|
| 1022 |
</div>
|
| 1023 |
<script>
|